| 
									
										
										
										
											2021-12-16 13:01:44 +01:00
										 |  |  | % Generated by roxygen2: do not edit by hand | 
					
						
							| 
									
										
										
										
											2022-01-26 09:58:33 +01:00
										 |  |  | % Please edit documentation in R/method_clustering.R | 
					
						
							| 
									
										
										
										
											2021-12-16 13:01:44 +01:00
										 |  |  | \name{clusteriness} | 
					
						
							|  |  |  | \alias{clusteriness} | 
					
						
							|  |  |  | \title{Perform a cluster analysis.} | 
					
						
							|  |  |  | \usage{ | 
					
						
							| 
									
										
										
										
											2022-06-22 11:05:51 +02:00
										 |  |  | clusteriness( | 
					
						
							|  |  |  |   data, | 
					
						
							|  |  |  |   span = 1e+05, | 
					
						
							|  |  |  |   weight = 0.7, | 
					
						
							|  |  |  |   n_clusters = NULL, | 
					
						
							|  |  |  |   relation = NULL | 
					
						
							|  |  |  | ) | 
					
						
							| 
									
										
										
										
											2021-12-16 13:01:44 +01:00
										 |  |  | } | 
					
						
							|  |  |  | \arguments{ | 
					
						
							|  |  |  | \item{data}{The values that should be scored.} | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | \item{span}{The maximum span of values considered to be in one cluster.} | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | \item{weight}{The weight that will be given to the next largest cluster in | 
					
						
							|  |  |  | relation to the previous one. For example, if \code{weight} is 0.7 (the | 
					
						
							|  |  |  | default), the first cluster will weigh 1.0, the second 0.7, the third 0.49 | 
					
						
							|  |  |  | etc.} | 
					
						
							| 
									
										
										
										
											2022-06-16 19:45:59 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  | \item{n_clusters}{Maximum number of clusters that should be taken into | 
					
						
							|  |  |  | account. By default, all clusters will be regarded.} | 
					
						
							| 
									
										
										
										
											2022-06-22 11:05:51 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  | \item{relation}{Number of items that the cluster size should be based on. | 
					
						
							|  |  |  | This should always at least the length of the data. By default, the length | 
					
						
							|  |  |  | of the data is used.} | 
					
						
							| 
									
										
										
										
											2022-06-16 19:45:59 +02:00
										 |  |  | } | 
					
						
							|  |  |  | \value{ | 
					
						
							|  |  |  | A score between 0.0 and 1.0 summarizing how much the data clusters. | 
					
						
							| 
									
										
										
										
											2021-12-16 13:01:44 +01:00
										 |  |  | } | 
					
						
							|  |  |  | \description{ | 
					
						
							|  |  |  | This function will cluster the data using \code{\link[stats:hclust]{stats::hclust()}} and | 
					
						
							|  |  |  | \code{\link[stats:cutree]{stats::cutree()}}. Every cluster with at least two members qualifies for | 
					
						
							|  |  |  | further analysis. Clusters are then ranked based on their size in relation | 
					
						
							|  |  |  | to the total number of values. The return value is a final score between | 
					
						
							|  |  |  | 0.0 and 1.0. Lower ranking clusters contribute less to this score. | 
					
						
							|  |  |  | } |