Revision 20aefc9955133b9d3a2f3ea6366edd542e26701d authored by David Hofmeyr on 16 February 2018, 12:43:08 UTC, committed by cran-robot on 16 February 2018, 12:43:08 UTC
1 parent af98636
cluster_performance.Rd
\name{cluster_performance}
\alias{cluster_performance}
\title{External Cluster Validity Metrics}
\description{
Computes four popular external cluster validity metrics (adjusted Rand index, purity, V-measure and Normalised Mutual Information) through comparison of cluster assignments and true class labels.
}
\usage{
cluster_performance(assigned, labels, beta)
}
\arguments{
\item{assigned}{a vector of cluster assignments made by a clustering algorithm.}
\item{labels}{a vector of true class labels to be compared with assigned.}
\item{beta}{(optional) positive numeric, used in the computation of V-measure. larger values apply higher weight to homogeneity over completeness measures. if omitted then beta = 1 (equal weight applied to both measures).}
}
\value{
a vector containing the four evaluation metrics listed in the description.
}
\references{
Zhao Y., Karypis G. (2004) Empirical and Theoretical Comparisons of Selected Criterion
Functions for Document Clustering. \emph{Machine Learning}, \bold{55}(3), 311--331.
Strehl A., Ghosh J. (2002) Cluster ensembles—a knowledge reuse framework for combining
multiple partitions. \emph{Journal of Machine Learning Research}, \bold{3}, 583--617.
Rosenberg A., Hirschberg J. (2007) V-Measure: A Conditional Entropy-Based External
Cluster Evaluation Measure. \emph{EMNLP-CoNLL}, \bold{7}, 410--420. Citeseer.
Hubert, L., Arabie, P. (1985) Comparing Partitions. \emph{Journal of Classification}, \bold{2}(1), 193--218.
}
\examples{
## load dermatology dataset
data(dermatology)
## obtain clustering solution using MCDC
sol <- mcdc(dermatology$x, 6)
## evaluate solution using external cluster validity measures
cluster_performance(sol$cluster, dermatology$c)
}
\keyword{file}

Computing file changes ...