Spark library for generalized K-Means clustering. Supports general Bregman divergences. Suitable for clustering probabilistic data, time series data, high-dimensional data, and very large data.
- spark
- embeddings
- spark-mllib
- itakura-saito-divergence
- cosine-similarity
- kullback-leibler-divergence
- k-means
- entropy
- clustering
- euclidean-distance
- bregman-divergence
- similarity-search
Scala versions:
2.10
massivedatascience-clusterer 1.1.0
Group ID:
com.massivedatascience
Artifact ID:
massivedatascience-clusterer_2.10
Version:
1.1.0
Release Date:
Mar 6, 2015
Licenses:
libraryDependencies += "com.massivedatascience" %% "massivedatascience-clusterer" % "1.1.0"
resolvers += Resolver.bintrayRepo("derrickburns", "maven")
ivy"com.massivedatascience::massivedatascience-clusterer:1.1.0"
MavenRepository("https://dl.bintray.com/derrickburns/maven")
//> using dep "com.massivedatascience::massivedatascience-clusterer:1.1.0"
import $ivy.`com.massivedatascience::massivedatascience-clusterer:1.1.0`
import ammonite._, Resolvers._
val res = Resolver.Http(
  "Bintray derrickburns maven",
  "https://dl.bintray.com/derrickburns/maven",
  IvyPattern,
  false)
interp.resolvers() = interp.resolvers() :+ res
<dependency> <groupId>com.massivedatascience</groupId> <artifactId>massivedatascience-clusterer_2.10</artifactId> <version>1.1.0</version> </dependency>
compile group: 'com.massivedatascience', name: 'massivedatascience-clusterer_2.10', version: '1.1.0'