Skip to content
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.

Commit c2c7bd8

Browse files
authored Apr 13, 2020
Merge pull request #46 from Arkoniak/elkan_algorithm
Full Elkan implementation and refactoring of MLJ Interface
2 parents a44f676 + 9f8f5b4 commit c2c7bd8

14 files changed

+514
-443
lines changed
 

‎Project.toml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
11
name = "ParallelKMeans"
22
uuid = "42b8e9d4-006b-409a-8472-7f34b3fb58af"
33
authors = ["Bernard Brenyah", "Andrey Oskin"]
4-
version = "0.1.1"
4+
version = "0.1.2"
55

66
[deps]
77
Distances = "b4f34e82-e78d-54a5-968a-f98e89d6e8f7"

‎docs/src/index.md

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
# ParallelKMeans.jl Package
1+
# [ParallelKMeans.jl Package](https://github.com/PyDataBlog/ParallelKMeans.jl)
22

33
```@contents
44
Depth = 4
@@ -59,7 +59,7 @@ git checkout experimental
5959

6060
- [X] Implementation of [Hamerly implementation](https://www.researchgate.net/publication/220906984_Making_k-means_Even_Faster).
6161
- [X] Interface for inclusion in Alan Turing Institute's [MLJModels](https://github.com/alan-turing-institute/MLJModels.jl#who-is-this-repo-for).
62-
- [ ] Full Implementation of Triangle inequality based on [Elkan - 2003 Using the Triangle Inequality to Accelerate K-Means"](https://www.aaai.org/Papers/ICML/2003/ICML03-022.pdf).
62+
- [X] Full Implementation of Triangle inequality based on [Elkan - 2003 Using the Triangle Inequality to Accelerate K-Means"](https://www.aaai.org/Papers/ICML/2003/ICML03-022.pdf).
6363
- [ ] Implementation of [Geometric methods to accelerate k-means algorithm](http://cs.baylor.edu/~hamerly/papers/sdm2016_rysavy_hamerly.pdf).
6464
- [ ] Native support for tabular data inputs outside of MLJModels' interface.
6565
- [ ] Refactoring and finalization of API design.
@@ -177,6 +177,7 @@ ________________________________________________________________________________
177177

178178
- 0.1.0 Initial release
179179
- 0.1.1 Added interface for MLJ
180+
- 0.1.2 Added Elkan algorithm
180181

181182
## Contributing
182183

‎src/ParallelKMeans.jl

Lines changed: 5 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,18 +1,20 @@
11
module ParallelKMeans
22

33
using StatsBase
4-
using MLJModelInterface
4+
import MLJModelInterface
55
import Base.Threads: @spawn
66
import Distances
77

8+
const MMI = MLJModelInterface
9+
810
include("seeding.jl")
911
include("kmeans.jl")
1012
include("lloyd.jl")
11-
include("light_elkan.jl")
1213
include("hamerly.jl")
14+
include("elkan.jl")
1315
include("mlj_interface.jl")
1416

1517
export kmeans
16-
export Lloyd, LightElkan, Hamerly
18+
export Lloyd, Hamerly, Elkan
1719

1820
end # module

‎src/elkan.jl

Lines changed: 278 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,278 @@
1+
"""
2+
Elkan()
3+
4+
Elkan algorithm implementation, based on "Charles Elkan. 2003.
5+
Using the triangle inequality to accelerate k-means.
6+
In Proceedings of the Twentieth International Conference on
7+
International Conference on Machine Learning (ICML’03). AAAI Press, 147–153."
8+
9+
This algorithm provides much faster convergence than the Lloyd algorithm, especially
10+
for high dimensional data.
11+
It can be used directly in `kmeans` function
12+
13+
```julia
14+
X = rand(30, 100_000) # 100_000 random points in 30 dimensions
15+
16+
kmeans(Elkan(), X, 3) # 3 clusters, Elkan algorithm
17+
```
18+
"""
19+
struct Elkan <: AbstractKMeansAlg end
20+
21+
function kmeans!(alg::Elkan, containers, X, k;
22+
n_threads = Threads.nthreads(),
23+
k_init = "k-means++", max_iters = 300,
24+
tol = 1e-6, verbose = false, init = nothing)
25+
nrow, ncol = size(X)
26+
centroids = init == nothing ? smart_init(X, k, n_threads, init=k_init).centroids : deepcopy(init)
27+
28+
update_containers(alg, containers, centroids, n_threads)
29+
@parallelize n_threads ncol chunk_initialize(alg, containers, centroids, X)
30+
31+
converged = false
32+
niters = 0
33+
J_previous = 0.0
34+
35+
# Update centroids & labels with closest members until convergence
36+
while niters < max_iters
37+
niters += 1
38+
# Core iteration
39+
@parallelize n_threads ncol chunk_update_centroids(alg, containers, centroids, X)
40+
41+
# Collect distributed containers (such as centroids_new, centroids_cnt)
42+
# in paper it is step 4
43+
collect_containers(alg, containers, n_threads)
44+
45+
J = sum(containers.ub)
46+
47+
# auxiliary calculation, in paper it's d(c, m(c))
48+
calculate_centroids_movement(alg, containers, centroids)
49+
50+
# lower and upper bounds update, in paper it's steps 5 and 6
51+
@parallelize n_threads ncol chunk_update_bounds(alg, containers, centroids)
52+
53+
# Step 7, final assignment of new centroids
54+
centroids .= containers.centroids_new[end]
55+
56+
if verbose
57+
# Show progress and terminate if J stopped decreasing.
58+
println("Iteration $niters: Jclust = $J")
59+
end
60+
61+
# Check for convergence
62+
if (niters > 1) & (abs(J - J_previous) < (tol * J))
63+
converged = true
64+
break
65+
end
66+
67+
# Step 1 in original paper, calculation of distance d(c, c')
68+
update_containers(alg, containers, centroids, n_threads)
69+
J_previous = J
70+
end
71+
72+
@parallelize n_threads ncol sum_of_squares(containers, X, containers.labels, centroids)
73+
totalcost = sum(containers.sum_of_squares)
74+
75+
# Terminate algorithm with the assumption that K-means has converged
76+
if verbose & converged
77+
println("Successfully terminated with convergence.")
78+
end
79+
80+
# TODO empty placeholder vectors should be calculated
81+
# TODO Float64 type definitions is too restrictive, should be relaxed
82+
# especially during GPU related development
83+
return KmeansResult(centroids, containers.labels, Float64[], Int[], Float64[], totalcost, niters, converged)
84+
end
85+
86+
function create_containers(::Elkan, k, nrow, ncol, n_threads)
87+
lng = n_threads + 1
88+
centroids_new = Vector{Array{Float64,2}}(undef, lng)
89+
centroids_cnt = Vector{Vector{Int}}(undef, lng)
90+
91+
for i = 1:lng
92+
centroids_new[i] = zeros(nrow, k)
93+
centroids_cnt[i] = zeros(k)
94+
end
95+
96+
centroids_dist = Matrix{Float64}(undef, k, k)
97+
98+
# lower bounds
99+
lb = Matrix{Float64}(undef, k, ncol)
100+
101+
# upper bounds
102+
ub = Vector{Float64}(undef, ncol)
103+
104+
# r(x) in original paper, shows whether point distance should be updated
105+
stale = ones(Bool, ncol)
106+
107+
# distance that centroid moved
108+
p = Vector{Float64}(undef, k)
109+
110+
labels = zeros(Int, ncol)
111+
112+
# total_sum_calculation
113+
sum_of_squares = Vector{Float64}(undef, n_threads)
114+
115+
return (
116+
centroids_new = centroids_new,
117+
centroids_cnt = centroids_cnt,
118+
labels = labels,
119+
centroids_dist = centroids_dist,
120+
lb = lb,
121+
ub = ub,
122+
stale = stale,
123+
p = p,
124+
sum_of_squares = sum_of_squares
125+
)
126+
end
127+
128+
function chunk_initialize(::Elkan, containers, centroids, X, r, idx)
129+
ub = containers.ub
130+
lb = containers.lb
131+
centroids_dist = containers.centroids_dist
132+
labels = containers.labels
133+
centroids_new = containers.centroids_new[idx]
134+
centroids_cnt = containers.centroids_cnt[idx]
135+
136+
@inbounds for i in r
137+
min_dist = distance(X, centroids, i, 1)
138+
label = 1
139+
lb[label, i] = min_dist
140+
for j in 2:size(centroids, 2)
141+
# triangular inequality
142+
if centroids_dist[j, label] > min_dist
143+
lb[j, i] = min_dist
144+
else
145+
dist = distance(X, centroids, i, j)
146+
label = dist < min_dist ? j : label
147+
min_dist = dist < min_dist ? dist : min_dist
148+
lb[j, i] = dist
149+
end
150+
end
151+
ub[i] = min_dist
152+
labels[i] = label
153+
centroids_cnt[label] += 1
154+
for j in axes(X, 1)
155+
centroids_new[j, label] += X[j, i]
156+
end
157+
end
158+
end
159+
160+
function update_containers(::Elkan, containers, centroids, n_threads)
161+
# unpack containers for easier manipulations
162+
centroids_dist = containers.centroids_dist
163+
164+
k = size(centroids_dist, 1) # number of clusters
165+
@inbounds for j in axes(centroids_dist, 2)
166+
min_dist = Inf
167+
for i in j + 1:k
168+
d = distance(centroids, centroids, i, j)
169+
centroids_dist[i, j] = d
170+
centroids_dist[j, i] = d
171+
min_dist = min_dist < d ? min_dist : d
172+
end
173+
for i in 1:j - 1
174+
min_dist = min_dist < centroids_dist[j, i] ? min_dist : centroids_dist[j, i]
175+
end
176+
centroids_dist[j, j] = min_dist
177+
end
178+
179+
# TODO: oh, one should be careful here. inequality holds for Euclidean metrics
180+
# not squared Euclidean. So, for Lp norm it should be something like
181+
# centroids_dist = 0.5^p. Should check one more time original paper
182+
centroids_dist .*= 0.25
183+
184+
return centroids_dist
185+
end
186+
187+
function chunk_update_centroids(::Elkan, containers, centroids, X, r, idx)
188+
# unpack
189+
ub = containers.ub
190+
lb = containers.lb
191+
centroids_dist = containers.centroids_dist
192+
labels = containers.labels
193+
stale = containers.stale
194+
centroids_new = containers.centroids_new[idx]
195+
centroids_cnt = containers.centroids_cnt[idx]
196+
197+
@inbounds for i in r
198+
label_old = labels[i]
199+
label = label_old
200+
min_dist = ub[i]
201+
# tighten the loop, exclude points that are very close to the center
202+
min_dist <= centroids_dist[label, label] && continue
203+
for j in axes(centroids, 2)
204+
# tighten the loop once more, exclude far away centers
205+
j == label && continue
206+
min_dist <= lb[j, i] && continue
207+
min_dist <= centroids_dist[j, label] && continue
208+
209+
# one calculation per iteration is enough
210+
if stale[i]
211+
min_dist = distance(X, centroids, i, label)
212+
lb[label, i] = min_dist
213+
ub[i] = min_dist
214+
stale[i] = false
215+
end
216+
217+
if (min_dist > lb[j, i]) | (min_dist > centroids_dist[j, label])
218+
dist = distance(X, centroids, i, j)
219+
lb[j, i] = dist
220+
if dist < min_dist
221+
min_dist = dist
222+
label = j
223+
end
224+
end
225+
end
226+
227+
if label != label_old
228+
labels[i] = label
229+
centroids_cnt[label_old] -= 1
230+
centroids_cnt[label] += 1
231+
for j in axes(X, 1)
232+
centroids_new[j, label_old] -= X[j, i]
233+
centroids_new[j, label] += X[j, i]
234+
end
235+
end
236+
end
237+
end
238+
239+
function collect_containers(alg::Elkan, containers, n_threads)
240+
if n_threads == 1
241+
@inbounds containers.centroids_new[end] .= containers.centroids_new[1] ./ containers.centroids_cnt[1]'
242+
else
243+
@inbounds containers.centroids_new[end] .= containers.centroids_new[1]
244+
@inbounds containers.centroids_cnt[end] .= containers.centroids_cnt[1]
245+
@inbounds for i in 2:n_threads
246+
containers.centroids_new[end] .+= containers.centroids_new[i]
247+
containers.centroids_cnt[end] .+= containers.centroids_cnt[i]
248+
end
249+
250+
@inbounds containers.centroids_new[end] .= containers.centroids_new[end] ./ containers.centroids_cnt[end]'
251+
end
252+
end
253+
254+
function calculate_centroids_movement(alg::Elkan, containers, centroids)
255+
p = containers.p
256+
centroids_new = containers.centroids_new[end]
257+
258+
for i in axes(centroids, 2)
259+
p[i] = distance(centroids, centroids_new, i, i)
260+
end
261+
end
262+
263+
264+
function chunk_update_bounds(alg, containers, centroids, r, idx)
265+
p = containers.p
266+
lb = containers.lb
267+
ub = containers.ub
268+
stale = containers.stale
269+
labels = containers.labels
270+
271+
@inbounds for i in r
272+
for j in axes(centroids, 2)
273+
lb[j, i] = lb[j, i] > p[j] ? lb[j, i] + p[j] - 2*sqrt(abs(lb[j, i]*p[j])) : 0.0
274+
end
275+
stale[i] = true
276+
ub[i] += p[labels[i]] + 2*sqrt(abs(ub[i]*p[labels[i]]))
277+
end
278+
end

‎src/hamerly.jl

Lines changed: 30 additions & 44 deletions
Original file line numberDiff line numberDiff line change
@@ -18,27 +18,14 @@ kmeans(Hamerly(), X, 3) # 3 clusters, Hamerly algorithm
1818
struct Hamerly <: AbstractKMeansAlg end
1919

2020

21-
function kmeans(alg::Hamerly, design_matrix, k;
21+
function kmeans!(alg::Hamerly, containers, X, k;
2222
n_threads = Threads.nthreads(),
2323
k_init = "k-means++", max_iters = 300,
2424
tol = 1e-6, verbose = false, init = nothing)
25-
nrow, ncol = size(design_matrix)
26-
containers = create_containers(alg, k, nrow, ncol, n_threads)
25+
nrow, ncol = size(X)
26+
centroids = init == nothing ? smart_init(X, k, n_threads, init=k_init).centroids : deepcopy(init)
2727

28-
return kmeans!(alg, containers, design_matrix, k, n_threads = n_threads,
29-
k_init = k_init, max_iters = max_iters, tol = tol,
30-
verbose = verbose, init = init)
31-
end
32-
33-
34-
function kmeans!(alg::Hamerly, containers, design_matrix, k;
35-
n_threads = Threads.nthreads(),
36-
k_init = "k-means++", max_iters = 300,
37-
tol = 1e-6, verbose = false, init = nothing)
38-
nrow, ncol = size(design_matrix)
39-
centroids = init == nothing ? smart_init(design_matrix, k, n_threads, init=k_init).centroids : deepcopy(init)
40-
41-
@parallelize n_threads ncol chunk_initialize!(alg, containers, centroids, design_matrix)
28+
@parallelize n_threads ncol chunk_initialize(alg, containers, centroids, X)
4229

4330
converged = false
4431
niters = 0
@@ -48,15 +35,15 @@ function kmeans!(alg::Hamerly, containers, design_matrix, k;
4835
# Update centroids & labels with closest members until convergence
4936
while niters < max_iters
5037
niters += 1
51-
update_containers!(containers, alg, centroids, n_threads)
52-
@parallelize n_threads ncol chunk_update_centroids!(centroids, containers, alg, design_matrix)
38+
update_containers(alg, containers, centroids, n_threads)
39+
@parallelize n_threads ncol chunk_update_centroids(alg, containers, centroids, X)
5340
collect_containers(alg, containers, n_threads)
5441

5542
J = sum(containers.ub)
56-
move_centers!(centroids, containers, alg)
43+
move_centers(alg, containers, centroids)
5744

5845
r1, r2, pr1, pr2 = double_argmax(p)
59-
@parallelize n_threads ncol chunk_update_bounds!(containers, r1, r2, pr1, pr2)
46+
@parallelize n_threads ncol chunk_update_bounds(alg, containers, r1, r2, pr1, pr2)
6047

6148
if verbose
6249
# Show progress and terminate if J stops decreasing as specified by the tolerance level.
@@ -70,10 +57,9 @@ function kmeans!(alg::Hamerly, containers, design_matrix, k;
7057
end
7158

7259
J_previous = J
73-
7460
end
7561

76-
@parallelize n_threads ncol sum_of_squares(containers, design_matrix, containers.labels, centroids)
62+
@parallelize n_threads ncol sum_of_squares(containers, X, containers.labels, centroids)
7763
totalcost = sum(containers.sum_of_squares)
7864

7965
# Terminate algorithm with the assumption that K-means has converged
@@ -144,29 +130,29 @@ function create_containers(alg::Hamerly, k, nrow, ncol, n_threads)
144130
end
145131

146132
"""
147-
chunk_initialize!(alg::Hamerly, containers, centroids, design_matrix, r, idx)
133+
chunk_initialize(alg::Hamerly, containers, centroids, design_matrix, r, idx)
148134
149135
Initial calculation of all bounds and points labeling.
150136
"""
151-
function chunk_initialize!(alg::Hamerly, containers, centroids, design_matrix, r, idx)
137+
function chunk_initialize(alg::Hamerly, containers, centroids, X, r, idx)
152138
centroids_cnt = containers.centroids_cnt[idx]
153139
centroids_new = containers.centroids_new[idx]
154140

155141
@inbounds for i in r
156-
label = point_all_centers!(containers, centroids, design_matrix, i)
142+
label = point_all_centers!(containers, centroids, X, i)
157143
centroids_cnt[label] += 1
158-
for j in axes(design_matrix, 1)
159-
centroids_new[j, label] += design_matrix[j, i]
144+
for j in axes(X, 1)
145+
centroids_new[j, label] += X[j, i]
160146
end
161147
end
162148
end
163149

164150
"""
165-
update_containers!(containers, ::Hamerly, centroids, n_threads)
151+
update_containers(::Hamerly, containers, centroids, n_threads)
166152
167153
Calculates minimum distances from centers to each other.
168154
"""
169-
function update_containers!(containers, ::Hamerly, centroids, n_threads)
155+
function update_containers(::Hamerly, containers, centroids, n_threads)
170156
s = containers.s
171157
s .= Inf
172158
@inbounds for i in axes(centroids, 2)
@@ -180,13 +166,13 @@ function update_containers!(containers, ::Hamerly, centroids, n_threads)
180166
end
181167

182168
"""
183-
chunk_update_centroids!(centroids, containers, alg::Hamerly, design_matrix, r, idx)
169+
chunk_update_centroids(::Hamerly, containers, centroids, X, r, idx)
184170
185171
Detailed description of this function can be found in the original paper. It iterates through
186172
all points and tries to skip some calculation using known upper and lower bounds of distances
187173
from point to centers. If it fails to skip, then it falls back to the generic `point_all_centers!` function.
188174
"""
189-
function chunk_update_centroids!(centroids, containers, alg::Hamerly, design_matrix, r, idx)
175+
function chunk_update_centroids(alg::Hamerly, containers, centroids, X, r, idx)
190176

191177
# unpack containers for easier manipulations
192178
centroids_new = containers.centroids_new[idx]
@@ -203,17 +189,17 @@ function chunk_update_centroids!(centroids, containers, alg::Hamerly, design_mat
203189
if ub[i] > m
204190
# tighten upper bound
205191
label = labels[i]
206-
ub[i] = distance(design_matrix, centroids, i, label)
192+
ub[i] = distance(X, centroids, i, label)
207193
# second bound test
208194
if ub[i] > m
209-
label_new = point_all_centers!(containers, centroids, design_matrix, i)
195+
label_new = point_all_centers!(containers, centroids, X, i)
210196
if label != label_new
211197
labels[i] = label_new
212198
centroids_cnt[label_new] += 1
213199
centroids_cnt[label] -= 1
214-
for j in axes(design_matrix, 1)
215-
centroids_new[j, label_new] += design_matrix[j, i]
216-
centroids_new[j, label] -= design_matrix[j, i]
200+
for j in axes(X, 1)
201+
centroids_new[j, label_new] += X[j, i]
202+
centroids_new[j, label] -= X[j, i]
217203
end
218204
end
219205
end
@@ -222,11 +208,11 @@ function chunk_update_centroids!(centroids, containers, alg::Hamerly, design_mat
222208
end
223209

224210
"""
225-
point_all_centers!(containers, centroids, design_matrix, i)
211+
point_all_centers!(containers, centroids, X, i)
226212
227213
Calculates new labels and upper and lower bounds for all points.
228214
"""
229-
function point_all_centers!(containers, centroids, design_matrix, i)
215+
function point_all_centers!(containers, centroids, X, i)
230216
ub = containers.ub
231217
lb = containers.lb
232218
labels = containers.labels
@@ -235,7 +221,7 @@ function point_all_centers!(containers, centroids, design_matrix, i)
235221
min_distance2 = Inf
236222
label = 1
237223
@inbounds for k in axes(centroids, 2)
238-
dist = distance(design_matrix, centroids, i, k)
224+
dist = distance(X, centroids, i, k)
239225
if min_distance > dist
240226
label = k
241227
min_distance2 = min_distance
@@ -253,12 +239,12 @@ function point_all_centers!(containers, centroids, design_matrix, i)
253239
end
254240

255241
"""
256-
move_centers!(centroids, containers, ::Hamerly)
242+
move_centers(::Hamerly, containers, centroids)
257243
258244
Calculates new positions of centers and distance they have moved. Results are stored
259245
in `centroids` and `p` respectively.
260246
"""
261-
function move_centers!(centroids, containers, ::Hamerly)
247+
function move_centers(::Hamerly, containers, centroids)
262248
centroids_new = containers.centroids_new[end]
263249
p = containers.p
264250

@@ -273,11 +259,11 @@ function move_centers!(centroids, containers, ::Hamerly)
273259
end
274260

275261
"""
276-
chunk_update_bounds!(containers, r1, r2, pr1, pr2, r, idx)
262+
chunk_update_bounds(alg::Hamerly, containers, r1, r2, pr1, pr2, r, idx)
277263
278264
Updates upper and lower bounds of point distance to the centers, with regard to the centers movement.
279265
"""
280-
function chunk_update_bounds!(containers, r1, r2, pr1, pr2, r, idx)
266+
function chunk_update_bounds(alg::Hamerly, containers, r1, r2, pr1, pr2, r, idx)
281267
p = containers.p
282268
ub = containers.ub
283269
lb = containers.lb

‎src/kmeans.jl

Lines changed: 1 addition & 109 deletions
Original file line numberDiff line numberDiff line change
@@ -93,6 +93,7 @@ Allocationless calculation of squared Euclidean distance between vectors X1[:, i1
9393
"""
9494
function distance(X1, X2, i1, i2)
9595
d = 0.0
96+
# TODO: break out of the loop if d is larger than the threshold (known minimum distance)
9697
@inbounds for i in axes(X1, 1)
9798
d += (X1[i, i1] - X2[i, i2])^2
9899
end
@@ -108,18 +109,6 @@ design matrix(x), centroids (centre), and the number of desired groups (k).
108109
109110
A Float type representing the computed metric is returned.
110111
"""
111-
function sum_of_squares(x, labels, centre)
112-
s = 0.0
113-
114-
@inbounds for j in axes(x, 2)
115-
for i in axes(x, 1)
116-
s += (x[i, j] - centre[i, labels[j]])^2
117-
end
118-
end
119-
120-
return s
121-
end
122-
123112
function sum_of_squares(containers, x, labels, centre, r, idx)
124113
s = 0.0
125114

@@ -170,100 +159,3 @@ function kmeans(alg, design_matrix, k;
170159
k_init = k_init, max_iters = max_iters, tol = tol,
171160
verbose = verbose, init = init)
172161
end
173-
174-
175-
"""
176-
Kmeans!(alg::AbstractKMeansAlg, containers, design_matrix, k; n_threads = nthreads(), k_init="k-means++", max_iters=300, tol=1e-6, verbose=false)
177-
178-
Mutable version of `kmeans` function. Definition of arguments and results can be
179-
found in `kmeans`.
180-
181-
Argument `containers` represent algorithm specific containers, such as labels, intermidiate
182-
centroids and so on, which are used during calculations.
183-
"""
184-
function kmeans!(alg, containers, design_matrix, k;
185-
n_threads = Threads.nthreads(),
186-
k_init = "k-means++", max_iters = 300,
187-
tol = 1e-6, verbose = false, init = nothing)
188-
nrow, ncol = size(design_matrix)
189-
centroids = init == nothing ? smart_init(design_matrix, k, n_threads, init=k_init).centroids : deepcopy(init)
190-
191-
converged = false
192-
niters = 0
193-
J_previous = 0.0
194-
195-
# Update centroids & labels with closest members until convergence
196-
197-
while niters < max_iters
198-
niters += 1
199-
200-
update_containers!(containers, alg, centroids, n_threads)
201-
J = update_centroids!(centroids, containers, alg, design_matrix, n_threads)
202-
203-
if verbose
204-
# Show progress and terminate if J stopped decreasing.
205-
println("Iteration $niters: Jclust = $J")
206-
end
207-
208-
# Check for convergence
209-
if (niters > 1) & (abs(J - J_previous) < (tol * J))
210-
converged = true
211-
break
212-
end
213-
214-
J_previous = J
215-
216-
end
217-
218-
totalcost = sum_of_squares(design_matrix, containers.labels, centroids)
219-
220-
# Terminate algorithm with the assumption that K-means has converged
221-
if verbose & converged
222-
println("Successfully terminated with convergence.")
223-
end
224-
225-
# TODO empty placeholder vectors should be calculated
226-
# TODO Float64 type definitions is too restrictive, should be relaxed
227-
# especially during GPU related development
228-
return KmeansResult(centroids, containers.labels, Float64[], Int[], Float64[], totalcost, niters, converged)
229-
end
230-
231-
"""
232-
update_centroids!(centroids, containers, alg, design_matrix, n_threads)
233-
234-
Internal function, used to update centroids by utilizing one of `alg`. It works as
235-
a wrapper of internal `chunk_update_centroids!` function, splitting incoming
236-
`design_matrix` in chunks and combining results together.
237-
"""
238-
function update_centroids!(centroids, containers, alg, design_matrix, n_threads)
239-
ncol = size(design_matrix, 2)
240-
241-
if n_threads == 1
242-
r = axes(design_matrix, 2)
243-
J = chunk_update_centroids!(centroids, containers, alg, design_matrix, r, 1)
244-
245-
centroids .= containers.new_centroids[1] ./ containers.centroids_cnt[1]'
246-
else
247-
ranges = splitter(ncol, n_threads)
248-
249-
waiting_list = Vector{Task}(undef, n_threads - 1)
250-
251-
for i in 1:length(ranges) - 1
252-
waiting_list[i] = @spawn chunk_update_centroids!(centroids, containers,
253-
alg, design_matrix, ranges[i], i + 1)
254-
end
255-
256-
J = chunk_update_centroids!(centroids, containers, alg, design_matrix, ranges[end], 1)
257-
258-
J += sum(fetch.(waiting_list))
259-
260-
for i in 1:length(ranges) - 1
261-
containers.new_centroids[1] .+= containers.new_centroids[i + 1]
262-
containers.centroids_cnt[1] .+= containers.centroids_cnt[i + 1]
263-
end
264-
265-
centroids .= containers.new_centroids[1] ./ containers.centroids_cnt[1]'
266-
end
267-
268-
return J
269-
end

‎src/light_elkan.jl

Lines changed: 0 additions & 150 deletions
This file was deleted.

‎src/lloyd.jl

Lines changed: 94 additions & 25 deletions
Original file line numberDiff line numberDiff line change
@@ -5,6 +5,61 @@ Basic algorithm for k-means calculation.
55
"""
66
struct Lloyd <: AbstractKMeansAlg end
77

8+
"""
9+
kmeans!(alg::AbstractKMeansAlg, containers, design_matrix, k; n_threads = nthreads(), k_init="k-means++", max_iters=300, tol=1e-6, verbose=false)
10+
11+
Mutable version of `kmeans` function. Definition of arguments and results can be
12+
found in `kmeans`.
13+
14+
Argument `containers` represents algorithm-specific containers, such as labels, intermediate
15+
centroids and so on, which are used during calculations.
16+
"""
17+
function kmeans!(alg::Lloyd, containers, X, k;
18+
n_threads = Threads.nthreads(),
19+
k_init = "k-means++", max_iters = 300,
20+
tol = 1e-6, verbose = false, init = nothing)
21+
nrow, ncol = size(X)
22+
centroids = init == nothing ? smart_init(X, k, n_threads, init=k_init).centroids : deepcopy(init)
23+
24+
converged = false
25+
niters = 1
26+
J_previous = 0.0
27+
28+
# Update centroids & labels with closest members until convergence
29+
while niters <= max_iters
30+
@parallelize n_threads ncol chunk_update_centroids(alg, containers, centroids, X)
31+
collect_containers(alg, containers, centroids, n_threads)
32+
J = sum(containers.J)
33+
34+
if verbose
35+
# Show progress and terminate if J stopped decreasing.
36+
println("Iteration $niters: Jclust = $J")
37+
end
38+
39+
# Check for convergence
40+
if (niters > 1) & (abs(J - J_previous) < (tol * J))
41+
converged = true
42+
break
43+
end
44+
45+
J_previous = J
46+
niters += 1
47+
end
48+
49+
@parallelize n_threads ncol sum_of_squares(containers, X, containers.labels, centroids)
50+
totalcost = sum(containers.sum_of_squares)
51+
52+
# Terminate algorithm with the assumption that K-means has converged
53+
if verbose & converged
54+
println("Successfully terminated with convergence.")
55+
end
56+
57+
# TODO empty placeholder vectors should be calculated
58+
# TODO Float64 type definitions is too restrictive, should be relaxed
59+
# especially during GPU related development
60+
return KmeansResult(centroids, containers.labels, Float64[], Int[], Float64[], totalcost, niters, converged)
61+
end
62+
863
kmeans(design_matrix, k;
964
n_threads = Threads.nthreads(),
1065
k_init = "k-means++", max_iters = 300, tol = 1e-6,
@@ -17,56 +72,70 @@ kmeans(design_matrix, k;
1772
1873
Internal function for the creation of all necessary intermediate structures.
1974
20-
- `new_centroids` - container which holds new positions of centroids
75+
- `centroids_new` - container which holds new positions of centroids
2176
- `centroids_cnt` - container which holds number of points for each centroid
2277
- `labels` - vector which holds labels of corresponding points
2378
"""
2479
function create_containers(::Lloyd, k, nrow, ncol, n_threads)
25-
new_centroids = Vector{Array{Float64, 2}}(undef, n_threads)
26-
centroids_cnt = Vector{Vector{Int}}(undef, n_threads)
80+
lng = n_threads + 1
81+
centroids_new = Vector{Array{Float64,2}}(undef, lng)
82+
centroids_cnt = Vector{Vector{Int}}(undef, lng)
2783

28-
for i in 1:n_threads
29-
new_centroids[i] = Array{Float64, 2}(undef, nrow, k)
84+
for i in 1:lng
85+
centroids_new[i] = Array{Float64, 2}(undef, nrow, k)
3086
centroids_cnt[i] = Vector{Int}(undef, k)
3187
end
3288

3389
labels = Vector{Int}(undef, ncol)
3490

35-
return (new_centroids = new_centroids, centroids_cnt = centroids_cnt,
36-
labels = labels)
37-
end
91+
J = Vector{Float64}(undef, n_threads)
3892

39-
update_containers!(containers, ::Lloyd, centroids, n_threads) = nothing
93+
# total_sum_calculation
94+
sum_of_squares = Vector{Float64}(undef, n_threads)
4095

41-
function chunk_update_centroids!(centroids, containers, ::Lloyd,
42-
design_matrix, r, idx)
96+
return (centroids_new = centroids_new, centroids_cnt = centroids_cnt,
97+
labels = labels, J = J, sum_of_squares = sum_of_squares)
98+
end
4399

100+
function chunk_update_centroids(::Lloyd, containers, centroids, X, r, idx)
44101
# unpack containers for easier manipulations
45-
new_centroids = containers.new_centroids[idx]
102+
centroids_new = containers.centroids_new[idx]
46103
centroids_cnt = containers.centroids_cnt[idx]
47104
labels = containers.labels
48105

49-
new_centroids .= 0.0
106+
centroids_new .= 0.0
50107
centroids_cnt .= 0
51108
J = 0.0
52109
@inbounds for i in r
53-
min_distance = Inf
110+
min_dist = distance(X, centroids, i, 1)
54111
label = 1
55-
for k in axes(centroids, 2)
56-
distance = 0.0
57-
for j in axes(design_matrix, 1)
58-
distance += (design_matrix[j, i] - centroids[j, k])^2
59-
end
60-
label = min_distance > distance ? k : label
61-
min_distance = min_distance > distance ? distance : min_distance
112+
for j in 2:size(centroids, 2)
113+
dist = distance(X, centroids, i, j)
114+
label = dist < min_dist ? j : label
115+
min_dist = dist < min_dist ? dist : min_dist
62116
end
63117
labels[i] = label
64118
centroids_cnt[label] += 1
65-
for j in axes(design_matrix, 1)
66-
new_centroids[j, label] += design_matrix[j, i]
119+
for j in axes(X, 1)
120+
centroids_new[j, label] += X[j, i]
67121
end
68-
J += min_distance
122+
J += min_dist
69123
end
70124

71-
return J
125+
containers.J[idx] = J
126+
end
127+
128+
function collect_containers(alg::Lloyd, containers, centroids, n_threads)
129+
if n_threads == 1
130+
@inbounds centroids .= containers.centroids_new[1] ./ containers.centroids_cnt[1]'
131+
else
132+
@inbounds containers.centroids_new[end] .= containers.centroids_new[1]
133+
@inbounds containers.centroids_cnt[end] .= containers.centroids_cnt[1]
134+
@inbounds for i in 2:n_threads
135+
containers.centroids_new[end] .+= containers.centroids_new[i]
136+
containers.centroids_cnt[end] .+= containers.centroids_cnt[i]
137+
end
138+
139+
@inbounds centroids .= containers.centroids_new[end] ./ containers.centroids_cnt[end]'
140+
end
72141
end

‎src/mlj_interface.jl

Lines changed: 42 additions & 35 deletions
Original file line numberDiff line numberDiff line change
@@ -5,13 +5,13 @@ const ParallelKMeans_Desc = "Parallel & lightning fast implementation of all ava
55
# available variants for reference
66
const MLJDICT = Dict(:Lloyd => Lloyd(),
77
:Hamerly => Hamerly(),
8-
:LightElkan => LightElkan())
8+
:Elkan => Elkan())
99

1010
####
1111
#### MODEL DEFINITION
1212
####
1313

14-
mutable struct KMeans <: MLJModelInterface.Unsupervised
14+
mutable struct KMeans <: MMI.Unsupervised
1515
algo::Symbol
1616
k_init::String
1717
k::Int
@@ -24,49 +24,56 @@ mutable struct KMeans <: MLJModelInterface.Unsupervised
2424
end
2525

2626

27-
function KMeans(; algo=:Lloyd, k_init="k-means++",
27+
function KMeans(; algo=:Hamerly, k_init="k-means++",
2828
k=3, tol=1e-6, max_iters=300, copy=true,
2929
threads=Threads.nthreads(), verbosity=0, init=nothing)
3030

3131
model = KMeans(algo, k_init, k, tol, max_iters, copy, threads, verbosity, init)
32-
message = MLJModelInterface.clean!(model)
32+
message = MMI.clean!(model)
3333
isempty(message) || @warn message
3434
return model
3535
end
3636

3737

38-
function MLJModelInterface.clean!(m::KMeans)
39-
warning = ""
38+
function MMI.clean!(m::KMeans)
39+
warning = String[]
4040

4141
if !(m.algo keys(MLJDICT))
42-
warning *= "Unsupported KMeans variant, Defauting to KMeans++ seeding algorithm."
43-
m.algo = :Lloyd
42+
push!(warning, "Unsupported KMeans variant. Defaulting to Hamerly algorithm.")
43+
m.algo = :Hamerly
44+
end
4445

45-
elseif m.k_init != "k-means++"
46-
warning *= "Only `k-means++` or random seeding algorithms are supported. Defaulting to random seeding."
47-
m.k_init = "random"
46+
if !(m.k_init ["k-means++", "random"])
47+
push!(warning, "Only \"k-means++\" or \"random\" seeding algorithms are supported. Defaulting to k-means++ seeding.")
48+
m.k_init = "kmeans++"
49+
end
4850

49-
elseif m.k < 1
50-
warning *= "Number of clusters must be greater than 0. Defaulting to 3 clusters."
51+
if m.k < 1
52+
push!(warning, "Number of clusters must be greater than 0. Defaulting to 3 clusters.")
5153
m.k = 3
54+
end
5255

53-
elseif !(m.tol < 1.0)
54-
warning *= "Tolerance level must be less than 1. Defaulting to tol of 1e-6."
56+
if !(m.tol < 1.0)
57+
push!(warning, "Tolerance level must be less than 1. Defaulting to tol of 1e-6.")
5558
m.tol = 1e-6
59+
end
5660

57-
elseif !(m.max_iters > 0)
58-
warning *= "Number of permitted iterations must be greater than 0. Defaulting to 300 iterations."
61+
if !(m.max_iters > 0)
62+
push!(warning, "Number of permitted iterations must be greater than 0. Defaulting to 300 iterations.")
5963
m.max_iters = 300
64+
end
6065

61-
elseif !(m.threads > 0)
62-
warning *= "Number of threads must be at least 1. Defaulting to all threads available."
66+
if !(m.threads > 0)
67+
push!(warning, "Number of threads must be at least 1. Defaulting to all threads available.")
6368
m.threads = Threads.nthreads()
69+
end
6470

65-
elseif !(m.verbosity (0, 1))
66-
warning *= "Verbosity must be either 0 (no info) or 1 (info requested). Defaulting to 0."
67-
m.verbosity = 0
71+
if !(m.verbosity (0, 1))
72+
push!(warning, "Verbosity must be either 0 (no info) or 1 (info requested). Defaulting to 1.")
73+
m.verbosity = 1
6874
end
69-
return warning
75+
76+
return join(warning, "\n")
7077
end
7178

7279

@@ -78,14 +85,14 @@ end
7885
7986
See also the [package documentation](https://pydatablog.github.io/ParallelKMeans.jl/stable).
8087
"""
81-
function MLJModelInterface.fit(m::KMeans, X)
88+
function MMI.fit(m::KMeans, X)
8289
# convert tabular input data into the matrix model expects. Column assumed as features so input data is permuted
8390
if !m.copy
8491
# permutes dimensions of input table without copying and pass to model
85-
DMatrix = convert(Array{Float64, 2}, MLJModelInterface.matrix(X)')
92+
DMatrix = convert(Array{Float64, 2}, MMI.matrix(X)')
8693
else
8794
# permutes dimensions of input table as a column major matrix from a copy of the data
88-
DMatrix = convert(Array{Float64, 2}, MLJModelInterface.matrix(X, transpose=true))
95+
DMatrix = convert(Array{Float64, 2}, MMI.matrix(X, transpose=true))
8996
end
9097

9198
# lookup available algorithms
@@ -106,7 +113,7 @@ function MLJModelInterface.fit(m::KMeans, X)
106113
end
107114

108115

109-
function MLJModelInterface.fitted_params(model::KMeans, fitresult)
116+
function MMI.fitted_params(model::KMeans, fitresult)
110117
# extract what's relevant from `fitresult`
111118
results, _, _ = fitresult # unpack fitresult
112119
centers = results.centers
@@ -124,15 +131,15 @@ end
124131
#### PREDICT FUNCTION
125132
####
126133

127-
function MLJModelInterface.transform(m::KMeans, fitresult, Xnew)
134+
function MMI.transform(m::KMeans, fitresult, Xnew)
128135
# make predictions/assignments using the learned centroids
129136

130137
if !m.copy
131138
# permutes dimensions of input table without copying and pass to model
132-
DMatrix = convert(Array{Float64, 2}, MLJModelInterface.matrix(Xnew)')
139+
DMatrix = convert(Array{Float64, 2}, MMI.matrix(Xnew)')
133140
else
134141
# permutes dimensions of input table as a column major matrix from a copy of the data
135-
DMatrix = convert(Array{Float64, 2}, MLJModelInterface.matrix(Xnew, transpose=true))
142+
DMatrix = convert(Array{Float64, 2}, MMI.matrix(Xnew, transpose=true))
136143
end
137144

138145
# TODO: Warn users if fitresult is from a `non-converged` fit?
@@ -147,7 +154,7 @@ function MLJModelInterface.transform(m::KMeans, fitresult, Xnew)
147154
centroids = results.centers
148155
distances = Distances.pairwise(Distances.SqEuclidean(), DMatrix, centroids; dims=2)
149156
preds = argmin.(eachrow(distances))
150-
return MLJModelInterface.table(reshape(preds, :, 1), prototype=Xnew)
157+
return MMI.table(reshape(preds, :, 1), prototype=Xnew)
151158
end
152159

153160

@@ -156,7 +163,7 @@ end
156163
####
157164

158165
# TODO 4: metadata for the package and for each of the model interfaces
159-
metadata_pkg.(KMeans,
166+
MMI.metadata_pkg.(KMeans,
160167
name = "ParallelKMeans",
161168
uuid = "42b8e9d4-006b-409a-8472-7f34b3fb58af",
162169
url = "https://github.com/PyDataBlog/ParallelKMeans.jl",
@@ -166,9 +173,9 @@ metadata_pkg.(KMeans,
166173

167174

168175
# Metadata for ParaKMeans model interface
169-
metadata_model(KMeans,
170-
input = MLJModelInterface.Table(MLJModelInterface.Continuous),
171-
output = MLJModelInterface.Table(MLJModelInterface.Count),
176+
MMI.metadata_model(KMeans,
177+
input = MMI.Table(MMI.Continuous),
178+
output = MMI.Table(MMI.Count),
172179
weights = false,
173180
descr = ParallelKMeans_Desc,
174181
path = "ParallelKMeans.KMeans")

‎test/test02_kmeans.jl renamed to ‎test/test02_lloyd.jl

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
module TestKMeans
1+
module TestLloyd
22

33
using ParallelKMeans
44
using Test

‎test/test04_elkan.jl

Lines changed: 11 additions & 28 deletions
Original file line numberDiff line numberDiff line change
@@ -1,64 +1,47 @@
11
module TestElkan
22

33
using ParallelKMeans
4-
using ParallelKMeans: update_containers!
54
using Test
65
using Random
76

8-
@testset "centroid distances" begin
9-
containers = (centroids_dist = Matrix{Float64}(undef, 3, 3), )
10-
centroids = [1.0 2.0 4.0; 2.0 1.0 3.0]
11-
update_containers!(containers, LightElkan(), centroids, 1)
12-
centroids_dist = containers.centroids_dist
13-
@test centroids_dist[1, 2] == centroids_dist[2, 1]
14-
@test centroids_dist[1, 3] == centroids_dist[3, 1]
15-
@test centroids_dist[2, 3] == centroids_dist[3, 2]
16-
@test centroids_dist[1, 2] == 0.5
17-
@test centroids_dist[1, 3] == 2.5
18-
@test centroids_dist[2, 3] == 2.0
19-
@test centroids_dist[1, 1] == 0.5
20-
@test centroids_dist[2, 2] == 0.5
21-
@test centroids_dist[3, 3] == 2.0
22-
end
23-
24-
@testset "basic kmeans" begin
7+
@testset "basic kmeans elkan" begin
258
X = [1. 2. 4.;]
26-
res = kmeans(LightElkan(), X, 1; n_threads = 1, tol = 1e-6, verbose = false)
9+
res = kmeans(Elkan(), X, 1; n_threads = 1, tol = 1e-6, verbose = false)
2710
@test res.assignments == [1, 1, 1]
2811
@test res.centers[1] 2.3333333333333335
2912
@test res.totalcost 4.666666666666666
3013
@test res.converged
3114

32-
res = kmeans(LightElkan(), X, 2; n_threads = 1, init = [1.0 4.0], tol = 1e-6, verbose = false)
15+
res = kmeans(Elkan(), X, 2; n_threads = 1, init = [1.0 4.0], tol = 1e-6, verbose = false)
3316
@test res.assignments == [1, 1, 2]
3417
@test res.centers [1.5 4.0]
3518
@test res.totalcost 0.5
3619
@test res.converged
3720
end
3821

39-
@testset "no convergence yield last result" begin
22+
@testset "elkan no convergence yield last result" begin
4023
X = [1. 2. 4.;]
41-
res = kmeans(LightElkan(), X, 2; n_threads = 1, init = [1.0 4.0], tol = 1e-6, max_iters = 1, verbose = false)
24+
res = kmeans(Elkan(), X, 2; n_threads = 1, init = [1.0 4.0], tol = 1e-6, max_iters = 1, verbose = false)
4225
@test !res.converged
4326
@test res.totalcost 0.5
4427
end
4528

46-
@testset "singlethread linear separation" begin
29+
@testset "elkan singlethread linear separation" begin
4730
Random.seed!(2020)
4831

4932
X = rand(3, 100)
50-
res = kmeans(LightElkan(), X, 3; n_threads = 1, tol = 1e-6, verbose = false)
33+
res = kmeans(Elkan(), X, 3; n_threads = 1, tol = 1e-10, max_iters = 10, verbose = false)
5134

5235
@test res.totalcost 14.16198704459199
53-
@test res.converged
54-
@test res.iterations == 11
36+
@test !res.converged
37+
@test res.iterations == 10
5538
end
5639

57-
@testset "multithread linear separation quasi two threads" begin
40+
@testset "elkan multithread linear separation quasi two threads" begin
5841
Random.seed!(2020)
5942

6043
X = rand(3, 100)
61-
res = kmeans(LightElkan(), X, 3; n_threads = 2, tol = 1e-6, verbose = false)
44+
res = kmeans(Elkan(), X, 3; n_threads = 2, tol = 1e-6, verbose = false)
6245

6346
@test res.totalcost 14.16198704459199
6447
@test res.converged

‎test/test05_hamerly.jl

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
11
module TestHamerly
22

33
using ParallelKMeans
4-
using ParallelKMeans: chunk_initialize!, double_argmax
4+
using ParallelKMeans: chunk_initialize, double_argmax
55
using Test
66
using Random
77

@@ -11,7 +11,7 @@ using Random
1111
nrow, ncol = size(X)
1212
containers = ParallelKMeans.create_containers(Hamerly(), 3, nrow, ncol, 1)
1313

14-
ParallelKMeans.chunk_initialize!(Hamerly(), containers, centroids, X, 1:ncol, 1)
14+
ParallelKMeans.chunk_initialize(Hamerly(), containers, centroids, X, 1:ncol, 1)
1515
@test containers.lb == [18.0, 20.0, 5.0, 5.0]
1616
@test containers.ub == [0.0, 2.0, 0.0, 0.0]
1717
end

‎test/test06_verbose.jl

Lines changed: 19 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -6,7 +6,7 @@ using Test
66
using Suppressor
77

88

9-
@testset "Testing verbosity of implementation" begin
9+
@testset "LLoyd: Testing verbosity of implementation" begin
1010
Random.seed!(2020)
1111
X = rand(4, 150)
1212
Random.seed!(2020)
@@ -15,5 +15,22 @@ using Suppressor
1515
@test r == "Iteration 1: Jclust = 46.534795844478815\n"
1616
end
1717

18-
end # module
18+
@testset "Hamerly: Testing verbosity of implementation" begin
19+
Random.seed!(2020)
20+
X = rand(4, 150)
21+
Random.seed!(2020)
22+
# Capture output and compare
23+
r = @capture_out kmeans(Hamerly(), X, 3; n_threads=1, max_iters=1, verbose=true)
24+
@test r == "Iteration 1: Jclust = 46.534795844478815\n"
25+
end
1926

27+
@testset "Elkan: Testing verbosity of implementation" begin
28+
Random.seed!(2020)
29+
X = rand(4, 150)
30+
Random.seed!(2020)
31+
# Capture output and compare
32+
r = @capture_out kmeans(Elkan(), X, 3; n_threads=1, max_iters=1, verbose=true)
33+
@test r == "Iteration 1: Jclust = 46.534795844478815\n"
34+
end
35+
36+
end # module

‎test/test07_mlj_interface.jl

Lines changed: 27 additions & 41 deletions
Original file line numberDiff line numberDiff line change
@@ -11,7 +11,7 @@ using MLJBase
1111
@testset "Test struct construction" begin
1212
model = KMeans()
1313

14-
@test model.algo == :Lloyd
14+
@test model.algo == :Hamerly
1515
@test model.init == nothing
1616
@test model.k == 3
1717
@test model.k_init == "k-means++"
@@ -24,13 +24,13 @@ end
2424

2525

2626
@testset "Test bad struct warings" begin
27-
@test_logs (:warn, "Unsupported KMeans variant, Defauting to KMeans++ seeding algorithm.") ParallelKMeans.KMeans(algo=:Fake)
28-
@test_logs (:warn, "Only `k-means++` or random seeding algorithms are supported. Defaulting to random seeding.") ParallelKMeans.KMeans(k_init="abc")
27+
@test_logs (:warn, "Unsupported KMeans variant. Defaulting to Hamerly algorithm.") ParallelKMeans.KMeans(algo=:Fake)
28+
@test_logs (:warn, "Only \"k-means++\" or \"random\" seeding algorithms are supported. Defaulting to k-means++ seeding.") ParallelKMeans.KMeans(k_init="abc")
2929
@test_logs (:warn, "Number of clusters must be greater than 0. Defaulting to 3 clusters.") ParallelKMeans.KMeans(k=0)
3030
@test_logs (:warn, "Tolerance level must be less than 1. Defaulting to tol of 1e-6.") ParallelKMeans.KMeans(tol=2)
3131
@test_logs (:warn, "Number of permitted iterations must be greater than 0. Defaulting to 300 iterations.") ParallelKMeans.KMeans(max_iters=0)
3232
@test_logs (:warn, "Number of threads must be at least 1. Defaulting to all threads available.") ParallelKMeans.KMeans(threads=0)
33-
@test_logs (:warn, "Verbosity must be either 0 (no info) or 1 (info requested). Defaulting to 0.") ParallelKMeans.KMeans(verbosity=100)
33+
@test_logs (:warn, "Verbosity must be either 0 (no info) or 1 (info requested). Defaulting to 1.") ParallelKMeans.KMeans(verbosity=100)
3434
end
3535

3636

@@ -47,75 +47,62 @@ end
4747
@testset "Test Lloyd model fitting" begin
4848
Random.seed!(2020)
4949
X = table([1 2; 1 4; 1 0; 10 2; 10 4; 10 0])
50-
model = KMeans(k=2)
51-
results = fit(model, X)
52-
53-
@test results[2] == nothing
54-
@test results[end].converged == true
55-
@test results[end].totalcost == 16
56-
end
57-
50+
X_test = table([10 1])
5851

59-
@testset "Test Hamerly model fitting" begin
60-
Random.seed!(2020)
61-
X = table([1 2; 1 4; 1 0; 10 2; 10 4; 10 0])
62-
model = KMeans(algo=:Hamerly, k=2)
52+
model = KMeans(algo = :Lloyd, k=2)
6353
results = fit(model, X)
6454

6555
@test results[2] == nothing
6656
@test results[end].converged == true
6757
@test results[end].totalcost == 16
68-
end
69-
70-
71-
@testset "Test Lloyd fitted params" begin
72-
Random.seed!(2020)
73-
X = table([1 2; 1 4; 1 0; 10 2; 10 4; 10 0])
74-
model = KMeans(k=2)
75-
results = fit(model, X)
7658

7759
params = fitted_params(model, results)
7860
@test params.converged == true
7961
@test params.totalcost == 16
62+
63+
# Use trained model to cluster new data X_test
64+
preds = transform(model, results, X_test)
65+
@test preds[:x1][1] == 2
8066
end
8167

8268

83-
@testset "Test Hamerly fitted params" begin
69+
@testset "Test Hamerly model fitting" begin
8470
Random.seed!(2020)
8571
X = table([1 2; 1 4; 1 0; 10 2; 10 4; 10 0])
72+
X_test = table([10 1])
73+
8674
model = KMeans(algo=:Hamerly, k=2)
8775
results = fit(model, X)
8876

77+
@test results[2] == nothing
78+
@test results[end].converged == true
79+
@test results[end].totalcost == 16
80+
8981
params = fitted_params(model, results)
9082
@test params.converged == true
9183
@test params.totalcost == 16
92-
end
93-
94-
95-
@testset "Test Lloyd transform" begin
96-
Random.seed!(2020)
97-
X = table([1 2; 1 4; 1 0; 10 2; 10 4; 10 0])
98-
X_test = table([10 1])
99-
100-
# Train model using training data X
101-
model = KMeans(k=2)
102-
results = fit(model, X)
10384

10485
# Use trained model to cluster new data X_test
10586
preds = transform(model, results, X_test)
10687
@test preds[:x1][1] == 2
10788
end
10889

109-
110-
@testset "Test Hamerly transform" begin
90+
@testset "Test Elkan model fitting" begin
11191
Random.seed!(2020)
11292
X = table([1 2; 1 4; 1 0; 10 2; 10 4; 10 0])
11393
X_test = table([10 1])
11494

115-
# Train model using training data X
116-
model = KMeans(algo=:Hamerly, k=2)
95+
model = KMeans(algo=:Elkan, k=2)
11796
results = fit(model, X)
11897

98+
@test results[2] == nothing
99+
@test results[end].converged == true
100+
@test results[end].totalcost == 16
101+
102+
params = fitted_params(model, results)
103+
@test params.converged == true
104+
@test params.totalcost == 16
105+
119106
# Use trained model to cluster new data X_test
120107
preds = transform(model, results, X_test)
121108
@test preds[:x1][1] == 2
@@ -133,4 +120,3 @@ end
133120
end
134121

135122
end # module
136-

0 commit comments

Comments
 (0)
Please sign in to comment.