kmeans: Also test bytearray

jonnor · jonnor · commit 1dc371d8add8 · 2024-07-06T00:38:57.000+02:00
diff --git a/tests/test_kmeans.py b/tests/test_kmeans.py
@@ -4,28 +4,47 @@
 import array
 import gc
 
-def test_kmeans_two_clusters():
-    """
-    Data that is grouped into high/low should be clusterable into 2
-    """
+def make_two_cluster_data(typecode):
 
     n_features = 3
-    dataset = array.array('B', [
+    dataset = [
+        # cluster1
         0, 0, 0,
         10, 5, 2,
-
+    
+        # cluster2
         200, 50, 100,
         255, 255, 255,        
-    ])
+    ]
 
-    centroids = array.array('B', [
+    centroids = [
         0, 0, 0,
         200, 200, 200,
-    ])
+    ]
+
+    if typecode == 'bytearray':
+        dataset = bytearray(dataset)
+        centroids = bytearray(centroids)        
+    else:
+        dataset = array.array(typecode, dataset)
+        centroids = array.array(typecode, centroids)
+
+    return dataset, centroids
+
+
+def test_kmeans_two_clusters():
+    """
+    Data that is grouped into high/low should be clusterable into 2
+    """
+
+    n_features = 3
+    # test with both "bytearray" and "array.array"
+    for typecode in ['bytearray', 'B']:
+        dataset, centroids = make_two_cluster_data(typecode)
 
-    assignments = emlkmeans.cluster(dataset, centroids, channels=n_features)
-    assert len(assignments) == len(dataset)/n_features
-    assert list(assignments) == [0, 0, 1, 1], assignments
+        assignments = emlkmeans.cluster(dataset, centroids, channels=n_features)
+        assert len(assignments) == len(dataset)/n_features
+        assert list(assignments) == [0, 0, 1, 1], assignments
 
 
 test_kmeans_two_clusters()