subhadarship
diff --git a/‎.ipynb_checkpoints/batch_processing-checkpoint.ipynb
+334 b/‎.ipynb_checkpoints/batch_processing-checkpoint.ipynb
+334
diff --git a/‎.ipynb_checkpoints/cpu_vs_gpu-checkpoint.ipynb
+364 b/‎.ipynb_checkpoints/cpu_vs_gpu-checkpoint.ipynb
+364
diff --git a/‎.ipynb_checkpoints/example-checkpoint.ipynb
+343 b/‎.ipynb_checkpoints/example-checkpoint.ipynb
+343
diff --git a/‎batch_processing.ipynb
+334 b/‎batch_processing.ipynb
+334
diff --git a/‎cpu_vs_gpu.ipynb
+357-346 b/‎cpu_vs_gpu.ipynb
+357-346
diff --git a/‎example.ipynb
+334-323 b/‎example.ipynb
+334-323
diff --git a/‎kmeans_pytorch/.ipynb_checkpoints/__init__-checkpoint.py
+173 b/‎kmeans_pytorch/.ipynb_checkpoints/__init__-checkpoint.py
+173
diff --git a/‎kmeans_pytorch/.ipynb_checkpoints/main-checkpoint.py
+12 b/‎kmeans_pytorch/.ipynb_checkpoints/main-checkpoint.py
+12
diff --git a/‎kmeans_pytorch/__init__.py
+16-2 b/‎kmeans_pytorch/__init__.py
+16-2
@@ -0,0 +1,173 @@
+import numpy as np
+import torch
+from tqdm import tqdm
+
+# ToDo: Can't choose a cluster if two points are too close to each other, that's where the nan come from
+
+
+def initialize(X, num_clusters):
+    """
+    initialize cluster centers
+    :param X: (torch.tensor) matrix
+    :param num_clusters: (int) number of clusters
+    :return: (np.array) initial state
+    """
+    num_samples = len(X)
+    indices = np.random.choice(num_samples, num_clusters, replace=False)
+    initial_state = X[indices]
+    return initial_state
+
+
+def kmeans(
+        X,
+        num_clusters,
+        distance='euclidean',
+        cluster_centers = [],
+        tol=1e-4,
+        device=torch.device('cpu')
+):
+    """
+    perform kmeans
+    :param X: (torch.tensor) matrix
+    :param num_clusters: (int) number of clusters
+    :param distance: (str) distance [options: 'euclidean', 'cosine'] [default: 'euclidean']
+    :param tol: (float) threshold [default: 0.0001]
+    :param device: (torch.device) device [default: cpu]
+    :return: (torch.tensor, torch.tensor) cluster ids, cluster centers
+    """
+    print(f'running k-means on {device}..')
+
+    if distance == 'euclidean':
+        pairwise_distance_function = pairwise_distance
+    elif distance == 'cosine':
+        pairwise_distance_function = pairwise_cosine
+    else:
+        raise NotImplementedError
+
+    # convert to float
+    X = X.float()
+
+    # transfer to device
+    X = X.to(device)
+
+    # initialize
+    if type(cluster_centers) == list: #ToDo: make this less annoyingly weird
+        initial_state = initialize(X, num_clusters)
+    else:
+        print('resuming')
+        # find data point closest to the initial cluster center
+        initial_state = cluster_centers
+        dis = pairwise_distance_function(X, initial_state)
+        choice_points = torch.argmin(dis, dim=0)
+        initial_state = X[choice_points]
+        initial_state = initial_state.to(device)
+        
+    iteration = 0
+    tqdm_meter = tqdm(desc='[running kmeans]')
+    while True:
+        
+        dis = pairwise_distance_function(X, initial_state)
+
+        choice_cluster = torch.argmin(dis, dim=1)
+
+        initial_state_pre = initial_state.clone()
+
+        for index in range(num_clusters):
+            selected = torch.nonzero(choice_cluster == index).squeeze().to(device)
+
+            selected = torch.index_select(X, 0, selected)
+
+            initial_state[index] = selected.mean(dim=0)
+
+        center_shift = torch.sum(
+            torch.sqrt(
+                torch.sum((initial_state - initial_state_pre) ** 2, dim=1)
+            ))
+
+        # increment iteration
+        iteration = iteration + 1
+
+        # update tqdm meter
+        tqdm_meter.set_postfix(
+            iteration=f'{iteration}',
+            center_shift=f'{center_shift ** 2:0.6f}',
+            tol=f'{tol:0.6f}'
+        )
+        tqdm_meter.update()
+        if center_shift ** 2 < tol:
+            break
+
+    return choice_cluster.cpu(), initial_state.cpu()
+
+
+def kmeans_predict(
+        X,
+        cluster_centers,
+        distance='euclidean',
+        device=torch.device('cpu')
+):
+    """
+    predict using cluster centers
+    :param X: (torch.tensor) matrix
+    :param cluster_centers: (torch.tensor) cluster centers
+    :param distance: (str) distance [options: 'euclidean', 'cosine'] [default: 'euclidean']
+    :param device: (torch.device) device [default: 'cpu']
+    :return: (torch.tensor) cluster ids
+    """
+    print(f'predicting on {device}..')
+
+    if distance == 'euclidean':
+        pairwise_distance_function = pairwise_distance
+    elif distance == 'cosine':
+        pairwise_distance_function = pairwise_cosine
+    else:
+        raise NotImplementedError
+
+    # convert to float
+    X = X.float()
+
+    # transfer to device
+    X = X.to(device)
+
+    dis = pairwise_distance_function(X, cluster_centers)
+    choice_cluster = torch.argmin(dis, dim=1)
+
+    return choice_cluster.cpu()
+
+
+def pairwise_distance(data1, data2, device=torch.device('cpu')):
+    # transfer to device
+    data1, data2 = data1.to(device), data2.to(device)
+
+    # N*1*M
+    A = data1.unsqueeze(dim=1)
+
+    # 1*N*M
+    B = data2.unsqueeze(dim=0)
+
+    dis = (A - B) ** 2.0
+    # return N*N matrix for pairwise distance
+    dis = dis.sum(dim=-1).squeeze()
+    return dis
+
+
+def pairwise_cosine(data1, data2, device=torch.device('cpu')):
+    # transfer to device
+    data1, data2 = data1.to(device), data2.to(device)
+
+    # N*1*M
+    A = data1.unsqueeze(dim=1)
+
+    # 1*N*M
+    B = data2.unsqueeze(dim=0)
+
+    # normalize the points  | [0.3, 0.4] -> [0.3/sqrt(0.09 + 0.16), 0.4/sqrt(0.09 + 0.16)] = [0.3/0.5, 0.4/0.5]
+    A_normalized = A / A.norm(dim=-1, keepdim=True)
+    B_normalized = B / B.norm(dim=-1, keepdim=True)
+
+    cosine = A_normalized * B_normalized
+
+    # return N*N matrix for pairwise distance
+    cosine_dis = 1 - cosine.sum(dim=-1).squeeze()
+    return cosine_dis
+
@@ -0,0 +1,12 @@
+#!/usr/bin/env python
+# -*- coding: utf-8 -*-
+
+__version__ = "0.3"
+
+
+def main():
+    print("TODO")
+
+
+if __name__ == "__main__":
+    main()
@@ -2,6 +2,8 @@
 import torch
 from tqdm import tqdm
 
+# ToDo: Can't choose a cluster if two points are too close to each other, that's where the nan come from
+
 
 def initialize(X, num_clusters):
     """
@@ -20,6 +22,7 @@ def kmeans(
         X,
         num_clusters,
         distance='euclidean',
+        cluster_centers = [],
         tol=1e-4,
         device=torch.device('cpu')
 ):
@@ -48,11 +51,21 @@ def kmeans(
     X = X.to(device)
 
     # initialize
-    initial_state = initialize(X, num_clusters)
-
+    if type(cluster_centers) == list: #ToDo: make this less annoyingly weird
+        initial_state = initialize(X, num_clusters)
+    else:
+        print('resuming')
+        # find data point closest to the initial cluster center
+        initial_state = cluster_centers
+        dis = pairwise_distance_function(X, initial_state)
+        choice_points = torch.argmin(dis, dim=0)
+        initial_state = X[choice_points]
+        initial_state = initial_state.to(device)
+        
     iteration = 0
     tqdm_meter = tqdm(desc='[running kmeans]')
     while True:
+        
         dis = pairwise_distance_function(X, initial_state)
 
         choice_cluster = torch.argmin(dis, dim=1)
@@ -63,6 +76,7 @@ def kmeans(
             selected = torch.nonzero(choice_cluster == index).squeeze().to(device)
 
             selected = torch.index_select(X, 0, selected)
+
             initial_state[index] = selected.mean(dim=0)
 
         center_shift = torch.sum(