diff --git a/src/k_medoids_model.py b/src/k_medoids_model.py
new file mode 100644
index 0000000..53889de
--- /dev/null
+++ b/src/k_medoids_model.py
@@ -0,0 +1,206 @@
+import sys
+import numpy as np
+import matplotlib.pyplot as plt
+
+class KMedoidsModel():
+    # class variables
+
+    non_2d_data             = 'Data must be two-dimensional in order to plot'
+    non_numpy_array         = 'Data must be in the form of a numpy array'
+    non_positive_integer    = 'must be an integer greater than zero'
+    positive_integer_params = ['clusters', 'initializations', 'iterations']
+    shape_mismatch          = 'Shape of point does not match training data'
+    too_many_clusters       = 'Clusters outnumber data points'
+    zero_element_array      = 'Numpy array must contain at least one element'
+
+    # main method
+
+    def __init__(self, data, clusters, initializations = 10, iterations = 300, plot = False):
+        # model parameters are set as instance variables
+        self.data = data
+        self.clusters = clusters
+        self.iterations = iterations
+        self.initializations = initializations
+
+        self.validate_parameters()
+
+        # get distances between points once in advance as proposed in the abstract of
+        # https://www.sciencedirect.com/science/article/pii/S095741740800081X
+        self.distances = self.calculate_distance_matrix()
+
+        self.run()
+
+        if plot:
+            self.plot()
+
+    # parameter validation methods
+
+    def validate_parameters(self):
+        self.validate_data()
+        self.validate_clusters()
+        for parameter in KMedoidsModel.positive_integer_params:
+            self.validate_positive_integer_parameter(parameter)
+
+    def validate_data(self):
+        KMedoidsModel.raise_exception_for(ValueError, type(self.data) != np.ndarray, KMedoidsModel.non_numpy_array)
+        KMedoidsModel.raise_exception_for(ValueError, len(self.data) < 1, KMedoidsModel.zero_element_array)
+
+    def validate_clusters(self):
+        KMedoidsModel.raise_exception_for(
+            ValueError,
+            self.data.shape[0] < self.clusters,
+            "{}: {} > {}".format(KMedoidsModel.too_many_clusters, self.clusters, self.data.shape[0])
+        )
+
+    def validate_positive_integer_parameter(self, parameter):
+        KMedoidsModel.raise_exception_for(
+            ValueError,
+            vars(self)[parameter] < 1 or vars(self)[parameter] != int(vars(self)[parameter]),
+            "{} {}".format(parameter.capitalize(), KMedoidsModel.non_positive_integer)
+        )
+
+    # distance methods
+
+    def calculate_distance_matrix(self):
+        distance_matrix = np.zeros((self.data.shape[0], self.data.shape[0]))
+        # since matrix is symmetric with zeros in the diagonal we only need to
+        # calculate half of the off-diagonal elements:
+        for i in range(0, len(self.data)):
+            for j in range(i + 1, len(self.data)):
+                distance = np.linalg.norm(self.data[i] - self.data[j])
+                distance_matrix[i][j] = distance_matrix[j][i] = distance
+        return distance_matrix
+
+    # k-medoids algorithm methods
+
+    def run(self):
+        # as we iterate we keep track of the best model as measured by cost: the sum
+        # of absolute distances between medoids and their corresponding cluster
+        # "subscribers"
+        best_cost = sys.maxsize
+        best_labels_with_medoid_distances = None
+        best_medoids = None
+        # since this algorithm's outcome is sensitive to medoid initialization,
+        # we will run it multiple times with random initializations and choose
+        # the model that has the best cost
+        for initialization in range(0, self.initializations):
+            self.medoids = self.randomly_initialize_medoids()
+            # assign initial clusters to the data points by running an initial expectation step
+            self.labels_with_medoid_distances, self.cost = self.run_expectation_step()
+            # on each iteration find better medoids by running a maximization step
+            # followed by re-drawing the clusters with an expectation step
+            for iteration in range(0, self.iterations):
+                new_medoids = self.run_maximization_step()
+                # if the medoids are the same as the previous iteration, we have
+                # not found better medoids and we should stop iterating
+                if np.array_equal(new_medoids, self.medoids):
+                    break
+                self.medoids = new_medoids
+                self.labels_with_medoid_distances, self.cost = self.run_expectation_step()
+            # update the best running totals if, after the iterations, there are better values
+            if self.cost < best_cost:
+                best_cost = self.cost
+                best_labels_with_medoid_distances = self.labels_with_medoid_distances
+                best_medoids = self.medoids
+        # set the model as the one with best cost
+        self.cost = best_cost
+        self.labels_with_medoid_distances = best_labels_with_medoid_distances
+        self.medoids = best_medoids
+
+    def randomly_initialize_medoids(self):
+        return np.random.choice(self.data.shape[0], self.clusters, replace = False)
+
+    def run_expectation_step(self):
+        # for each data point, we calculate the closest medoid, the distance to it,
+        # and the total cost resulting from this choice of medoids
+        labels_with_medoid_distances = np.zeros((self.data.shape[0], 2))
+        cost = 0
+        for datapoint_index in range(0, len(self.distances)):
+            closest_medoid_distance = sys.maxsize
+            closest_medoid_index = -1
+            for medoid_index in self.medoids:
+                if self.distances[datapoint_index][medoid_index] < closest_medoid_distance:
+                    closest_medoid_distance = self.distances[datapoint_index][medoid_index]
+                    closest_medoid_index = medoid_index
+            labels_with_medoid_distances[datapoint_index] = [closest_medoid_index, closest_medoid_distance]
+            cost += closest_medoid_distance
+        return labels_with_medoid_distances, cost
+
+    def run_maximization_step(self):
+        # this method's goal is to return medoids that improve the cost within each
+        # cluster (which means we can end up with the same medoids) by randomly trying
+        # new medoids and comparing the resulting cost for each cluster
+        new_medoids = np.copy(self.medoids)
+        for index, current_medoid in enumerate(self.medoids):
+            subscribers_indeces = np.where(self.labels_with_medoid_distances[:, 0] == current_medoid)[0]
+            cluster_cost_before = KMedoidsModel.sum_second_column(
+                self.labels_with_medoid_distances[subscribers_indeces]
+            )
+            # randomly choose the next candidates to replace the cluster's medoid
+            # from the pool of cluster subscribers
+            index_of_new_medoid = -1
+            for candidate in KMedoidsModel.shuffle_array(subscribers_indeces):
+                change_in_cluster_cost = 0
+                cluster_cost_after = 0
+                # calculate the cluster cost using the current candidate as medoid
+                for subscriber_index in subscribers_indeces:
+                    cluster_cost_after += self.distances[subscriber_index][candidate]
+                change_in_cluster_cost = cluster_cost_after - cluster_cost_before
+                # if candidate improves cluster cost, assign it to replace current medoid
+                # and stop iterating
+                if change_in_cluster_cost < 0:
+                    index_of_new_medoid = candidate
+                    break
+            if index_of_new_medoid > -1:
+                new_medoids[index] = index_of_new_medoid
+        return new_medoids
+
+    # plotting methods
+
+    def plot(self,
+             xlabel = 'x',
+             ylabel = 'y',
+             title = '',
+             figsize = (8, 6),
+             edgecolor = 'black',
+             lw = 1.5,
+             s = 100,
+             cmap = plt.get_cmap('viridis')):
+        self.validate_two_dimensionality()
+        plt.figure(figsize = figsize)
+        plt.scatter(self.data[:, 0], self.data[:, 1], c = self.labels_with_medoid_distances[:, 0],
+                    edgecolor = edgecolor, lw = lw, s = s, cmap = cmap)
+        plt.xlabel(xlabel)
+        plt.ylabel(ylabel)
+        plt.title(title)
+        plt.show()
+
+    def validate_two_dimensionality(self):
+        KMedoidsModel.raise_exception_for(ValueError, self.data.shape[1] != 2, KMedoidsModel.non_2d_data)
+
+    # prediction methods
+
+    def predict_cluster(self, point):
+        self.validate_shape_of_new_point(point)
+        best_medoid, best_distance = None, sys.maxsize
+        for medoid in self.medoids:
+            distance = np.linalg.norm(self.data[medoid] - point)
+            if best_distance > distance:
+                best_medoid, best_distance = medoid, distance
+        return best_medoid, best_distance
+
+    def validate_shape_of_new_point(self, point):
+        KMedoidsModel.raise_exception_for(ValueError, point.shape != self.data[0].shape, KMedoidsModel.shape_mismatch)
+
+    # class methods
+
+    def sum_second_column(data_with_at_least_2_columns):
+        return np.sum(data_with_at_least_2_columns, axis=0)[1]
+
+    def shuffle_array(array):
+        shuffled_array = np.copy(array)
+        np.random.shuffle(shuffled_array)
+        return shuffled_array
+
+    def raise_exception_for(exception_type, condition, error_string):
+        if condition: raise exception_type(error_string)
diff --git a/test/test_k_medoids_model.py b/test/test_k_medoids_model.py
new file mode 100644
index 0000000..6609bcf
--- /dev/null
+++ b/test/test_k_medoids_model.py
@@ -0,0 +1,210 @@
+import unittest
+import numpy as np
+
+from src.k_medoids_model import KMedoidsModel
+
+class TestKMedoidsModel(unittest.TestCase):
+    # class variables pre-load models and datasets used in tests
+
+    model_1   = KMedoidsModel(np.array([[0, 0  ], [0.03, 0.01  ], [0.1, -0.4  ], [-0.47, -0.09], [-0.33, 0.4 ],
+                                        [1, 1  ], [1.03, 1.01  ], [1.1, 0.7   ], [0.77, 0.91  ], [0.88, 1.2  ],
+                                        [-1, -1], [-1.05, -1.03], [-1.2, -0.68], [-0.67, -0.93], [-0.89, -1.3],
+                                        [-1, 1 ], [-1.1, 1.12  ], [-1.23, 0.59], [-0.68, 0.75 ], [-0.93, 1.21],
+                                        [1, -1 ], [1.15, -1.23 ], [0.85, -1.14], [0.77, -0.87 ], [1.45, -0.9]]), 5)
+    model_2   = KMedoidsModel(np.array([[7, 6], [2, 6], [3, 8], [8, 5], [7, 4],
+                                        [4, 7], [6, 2], [7, 3], [6, 4], [3, 4]]), 2)
+    dataset_1 = np.array([[0, 0], [1, 1], [-1, -1], [-1, 1], [1, -1]])
+    model_3   = KMedoidsModel(dataset_1, 3)
+
+    # validation tests
+
+    def test_no_arguments(self):
+        with self.assertRaises(TypeError) as context:
+            KMedoidsModel()
+        self.assertTrue("__init__() missing 2 required positional arguments: 'data' and 'clusters'" in str(context.exception))
+
+    def test_missing_arguments(self):
+        with self.assertRaises(TypeError) as context:
+            KMedoidsModel(np.array([[1, 2], [3, 4], [5, 6]]))
+        self.assertTrue("__init__() missing 1 required positional argument: 'clusters'" in str(context.exception))
+        with self.assertRaises(TypeError) as context:
+            KMedoidsModel(clusters = 5)
+        self.assertTrue("__init__() missing 1 required positional argument: 'data'" in str(context.exception))
+
+    def test_non_numpy_array(self):
+        with self.assertRaises(ValueError) as context:
+            KMedoidsModel([[1, 2], [3, 4], [5, 6]], 2)
+        self.assertTrue('Data must be in the form of a numpy array' in str(context.exception))
+
+    def test_zero_element_array(self):
+        with self.assertRaises(ValueError) as context:
+            KMedoidsModel(np.array([]), 2)
+        self.assertTrue('Numpy array must contain at least one element' in str(context.exception))
+
+    def test_negative_clusters(self):
+        with self.assertRaises(ValueError) as context:
+            KMedoidsModel(np.array([[1, 2], [3, 4], [5, 6]]), - 2)
+        self.assertTrue('Clusters must be an integer greater than zero' in str(context.exception))
+
+    def test_float_clusters(self):
+        with self.assertRaises(ValueError) as context:
+            KMedoidsModel(np.array([[1, 2], [3, 4], [5, 6]]), 1.2)
+        self.assertTrue('Clusters must be an integer greater than zero' in str(context.exception))
+
+    def test_negative_iterations(self):
+        with self.assertRaises(ValueError) as context:
+            KMedoidsModel(np.array([[1, 2], [3, 4], [5, 6]]), 2, iterations = - 10)
+        self.assertTrue('Iterations must be an integer greater than zero' in str(context.exception))
+
+    def test_float_iterations(self):
+        with self.assertRaises(ValueError) as context:
+            KMedoidsModel(np.array([[1, 2], [3, 4], [5, 6]]), 2, iterations = 10.4)
+        self.assertTrue('Iterations must be an integer greater than zero' in str(context.exception))
+
+    def test_negative_initializations(self):
+        with self.assertRaises(ValueError) as context:
+            KMedoidsModel(np.array([[1, 2], [3, 4], [5, 6]]), 2, initializations = - 10)
+        self.assertTrue('Initializations must be an integer greater than zero' in str(context.exception))
+
+    def test_float_initializations(self):
+        with self.assertRaises(ValueError) as context:
+            KMedoidsModel(np.array([[1, 2], [3, 4], [5, 6]]), 2, initializations = 10.6)
+        self.assertTrue('Initializations must be an integer greater than zero' in str(context.exception))
+
+    def test_too_many_clusters(self):
+        with self.assertRaises(ValueError) as context:
+            KMedoidsModel(np.array([[1, 2], [3, 4], [5, 6]]), 4)
+        self.assertTrue('Clusters outnumber data points: 4 > 3' in str(context.exception))
+
+    def test_plotting_non_2_d(self):
+        with self.assertRaises(ValueError) as context:
+            KMedoidsModel(np.array([[1, 2, 2], [3, 4, 7], [5, 6, 1]]), 2, plot=True)
+        self.assertTrue('Data must be two-dimensional in order to plot' in str(context.exception))
+
+    def test_raise_exception_for(self):
+        with self.assertRaises(AttributeError) as context:
+            KMedoidsModel.raise_exception_for(AttributeError, True,  'Testing')
+        self.assertTrue('Testing' in str(context.exception))
+
+    def test_predict_cluster_error(self):
+        model = TestKMedoidsModel.model_3
+        with self.assertRaises(ValueError) as context:
+            model.predict_cluster(np.array([1, 2, 3]))
+        self.assertTrue('Shape of point does not match training data' in str(context.exception))
+
+    # distance tests
+
+    def test_calculate_distance_matrix(self):
+        model = KMedoidsModel(TestKMedoidsModel.dataset_1, 4)
+        true_distances = np.array([[ 0.        , 1.41421356, 1.41421356, 1.41421356, 1.41421356],
+                                   [ 1.41421356, 0.        , 2.82842712, 2.        , 2.        ],
+                                   [ 1.41421356, 2.82842712, 0.        , 2.        , 2.        ],
+                                   [ 1.41421356, 2.        , 2.        , 0.        , 2.82842712],
+                                   [ 1.41421356, 2.        , 2.        , 2.82842712, 0.        ]])
+        self.assertTrue(np.allclose(model.distances, true_distances, rtol = 1e-05, atol = 1e-08))
+        self.assertTrue(np.allclose(model.calculate_distance_matrix(), true_distances, rtol = 1e-05, atol = 1e-08))
+
+    # KMedoidsModel class methods tests
+
+    def test_sum_second_column(self):
+        self.assertEqual(KMedoidsModel.sum_second_column(np.array([[ 1., 1  ], [ 1., 2 ], [ 1., 3]])), 6.0)
+        self.assertEqual(KMedoidsModel.sum_second_column(np.array([[ 1., 1  ], [ 1., -2], [ 1., 1]])), 0.0)
+        self.assertEqual(KMedoidsModel.sum_second_column(np.array([[ 1., 5.6], [ 1., 23], [ 1., 0]])), 28.6)
+        self.assertEqual(KMedoidsModel.sum_second_column(np.array([[ 1., 0  ], [ 1., 0 ], [ 1., 0]])), 0.0)
+        self.assertEqual(KMedoidsModel.sum_second_column(np.array([[ 1., -1 ], [ 1., -2], [ 1., -3]])), - 6.0)
+
+    def test_shuffle_array(self):
+        original_array = np.array([1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20])
+        self.assertFalse(np.array_equal(original_array, KMedoidsModel.shuffle_array(original_array)))
+
+    # k-medoids algorithm tests
+
+    def test_initialize_medoids(self):
+        model = TestKMedoidsModel.model_3
+        self.assertEqual(len(model.medoids), 3)
+        self.assertEqual(model.medoids[0] >= 0, True)
+        self.assertEqual(model.medoids[1] >= 0, True)
+        self.assertEqual(model.medoids[2] >= 0, True)
+        self.assertEqual(model.medoids[0] < 5,  True)
+        self.assertEqual(model.medoids[1] < 5,  True)
+        self.assertEqual(model.medoids[2] < 5,  True)
+        self.assertEqual(model.medoids[0] != model.medoids[1] != model.medoids[2], True)
+
+    def test_run_expectation_step(self):
+        model = TestKMedoidsModel.model_3
+        model.medoids = np.array([1, 2, 4])
+        true_labels_with_medoid_distances = np.array([[ 1., 1.41421356],
+                                                      [ 1., 0.        ],
+                                                      [ 2., 0.        ],
+                                                      [ 1., 2.        ],
+                                                      [ 4., 0.        ]])
+        self.assertTrue(np.allclose(model.run_expectation_step()[0], true_labels_with_medoid_distances, rtol = 1e-05, atol = 1e-08))
+        self.assertTrue(np.allclose(model.run_expectation_step()[1], 3.41421356, rtol = 1e-05, atol = 1e-08))
+
+    def test_run(self):
+        model = TestKMedoidsModel.model_1
+        medoids = model.medoids.sort()
+        true_medoids = np.array([0, 15, 20, 10,  5]).sort()
+        self.assertEqual(round(model.cost, 2), 5.82)
+        self.assertTrue(np.array_equal(medoids, true_medoids))
+        self.assertTrue(np.allclose(model.labels_with_medoid_distances, np.array([[  0., 0.        ],
+                                                                                  [  0., 0.03162278],
+                                                                                  [  0., 0.41231056],
+                                                                                  [  0., 0.47853944],
+                                                                                  [  0., 0.51855569],
+                                                                                  [  5., 0.        ],
+                                                                                  [  5., 0.03162278],
+                                                                                  [  5., 0.31622777],
+                                                                                  [  5., 0.24698178],
+                                                                                  [  5., 0.23323808],
+                                                                                  [ 10., 0.        ],
+                                                                                  [ 10., 0.05830952],
+                                                                                  [ 10., 0.37735925],
+                                                                                  [ 10., 0.33734256],
+                                                                                  [ 10., 0.31953091],
+                                                                                  [ 15., 0.        ],
+                                                                                  [ 15., 0.15620499],
+                                                                                  [ 15., 0.47010637],
+                                                                                  [ 15., 0.40607881],
+                                                                                  [ 15., 0.22135944],
+                                                                                  [ 20., 0.        ],
+                                                                                  [ 20., 0.2745906 ],
+                                                                                  [ 20., 0.20518285],
+                                                                                  [ 20., 0.2641969 ],
+                                                                                  [ 20., 0.46097722]]), rtol = 1e-05, atol = 1e-08))
+        model = TestKMedoidsModel.model_2
+        medoids = model.medoids.sort()
+        true_medoids = np.array([4, 1]).sort()
+        self.assertEqual(round(model.cost, 2), 14.36)
+        self.assertTrue(np.array_equal(medoids, true_medoids))
+        self.assertTrue(np.allclose(model.labels_with_medoid_distances, np.array([[ 4., 2.        ],
+                                                                                  [ 1., 0.        ],
+                                                                                  [ 1., 2.23606798],
+                                                                                  [ 4., 1.41421356],
+                                                                                  [ 4., 0.        ],
+                                                                                  [ 1., 2.23606798],
+                                                                                  [ 4., 2.23606798],
+                                                                                  [ 4., 1.        ],
+                                                                                  [ 4., 1.        ],
+                                                                                  [ 1., 2.23606798]]), rtol = 1e-05, atol = 1e-08))
+
+    # prediction tests
+
+    def test_predict_cluster(self):
+        self.assertEqual(TestKMedoidsModel.model_1.predict_cluster(np.array([1, 2])), (5, 1.0))
+
+    # visual inspection tests (commented out as they may get annoying- uncomment to enable)
+
+    # def test_visual_inspection(self):
+    #     TestKMedoidsModel.visually_inspect(self, TestKMedoidsModel.model_1, 1)
+    #     TestKMedoidsModel.visually_inspect(self, TestKMedoidsModel.model_2, 2)
+    #
+    # def visually_inspect(class_self, model, number):
+    #     visually_inspect_model = input('\n Enter 1 if you wish to visually inspect model {}, and any key otherwise \n'.format(number))
+    #     if visually_inspect_model == '1':
+    #         model.plot(title = 'Inspect model {} using data in test/test_k_medoids_model.py and then close this window'.format(number))
+    #         model_visual_evaluation = input('\n Enter 1 if you think model {} looks good, and any key otherwise \n'.format(number))
+    #         class_self.assertTrue(model_visual_evaluation == '1')
+
+if __name__ == "__main__":
+    unittest.main()