mirror of
https://github.com/fenago/data-science.git
synced 2026-05-04 08:31:59 +00:00
32 lines
1008 B
Python
32 lines
1008 B
Python
import unittest
|
|
import import_ipynb
|
|
import pandas as pd
|
|
import pandas.testing as pd_testing
|
|
from sklearn.cluster import KMeans
|
|
|
|
class Test(unittest.TestCase):
    """Compare variables exposed by ``Exercise11_01`` with reference values.

    ``setUp`` rebuilds the expected file path and data frames; each test
    then checks one attribute of the imported exercise module against
    its reference counterpart.
    """

    def setUp(self):
        """Import the exercise module and build the reference fixtures."""
        # The exercise is imported inside the fixture rather than at
        # module level, so it is only loaded once a test actually runs.
        import Exercise11_01 as exercise_module
        self.exercises = exercise_module

        self.file_url = '../dataset/breast-cancer-wisconsin.data'
        self.col_names = [
            'Sample code number',
            'Clump Thickness',
            'Uniformity of Cell Size',
            'Uniformity of Cell Shape',
            'Marginal Adhesion',
            'Single Epithelial Cell Size',
            'Bare Nuclei',
            'Bland Chromatin',
            'Normal Nucleoli',
            'Mitoses',
            'Class',
        ]

        # The file is read without a header row; the column labels are
        # applied afterwards from ``col_names``.
        reference = pd.read_csv(self.file_url, header=None)
        reference.columns = self.col_names
        self.df = reference

        # Reference frame with repeated rows removed (first one kept).
        self.df_unique = reference.drop_duplicates(keep='first')

    def test_file_url(self):
        """The exercise must use the expected dataset path."""
        actual_url = self.exercises.file_url
        self.assertEqual(actual_url, self.file_url)

    def test_df(self):
        """The exercise's ``df`` must equal the reference frame."""
        pd_testing.assert_frame_equal(left=self.exercises.df, right=self.df)

    def test_df_unique(self):
        """The exercise's ``df_unique`` must equal the de-duplicated frame."""
        pd_testing.assert_frame_equal(
            left=self.exercises.df_unique,
            right=self.df_unique,
        )
|
|
|
|
# Run the test suite only when this file is executed as a script,
# not when it is imported by another module or a test runner.
if __name__ == '__main__':
    unittest.main()
|