-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathmain.py
More file actions
38 lines (30 loc) · 949 Bytes
/
main.py
File metadata and controls
38 lines (30 loc) · 949 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
import pandas as pd
from model import CartDecisionTree
import pandas as pd
from sklearn.model_selection import train_test_split
def read_data(files: list, sep: str = ";") -> pd.DataFrame:
    """Read several delimited text files and stack them into one DataFrame.

    Args:
        files: Paths (or file-like objects) accepted by ``pd.read_csv``.
        sep: Field delimiter passed to ``pd.read_csv``. Defaults to ``";"``.

    Returns:
        The rows of every input file concatenated in the given order, with a
        fresh ``0..n-1`` index.

    Raises:
        ValueError: If ``files`` is empty.
        FileNotFoundError: If one of the paths does not exist (propagated
            from ``pd.read_csv``).
    """
    paths = list(files)
    if not paths:
        # pd.concat would also raise ValueError here, but with an opaque
        # "No objects to concatenate" message.
        raise ValueError("read_data() requires at least one input file")

    # I/O errors are deliberately not swallowed: a partial or missing frame
    # list cannot be concatenated into a meaningful result.
    frames = [pd.read_csv(path, sep=sep) for path in paths]
    return pd.concat(frames, ignore_index=True)
def clean_data(data: pd.DataFrame) -> pd.DataFrame:
    """Split a frame whose first column holds ``;``-joined fields.

    The first column's *name* is split on ``";"`` to obtain the output column
    names, and every value in that first column is split on ``";"`` to obtain
    one output row. Only the first column of ``data`` is used.

    Args:
        data: Frame whose first column label and values are ``;``-delimited
            strings.

    Returns:
        A new DataFrame with one column per header field and one row per
        input row; all cells are the split string pieces (no type
        conversion is performed).

    Raises:
        ValueError: If a row splits into a different number of fields than
            the header.
    """
    columns = data.columns[0].split(";")

    # Select the first column by position; indexing a label-indexed row with
    # an integer key (row[0]) relies on a deprecated positional fallback.
    rows = [cell.split(";") for cell in data.iloc[:, 0]]

    for position, fields in enumerate(rows):
        if len(fields) != len(columns):
            raise ValueError(
                f"row {position} has {len(fields)} fields, "
                f"expected {len(columns)}"
            )

    # Build the frame in one shot instead of growing it row by row.
    return pd.DataFrame(rows, columns=columns)
def main():
    """Load the cardio CSV and construct a ``CartDecisionTree`` from it.

    Progress messages are printed around each step. The training call itself
    is currently commented out, so the model is only constructed.
    """
    csv_paths = ["cardio_train.csv"]
    # Second constructor argument; presumably the target column name --
    # confirm against model.py.
    target_name = "cardio"

    print("Reading data.......")
    frame = read_data(csv_paths)
    print("Done!")

    tree = CartDecisionTree(frame, target_name)
    print("Training model.....")
    # NOTE: fitting is disabled; the messages around it are still printed.
    # tree.fit()
    print("Done!")
# Run the pipeline only when this file is executed as a script, not when it
# is imported as a module.
if __name__ == "__main__":
    main()