diff --git a/datasist/feature_engineering.py b/datasist/feature_engineering.py index b07ce273..e240262c 100644 --- a/datasist/feature_engineering.py +++ b/datasist/feature_engineering.py @@ -16,7 +16,7 @@ import seaborn as sns -from .structdata import get_cat_feats, get_num_feats, get_date_cols +from datasist.structdata import get_cat_feats, get_num_feats, get_date_cols from dateutil.parser import parse @@ -153,13 +153,13 @@ def fill_missing_num(data=None, num_features=None, method='mean', missing_col=Fa for feat in features: if missing_col: df[feat + '_missing_value'] = (df[feat].isna()).astype('int64') - if method is 'mean': + if method == 'mean': mean = df[feat].mean() df[feat].fillna(mean, inplace=True) - elif method is 'median': + elif method == 'median': median = df[feat].median() df[feat].fillna(median, inplace=True) - elif method is 'mode': + elif method == 'mode': mode = df[feat].mode()[0] df[feat].fillna(mode, inplace=True) else: diff --git a/datasist/visualizations.py b/datasist/visualizations.py index 78aa8aa9..6e673d49 100644 --- a/datasist/visualizations.py +++ b/datasist/visualizations.py @@ -7,7 +7,7 @@ import numpy as np import matplotlib.pyplot as plt import seaborn as sns -from . import structdata +from datasist import structdata from IPython.display import display from sklearn.metrics import confusion_matrix from sklearn.utils.multiclass import unique_labels