diff --git a/tensnsorflow/feature_engineering.py b/tensnsorflow/feature_engineering.py index b06045834b2c1e3f71e75ed1b8f3a9d86537f45d..c42dde9f0664e8687af81c7e342e71e0fd2c30cb 100644 --- a/tensnsorflow/feature_engineering.py +++ b/tensnsorflow/feature_engineering.py @@ -47,6 +47,7 @@ def get_data(): df = df.drop_duplicates(["ucity_id", "clevel1_id", "ccity_name", "device_type", "manufacturer", "channel", "top", "l1","l2", "time", "stat_date"]) print(df.shape) + print(df.count()) unique_values = [] features = ["ucity_id", "clevel1_id", "ccity_name", "device_type", "manufacturer",