Commit 7a5e54d0 authored by 张彦钊

删除歧义样本

parent bbc59eed
......@@ -166,6 +166,8 @@ def get_data():
print(df.shape)
print("after")
df = df.drop_duplicates()
df = df.drop_duplicates(["ucity_id", "clevel1_id", "ccity_name", "device_type", "manufacturer",
"channel", "top", "level2_ids", "time","stat_date"])
print(df.shape)
df["clevel1_id"] = df["clevel1_id"].astype("str")
......
Markdown is supported
0% Try again or attach a new file
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment