Commit 9cebd53e authored by 张彦钊's avatar 张彦钊

add app list

parent bdbaab40
...@@ -15,6 +15,13 @@ def con_sql(db,sql): ...@@ -15,6 +15,13 @@ def con_sql(db,sql):
db.close() db.close()
return df return df
def is_json(myjson):
    """Return True if *myjson* parses as a JSON document, otherwise False.

    Values that are not text (for example ``None`` or a number) are
    reported as False rather than raising, so the function can be used
    directly as a filter predicate.
    """
    try:
        json.loads(myjson)
    except (ValueError, TypeError):
        # ValueError covers json.JSONDecodeError (malformed text);
        # TypeError is raised when the value is not str/bytes/bytearray.
        return False
    return True
def json_format(x):
    """Return the set of ``appName`` values found in the JSON text *x*.

    *x* is expected to decode to a list of objects that each carry an
    ``"appName"`` key. Input that decodes to something other than a list,
    and list entries that are not objects with that key, contribute
    nothing, so valid JSON of an unexpected shape yields an empty set
    instead of raising ``TypeError``/``KeyError``.

    Raises:
        ValueError: if *x* is not valid JSON (propagated from json.loads).
    """
    entries = json.loads(x)
    if not isinstance(entries, list):
        return set()
    return {
        entry["appName"]
        for entry in entries
        if isinstance(entry, dict) and "appName" in entry
    }
...@@ -24,7 +31,7 @@ def sort_app(): ...@@ -24,7 +31,7 @@ def sort_app():
sql = "select device_id,app_list from device_id_applist limit 20000" sql = "select device_id,app_list from device_id_applist limit 20000"
df = con_sql(db, sql).dropna() df = con_sql(db, sql).dropna()
df = df.rename(columns={0: "device_id", 1: "app_list"}) df = df.rename(columns={0: "device_id", 1: "app_list"})
df = df.loc[df["app_list"].str.startswith('[{"appName":')] df = df.loc[df["app_list"].apply(is_json)]
category = {"competitor":{"新氧微整形", "新氧SoYoung"}, category = {"competitor":{"新氧微整形", "新氧SoYoung"},
"dianshang":{"京东","淘宝","唯品会","天猫","苏宁易购","国美","当当","亚马逊","网易严选","小米有品"}, "dianshang":{"京东","淘宝","唯品会","天猫","苏宁易购","国美","当当","亚马逊","网易严选","小米有品"},
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment