Commit 129c754d authored by 张彦钊

修改str cat函数

parent 5108fe8e
...@@ -21,7 +21,7 @@ def con_sql(db,sql): ...@@ -21,7 +21,7 @@ def con_sql(db,sql):
def get_data(): def get_data():
db = pymysql.connect(host='10.66.157.22', port=4000, user='root', passwd='3SYz54LS9#^9sBvC', db='jerry_prod') db = pymysql.connect(host='10.66.157.22', port=4000, user='root', passwd='3SYz54LS9#^9sBvC', db='jerry_prod')
sql = "select * from esmm_data where stat_date >= '2018-11-20'" sql = "select * from esmm_data where stat_date >= '2018-11-20' limit 6"
esmm = con_sql(db,sql) esmm = con_sql(db,sql)
esmm = esmm.rename(columns={0:"stat_date",1: "device_id",2:"ucity_id",3:"cid_id",4:"diary_service_id",5:"y", esmm = esmm.rename(columns={0:"stat_date",1: "device_id",2:"ucity_id",3:"cid_id",4:"diary_service_id",5:"y",
6:"z",7:"clevel1_id",8:"slevel1_id"}) 6:"z",7:"clevel1_id",8:"slevel1_id"})
...@@ -29,7 +29,7 @@ def get_data(): ...@@ -29,7 +29,7 @@ def get_data():
print(esmm.head()) print(esmm.head())
print(esmm.shape) print(esmm.shape)
db = pymysql.connect(host='10.66.157.22', port=4000, user='root', passwd='3SYz54LS9#^9sBvC', db='eagle') db = pymysql.connect(host='10.66.157.22', port=4000, user='root', passwd='3SYz54LS9#^9sBvC', db='eagle')
sql = "select * from home_tab_click" sql = "select * from home_tab_click limit 6"
temp = con_sql(db,sql) temp = con_sql(db,sql)
temp = temp.rename(columns={0: "device_id"}) temp = temp.rename(columns={0: "device_id"})
print("click data ok") print("click data ok")
...@@ -63,7 +63,7 @@ def transform(df,table): ...@@ -63,7 +63,7 @@ def transform(df,table):
df["diary_id"] = df[0].apply(lambda x: x.split(",")[2]) df["diary_id"] = df[0].apply(lambda x: x.split(",")[2])
df["seq"] = list(range(df.shape[0])) df["seq"] = list(range(df.shape[0]))
df["seq"] = df["seq"].astype("str") df["seq"] = df["seq"].astype("str")
df["ffm"] = df[0].apply(lambda x: x.split(",")[3:]) df["ffm"] = df[0].apply(lambda x: ",".join(x.split(",")[3:]))
df["ffm"] = df["seq"].str.cat(df["ffm"], sep=",") df["ffm"] = df["seq"].str.cat(df["ffm"], sep=",")
df["random"] = np.random.randint(1, 2147483647, df.shape[0]) df["random"] = np.random.randint(1, 2147483647, df.shape[0])
df = df.drop(0, axis=1).drop("seq",axis=1) df = df.drop(0, axis=1).drop("seq",axis=1)
......
Markdown is supported
0% Try again or attach a new file
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment