Commit 1cc20431 authored by litaolemo

update

parent 20dd3f76
......@@ -132,6 +132,7 @@ for t in range(1, task_days):
# Log the generated device-id SQL before executing it.
print(sql_dev_device_id)
dev_df = spark.sql(sql_dev_device_id)
# Register the result as temp view "dev_view"; the reporting SQL later joins against it.
# NOTE(review): createOrReplaceTempView presumably returns None, so dev_df_view is
# likely always None — confirm whether the name is used anywhere.
dev_df_view = dev_df.createOrReplaceTempView("dev_view")
# Mark the DataFrame for caching ahead of the show()/collect() calls below.
# NOTE(review): intent is presumably to avoid recomputing the query for each use — confirm.
dev_df.cache()
# Print a single row as a quick sanity check.
dev_df.show(1)
# Fetch the rows into sql_res for the loop that follows.
sql_res = dev_df.collect()
for res in sql_res:
......@@ -154,6 +155,7 @@ for t in range(1, task_days):
# Register the spam page-view result as temp view "spam_pv"; the reporting SQL
# later filters on spam_pv.device_id.
# NOTE(review): createOrReplaceTempView presumably returns None, so spam_pv_view is
# likely always None; the assignment is kept in case the name is referenced elsewhere.
spam_pv_view = spam_pv_df.createOrReplaceTempView("spam_pv")
# Mark the DataFrame for caching BEFORE the first action. cache() is lazy, so calling
# it after show()/collect() (as before) meant neither of those actions could reuse
# cached data. This also matches the ordering used for dev_df.
spam_pv_df.cache()
# Print a single row as a quick sanity check.
spam_pv_df.show(1)
# Fetch the rows into sql_res for the loop that follows.
sql_res = spam_pv_df.collect()
for res in sql_res:
print(res)
......@@ -365,7 +367,7 @@ LEFT JOIN
LEFT JOIN dev_view
on t1.partition_date=dev_view.partition_date and t1.cl_id=dev_view.device_id
WHERE (spam_pv.device_id IS NULL or spam_pv.device_id ='')
and (dev_view.device_id is null or dev_view.device_id ='')
and (dev_view.device_id is NULL or dev_view.device_id ='')
GROUP BY t1.partition_date,active_type,device_os_type,channel
)t4
on t3.partition_date=t4.partition_date and t3.active_type=t4.active_type and t3.device_os_type = t4.device_os_type AND t3.channel = t4.channel
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment