Commit f73276dc authored by litaolemo's avatar litaolemo

update

parent 552d5392
......@@ -72,38 +72,38 @@ for t in range(0, task_days):
today_str = now.strftime("%Y%m%d")
yesterday_str = (now + datetime.timedelta(days=-1)).strftime("%Y%m%d")
one_week_age_str = (now + datetime.timedelta(days=-7)).strftime("%Y%m%d")
sql = """SELECT t1.query as `query词`
,t1.device_os_type as `设备类型`
,t1.active_type as `活跃类型`
,t1.channel as `渠道类型`
,NVL(t1.search_pv,0) as `过去30天搜索pv`
,NVL(t1.search_uv,0) as `过去30天搜索uv`
,if(NVL(t3.search_uv,0) <> 0 ,concat(cast((NVL(t4.hexin_card_click_pv,0)/NVL(t3.search_uv,0)) as decimal(18,2)),'') , '-') as `昨天-核心卡片点击PV/搜索UV`
,if(NVL(t3.search_uv,0) <> 0 ,concat(cast((NVL(t4.neirong_card_click_pv,0)/NVL(t3.search_uv,0)) as decimal(18,2)),'') , '-') as `昨天-内容卡片点击PV/搜索UV`
sql = """SELECT t1.query as query
,t1.device_os_type as device_type
,t1.active_type as active_type
,t1.channel as channel_type
,NVL(t1.search_pv,0) as 30_pv
,NVL(t1.search_uv,0) as 30_uv
,if(NVL(t3.search_uv,0) <> 0 ,concat(cast((NVL(t4.hexin_card_click_pv,0)/NVL(t3.search_uv,0)) as decimal(18,2)),'') , '-') as 1_core_pv/uv
,if(NVL(t3.search_uv,0) <> 0 ,concat(cast((NVL(t4.neirong_card_click_pv,0)/NVL(t3.search_uv,0)) as decimal(18,2)),'') , '-') as 1_pv/uv
,if(NVL(t5.search_uv,0) <> 0 ,concat(cast((NVL(t6.hexin_card_click_pv,0)/NVL(t5.search_uv,0)) as decimal(18,2)),'') , '-') as `过去7天-核心卡片点击PV/搜索UV`
,if(NVL(t5.search_uv,0) <> 0 ,concat(cast((NVL(t6.neirong_card_click_pv,0)/NVL(t5.search_uv,0)) as decimal(18,2)),'') , '-') as `过去7天-内容卡片点击PV/搜索UV`
,if(NVL(t5.search_uv,0) <> 0 ,concat(cast((NVL(t6.hexin_card_click_pv,0)/NVL(t5.search_uv,0)) as decimal(18,2)),'') , '-') as 7_core_pv/uv
,if(NVL(t5.search_uv,0) <> 0 ,concat(cast((NVL(t6.neirong_card_click_pv,0)/NVL(t5.search_uv,0)) as decimal(18,2)),'') , '-') as 7_pv/uv
,if(NVL(t1.search_uv,0) <> 0 ,concat(cast((NVL(t2.hexin_card_click_pv,0)/NVL(t1.search_uv,0)) as decimal(18,2)),'') , '-') as `过去30天-核心卡片点击PV/搜索UV`
,if(NVL(t1.search_uv,0) <> 0 ,concat(cast((NVL(t2.neirong_card_click_pv,0)/NVL(t1.search_uv,0)) as decimal(18,2)),'') , '-') as `过去30天-内容卡片点击PV/搜索UV`
,if(NVL(t1.search_uv,0) <> 0 ,concat(cast((NVL(t2.hexin_card_click_pv,0)/NVL(t1.search_uv,0)) as decimal(18,2)),'') , '-') as 30_core_pv/uv
,if(NVL(t1.search_uv,0) <> 0 ,concat(cast((NVL(t2.neirong_card_click_pv,0)/NVL(t1.search_uv,0)) as decimal(18,2)),'') , '-') as 30_pv/uv
,NVL(t2.hexin_card_click_pv,0) as `过去30天搜索结果核心卡片点击pv`
,NVL(t2.neirong_card_click_pv,0) as `过去30天搜索结果内容卡片点击pv`
,NVL(t2.hexin_card_click_pv,0) as 30_search_core_pv
,NVL(t2.neirong_card_click_pv,0) as 30_search_pv
,NVL(t3.search_pv,0) as `昨天搜索pv`
,NVL(t3.search_uv,0) as `昨天搜索uv`
,NVL(t3.search_pv,0) as 1_pv
,NVL(t3.search_uv,0) as 1_uv
,NVL(t4.hexin_card_click_pv,0) as `昨天搜索结果核心卡片点击pv`
,NVL(t4.neirong_card_click_pv,0) as `昨天搜索结果内容卡片点击pv`
,NVL(t4.hexin_card_click_pv,0) as 1_search_core_pv
,NVL(t4.neirong_card_click_pv,0) as 1_search_pv
,NVL(t5.search_pv,0) as `过去7天搜索pv`
,NVL(t5.search_uv,0) as `过去7天搜索uv`
,NVL(t5.search_pv,0) as 7_pv
,NVL(t5.search_uv,0) as 7_uv
,NVL(t6.hexin_card_click_pv,0) as `过去7天搜索结果核心卡片点击pv`
,NVL(t6.neirong_card_click_pv,0) as `过去7天搜索结果内容卡片点击pv`
,NVL(t6.hexin_card_click_pv,0) as 7_search_core_pv
,NVL(t6.neirong_card_click_pv,0) as 7_search_pv
FROM
(--过去30天总搜索量
(
SELECT query,active_type,device_os_type,channel,search_pv,search_uv
FROM
(
......@@ -140,7 +140,7 @@ for t in range(0, task_days):
AND params['in_page_pos']='猜你喜欢'
AND params['tab_name']='精选'
AND params['card_type']='search_word'
--AND page_name='home' android的page_name为空
UNION ALL
SELECT partition_date
......@@ -197,7 +197,7 @@ for t in range(0, task_days):
)t1
LEFT JOIN
--过去30天搜索结果页卡片点击pv
(
SELECT t1.query,active_type,device_os_type,channel
,sum(hexin) as hexin_card_click_pv
......@@ -210,7 +210,7 @@ for t in range(0, task_days):
,NVL(t2.pv) as hexin
,NVL(t3.pv) as neirong
FROM
(--核心卡片点击
(
SELECT partition_date
,params['query'] as query
,cl_id
......@@ -228,7 +228,7 @@ for t in range(0, task_days):
,cl_id
)t2
FULL JOIN
(--内容卡片点击
(
SELECT partition_date
,params['query'] as query
,cl_id
......@@ -281,7 +281,7 @@ for t in range(0, task_days):
LEFT JOIN
(--昨天总搜索量
(
SELECT query,active_type,device_os_type,channel,search_pv,search_uv
FROM
(
......@@ -317,7 +317,7 @@ for t in range(0, task_days):
AND params['in_page_pos']='猜你喜欢'
AND params['tab_name']='精选'
AND params['card_type']='search_word'
--AND page_name='home' android的page_name为空
UNION ALL
SELECT partition_date
......@@ -375,7 +375,7 @@ for t in range(0, task_days):
on t1.query=t3.query and t1.active_type=t3.active_type and t1.device_os_type = t3.device_os_type AND t1.channel = t3.channel
LEFT JOIN
(--昨天搜索结果页卡片点击pv
(
SELECT t1.query,active_type,device_os_type,channel
,sum(hexin) as hexin_card_click_pv
,sum(neirong) as neirong_card_click_pv
......@@ -387,7 +387,7 @@ for t in range(0, task_days):
,NVL(t2.pv) as hexin
,NVL(t3.pv) as neirong
FROM
(--核心卡片点击
(
SELECT partition_date
,params['query'] as query
,cl_id
......@@ -405,7 +405,7 @@ for t in range(0, task_days):
,cl_id
)t2
FULL JOIN
(--内容卡片点击
(
SELECT partition_date
,params['query'] as query
,cl_id
......@@ -457,7 +457,7 @@ for t in range(0, task_days):
LEFT JOIN
(--过去一周总搜索量
(
SELECT query,active_type,device_os_type,channel,search_pv,search_uv
FROM
(
......@@ -493,7 +493,7 @@ for t in range(0, task_days):
AND params['in_page_pos']='猜你喜欢'
AND params['tab_name']='精选'
AND params['card_type']='search_word'
--AND page_name='home' android的page_name为空
UNION ALL
SELECT partition_date
......@@ -551,7 +551,7 @@ for t in range(0, task_days):
on t1.query=t5.query and t1.active_type=t5.active_type and t1.device_os_type = t5.device_os_type AND t1.channel = t5.channel
LEFT JOIN
(--过去一周搜索结果页卡片点击pv
(
SELECT t1.query,active_type,device_os_type,channel
,sum(hexin) as hexin_card_click_pv
,sum(neirong) as neirong_card_click_pv
......@@ -563,7 +563,7 @@ for t in range(0, task_days):
,NVL(t2.pv) as hexin
,NVL(t3.pv) as neirong
FROM
(--核心卡片点击
(
SELECT partition_date
,params['query'] as query
,cl_id
......@@ -581,7 +581,7 @@ for t in range(0, task_days):
,cl_id
)t2
FULL JOIN
(--内容卡片点击
(
SELECT partition_date
,params['query'] as query
,cl_id
......@@ -631,7 +631,7 @@ for t in range(0, task_days):
GROUP BY t1.query,active_type,device_os_type,channel
)t6
on t1.query=t6.query and t1.active_type=t6.active_type and t1.device_os_type = t6.device_os_type AND t1.channel = t6.channel
order by `过去30天搜索pv` desc,`query词`""".format(last_30_day_str=last_30_day_str, today_str=today_str,
order by 30_pv desc,query""".format(last_30_day_str=last_30_day_str, today_str=today_str,
yesterday_str=yesterday_str, one_week_age_str=one_week_age_str)
device_df = spark.sql(sql)
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment