Skip to content
Projects
Groups
Snippets
Help
Loading...
Sign in
Toggle navigation
M
meta_base_code
Project
Project
Details
Activity
Cycle Analytics
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Charts
Issues
0
Issues
0
List
Board
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Charts
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Charts
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
宋柯
meta_base_code
Commits
f73276dc
Commit
f73276dc
authored
Aug 21, 2020
by
litaolemo
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
update
parent
552d5392
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
38 additions
and
38 deletions
+38
-38
search_strategy_d.py
task/search_strategy_d.py
+38
-38
No files found.
task/search_strategy_d.py
View file @
f73276dc
...
...
@@ -72,38 +72,38 @@ for t in range(0, task_days):
today_str
=
now
.
strftime
(
"
%
Y
%
m
%
d"
)
yesterday_str
=
(
now
+
datetime
.
timedelta
(
days
=-
1
))
.
strftime
(
"
%
Y
%
m
%
d"
)
one_week_age_str
=
(
now
+
datetime
.
timedelta
(
days
=-
7
))
.
strftime
(
"
%
Y
%
m
%
d"
)
sql
=
"""SELECT t1.query as
`query词`
,t1.device_os_type as
`设备类型`
,t1.active_type as
`活跃类型`
,t1.channel as
`渠道类型`
,NVL(t1.search_pv,0) as
`过去30天搜索pv`
,NVL(t1.search_uv,0) as
`过去30天搜索uv`
,if(NVL(t3.search_uv,0) <> 0 ,concat(cast((NVL(t4.hexin_card_click_pv,0)/NVL(t3.search_uv,0)) as decimal(18,2)),'') , '-') as
`昨天-核心卡片点击PV/搜索UV`
,if(NVL(t3.search_uv,0) <> 0 ,concat(cast((NVL(t4.neirong_card_click_pv,0)/NVL(t3.search_uv,0)) as decimal(18,2)),'') , '-') as
`昨天-内容卡片点击PV/搜索UV`
sql
=
"""SELECT t1.query as
query
,t1.device_os_type as
device_type
,t1.active_type as
active_type
,t1.channel as
channel_type
,NVL(t1.search_pv,0) as
30_pv
,NVL(t1.search_uv,0) as
30_uv
,if(NVL(t3.search_uv,0) <> 0 ,concat(cast((NVL(t4.hexin_card_click_pv,0)/NVL(t3.search_uv,0)) as decimal(18,2)),'') , '-') as
1_core_pv/uv
,if(NVL(t3.search_uv,0) <> 0 ,concat(cast((NVL(t4.neirong_card_click_pv,0)/NVL(t3.search_uv,0)) as decimal(18,2)),'') , '-') as
1_pv/uv
,if(NVL(t5.search_uv,0) <> 0 ,concat(cast((NVL(t6.hexin_card_click_pv,0)/NVL(t5.search_uv,0)) as decimal(18,2)),'') , '-') as
`过去7天-核心卡片点击PV/搜索UV`
,if(NVL(t5.search_uv,0) <> 0 ,concat(cast((NVL(t6.neirong_card_click_pv,0)/NVL(t5.search_uv,0)) as decimal(18,2)),'') , '-') as
`过去7天-内容卡片点击PV/搜索UV`
,if(NVL(t5.search_uv,0) <> 0 ,concat(cast((NVL(t6.hexin_card_click_pv,0)/NVL(t5.search_uv,0)) as decimal(18,2)),'') , '-') as
7_core_pv/uv
,if(NVL(t5.search_uv,0) <> 0 ,concat(cast((NVL(t6.neirong_card_click_pv,0)/NVL(t5.search_uv,0)) as decimal(18,2)),'') , '-') as
7_pv/uv
,if(NVL(t1.search_uv,0) <> 0 ,concat(cast((NVL(t2.hexin_card_click_pv,0)/NVL(t1.search_uv,0)) as decimal(18,2)),'') , '-') as
`过去30天-核心卡片点击PV/搜索UV`
,if(NVL(t1.search_uv,0) <> 0 ,concat(cast((NVL(t2.neirong_card_click_pv,0)/NVL(t1.search_uv,0)) as decimal(18,2)),'') , '-') as
`过去30天-内容卡片点击PV/搜索UV`
,if(NVL(t1.search_uv,0) <> 0 ,concat(cast((NVL(t2.hexin_card_click_pv,0)/NVL(t1.search_uv,0)) as decimal(18,2)),'') , '-') as
30_core_pv/uv
,if(NVL(t1.search_uv,0) <> 0 ,concat(cast((NVL(t2.neirong_card_click_pv,0)/NVL(t1.search_uv,0)) as decimal(18,2)),'') , '-') as
30_pv/uv
,NVL(t2.hexin_card_click_pv,0) as
`过去30天搜索结果核心卡片点击pv`
,NVL(t2.neirong_card_click_pv,0) as
`过去30天搜索结果内容卡片点击pv`
,NVL(t2.hexin_card_click_pv,0) as
30_search_core_pv
,NVL(t2.neirong_card_click_pv,0) as
30_search_pv
,NVL(t3.search_pv,0) as
`昨天搜索pv`
,NVL(t3.search_uv,0) as
`昨天搜索uv`
,NVL(t3.search_pv,0) as
1_pv
,NVL(t3.search_uv,0) as
1_uv
,NVL(t4.hexin_card_click_pv,0) as
`昨天搜索结果核心卡片点击pv`
,NVL(t4.neirong_card_click_pv,0) as
`昨天搜索结果内容卡片点击pv`
,NVL(t4.hexin_card_click_pv,0) as
1_search_core_pv
,NVL(t4.neirong_card_click_pv,0) as
1_search_pv
,NVL(t5.search_pv,0) as
`过去7天搜索pv`
,NVL(t5.search_uv,0) as
`过去7天搜索uv`
,NVL(t5.search_pv,0) as
7_pv
,NVL(t5.search_uv,0) as
7_uv
,NVL(t6.hexin_card_click_pv,0) as
`过去7天搜索结果核心卡片点击pv`
,NVL(t6.neirong_card_click_pv,0) as
`过去7天搜索结果内容卡片点击pv`
,NVL(t6.hexin_card_click_pv,0) as
7_search_core_pv
,NVL(t6.neirong_card_click_pv,0) as
7_search_pv
FROM
(
--过去30天总搜索量
(
SELECT query,active_type,device_os_type,channel,search_pv,search_uv
FROM
(
...
...
@@ -140,7 +140,7 @@ for t in range(0, task_days):
AND params['in_page_pos']='猜你喜欢'
AND params['tab_name']='精选'
AND params['card_type']='search_word'
--AND page_name='home' android的page_name为空
UNION ALL
SELECT partition_date
...
...
@@ -197,7 +197,7 @@ for t in range(0, task_days):
)t1
LEFT JOIN
--过去30天搜索结果页卡片点击pv
(
SELECT t1.query,active_type,device_os_type,channel
,sum(hexin) as hexin_card_click_pv
...
...
@@ -210,7 +210,7 @@ for t in range(0, task_days):
,NVL(t2.pv) as hexin
,NVL(t3.pv) as neirong
FROM
(
--核心卡片点击
(
SELECT partition_date
,params['query'] as query
,cl_id
...
...
@@ -228,7 +228,7 @@ for t in range(0, task_days):
,cl_id
)t2
FULL JOIN
(
--内容卡片点击
(
SELECT partition_date
,params['query'] as query
,cl_id
...
...
@@ -281,7 +281,7 @@ for t in range(0, task_days):
LEFT JOIN
(
--昨天总搜索量
(
SELECT query,active_type,device_os_type,channel,search_pv,search_uv
FROM
(
...
...
@@ -317,7 +317,7 @@ for t in range(0, task_days):
AND params['in_page_pos']='猜你喜欢'
AND params['tab_name']='精选'
AND params['card_type']='search_word'
--AND page_name='home' android的page_name为空
UNION ALL
SELECT partition_date
...
...
@@ -375,7 +375,7 @@ for t in range(0, task_days):
on t1.query=t3.query and t1.active_type=t3.active_type and t1.device_os_type = t3.device_os_type AND t1.channel = t3.channel
LEFT JOIN
(
--昨天搜索结果页卡片点击pv
(
SELECT t1.query,active_type,device_os_type,channel
,sum(hexin) as hexin_card_click_pv
,sum(neirong) as neirong_card_click_pv
...
...
@@ -387,7 +387,7 @@ for t in range(0, task_days):
,NVL(t2.pv) as hexin
,NVL(t3.pv) as neirong
FROM
(
--核心卡片点击
(
SELECT partition_date
,params['query'] as query
,cl_id
...
...
@@ -405,7 +405,7 @@ for t in range(0, task_days):
,cl_id
)t2
FULL JOIN
(
--内容卡片点击
(
SELECT partition_date
,params['query'] as query
,cl_id
...
...
@@ -457,7 +457,7 @@ for t in range(0, task_days):
LEFT JOIN
(
--过去一周总搜索量
(
SELECT query,active_type,device_os_type,channel,search_pv,search_uv
FROM
(
...
...
@@ -493,7 +493,7 @@ for t in range(0, task_days):
AND params['in_page_pos']='猜你喜欢'
AND params['tab_name']='精选'
AND params['card_type']='search_word'
--AND page_name='home' android的page_name为空
UNION ALL
SELECT partition_date
...
...
@@ -551,7 +551,7 @@ for t in range(0, task_days):
on t1.query=t5.query and t1.active_type=t5.active_type and t1.device_os_type = t5.device_os_type AND t1.channel = t5.channel
LEFT JOIN
(
--过去一周搜索结果页卡片点击pv
(
SELECT t1.query,active_type,device_os_type,channel
,sum(hexin) as hexin_card_click_pv
,sum(neirong) as neirong_card_click_pv
...
...
@@ -563,7 +563,7 @@ for t in range(0, task_days):
,NVL(t2.pv) as hexin
,NVL(t3.pv) as neirong
FROM
(
--核心卡片点击
(
SELECT partition_date
,params['query'] as query
,cl_id
...
...
@@ -581,7 +581,7 @@ for t in range(0, task_days):
,cl_id
)t2
FULL JOIN
(
--内容卡片点击
(
SELECT partition_date
,params['query'] as query
,cl_id
...
...
@@ -631,7 +631,7 @@ for t in range(0, task_days):
GROUP BY t1.query,active_type,device_os_type,channel
)t6
on t1.query=t6.query and t1.active_type=t6.active_type and t1.device_os_type = t6.device_os_type AND t1.channel = t6.channel
order by
`过去30天搜索pv` desc,`query词`
"""
.
format
(
last_30_day_str
=
last_30_day_str
,
today_str
=
today_str
,
order by
30_pv desc,query
"""
.
format
(
last_30_day_str
=
last_30_day_str
,
today_str
=
today_str
,
yesterday_str
=
yesterday_str
,
one_week_age_str
=
one_week_age_str
)
device_df
=
spark
.
sql
(
sql
)
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment