Skip to content
Projects
Groups
Snippets
Help
Loading...
Sign in
Toggle navigation
M
meta_base_code
Project
Project
Details
Activity
Cycle Analytics
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Charts
Issues
0
Issues
0
List
Board
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Charts
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Charts
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
宋柯
meta_base_code
Commits
2a4face3
Commit
2a4face3
authored
Nov 18, 2020
by
litaolemo
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
update
parent
6180d0f9
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
19 additions
and
5 deletions
+19
-5
recommend_strategy_fix.py
task/recommend_strategy_fix.py
+19
-5
No files found.
task/recommend_strategy_fix.py
View file @
2a4face3
...
@@ -35,9 +35,7 @@ cursor = db.cursor()
...
@@ -35,9 +35,7 @@ cursor = db.cursor()
def
con_sql
(
sql
):
def
con_sql
(
sql
):
# 从数据库的表里获取数据
# 从数据库的表里获取数据
db
=
pymysql
.
connect
(
host
=
'172.16.40.158'
,
port
=
4000
,
user
=
'st_user'
,
passwd
=
'aqpuBLYzEV7tML5RPsN1pntUzFy'
,
db
=
'jerry_prod'
)
db
=
pymysql
.
connect
(
host
=
'172.16.40.158'
,
port
=
4000
,
user
=
'st_user'
,
passwd
=
'aqpuBLYzEV7tML5RPsN1pntUzFy'
,
db
=
'jerry_prod'
)
cursor
=
db
.
cursor
()
cursor
=
db
.
cursor
()
cursor
.
execute
(
sql
)
cursor
.
execute
(
sql
)
result
=
cursor
.
fetchall
()
result
=
cursor
.
fetchall
()
...
@@ -190,7 +188,7 @@ for t in range(0, task_days):
...
@@ -190,7 +188,7 @@ for t in range(0, task_days):
app_session_id
app_session_id
)a
)a
LATERAL VIEW explode (a.recommend_type) v as recommend_type
LATERAL VIEW explode (a.recommend_type) v as recommend_type
group by partition_date,cl_id) t0
group by partition_date,cl_id) t0
having session_pv0 >= 4
on t1.device_id = t0.cl_id
on t1.device_id = t0.cl_id
LEFT JOIN
LEFT JOIN
(--精准曝光,卡片id和session_id去重
(--精准曝光,卡片id和session_id去重
...
@@ -781,7 +779,7 @@ for t in range(0, task_days):
...
@@ -781,7 +779,7 @@ for t in range(0, task_days):
on t2.partition_date=dev.partition_date and t2.cl_id=dev.device_id
on t2.partition_date=dev.partition_date and t2.cl_id=dev.device_id
WHERE spam_pv.device_id IS NULL
WHERE spam_pv.device_id IS NULL
and dev.device_id is null
and dev.device_id is null
GROUP BY t1.partition_date,t1.device_os_type,t1.active_type,t2.card_content_type,t2.recommend_type
having t0.session_pv0 >= 4 or t3.session_pv >0
GROUP BY t1.partition_date,t1.device_os_type,t1.active_type,t2.card_content_type,t2.recommend_type
order by day_id,device_os_type,active_type,card_content_type,recommend_type
order by day_id,device_os_type,active_type,card_content_type,recommend_type
"""
.
format
(
partition_day
=
today_str
)
"""
.
format
(
partition_day
=
today_str
)
ctr_df
=
spark
.
sql
(
ctr_sql
)
ctr_df
=
spark
.
sql
(
ctr_sql
)
...
@@ -797,6 +795,16 @@ for t in range(0, task_days):
...
@@ -797,6 +795,16 @@ for t in range(0, task_days):
device_df
.
show
(
1
,
False
)
device_df
.
show
(
1
,
False
)
sql_res
=
device_df
.
collect
()
sql_res
=
device_df
.
collect
()
data_dict
=
{}
has_click_pv_sql
=
'select pid,card_click from recommend_strategy_d where partition_day = "
%
s"'
%
today_str
all_data_res
=
con_sql
(
has_click_pv_sql
)
for
data
in
all_data_res
:
data_dict
[
data
[
0
]]
=
data
[
1
]
if
not
data_dict
:
import
sys
sys
.
exit
(
0
)
sql_res
=
{}
print
(
"-----------------------------------------------------------------------------"
)
print
(
"-----------------------------------------------------------------------------"
)
for
res
in
sql_res
:
for
res
in
sql_res
:
# print(res)
# print(res)
...
@@ -829,6 +837,12 @@ for t in range(0, task_days):
...
@@ -829,6 +837,12 @@ for t in range(0, task_days):
second_jump_ctr
=
res
.
second_jump_ctr
second_jump_ctr
=
res
.
second_jump_ctr
click_ctr
=
res
.
click_ctr
click_ctr
=
res
.
click_ctr
pid
=
hashlib
.
md5
((
day_id
+
device_os_type
+
active_type
+
card_content_type
+
recommend_type
)
.
encode
(
"utf8"
))
.
hexdigest
()
pid
=
hashlib
.
md5
((
day_id
+
device_os_type
+
active_type
+
card_content_type
+
recommend_type
)
.
encode
(
"utf8"
))
.
hexdigest
()
try
:
card_click_diff
=
card_click
-
data_dict
.
get
(
pid
)
card_click
+=
card_click_diff
card_exposure
+=
card_exposure
except
:
print
(
"add error"
)
instert_sql
=
"""replace into recommend_strategy_d_fix(
instert_sql
=
"""replace into recommend_strategy_d_fix(
day_id,device_os_type,active_type,card_content_type,recommend_type,card_click,card_exposure,avg_page_stay,navbar_search,
day_id,device_os_type,active_type,card_content_type,recommend_type,card_click,card_exposure,avg_page_stay,navbar_search,
highlight_word,self_welfare_card,recommend_welfare_card,recommend_content_card,recommend_special_card,transfer_card,video_consultation,
highlight_word,self_welfare_card,recommend_welfare_card,recommend_content_card,recommend_special_card,transfer_card,video_consultation,
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment