Skip to content
Projects
Groups
Snippets
Help
Loading...
Sign in
Toggle navigation
F
ffm-baseline
Project
Project
Details
Activity
Cycle Analytics
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Charts
Issues
0
Issues
0
List
Board
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Charts
Wiki
Wiki
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Charts
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
ML
ffm-baseline
Commits
414e7793
Commit
414e7793
authored
Nov 27, 2018
by
王志伟
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
统计新用户数据
parent
f1ca88ee
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
20 additions
and
63 deletions
+20
-63
strategy_other.scala
eda/feededa/src/main/scala/com/gmei/strategy_other.scala
+20
-63
No files found.
eda/feededa/src/main/scala/com/gmei/strategy_other.scala
View file @
414e7793
...
...
@@ -74,101 +74,58 @@ object strategy_other {
devicee_id_newUser
.
show
()
devicee_id_newUser
.
createOrReplaceTempView
(
"device_id_new"
)
val
clk_count_
old
User_Contrast
=
sc
.
sql
(
val
clk_count_
new
User_Contrast
=
sc
.
sql
(
s
"""
|select '${param.date}' as stat_date, count(cid_id) as clk_count_
old
User_Contrast
|from data_feed_click jd inner join device_id_
old
|on jd.device_id = device_id_
old.deciv
e_id
|select '${param.date}' as stat_date, count(cid_id) as clk_count_
new
User_Contrast
|from data_feed_click jd inner join device_id_
new
|on jd.device_id = device_id_
new.devic
e_id
|where (jd.cid_type = 'diary' or jd.cid_type = 'diary_video')
|and jd.device_id regexp'1$$'
|and jd.device_id not in (select device_id from bl_device_list)
|and jd.device_id not in (select device_id from blacklist)
|and jd.stat_date ='${param.date}'
"""
.
stripMargin
)
val
imp_count_
old
User_Contrast
=
sc
.
sql
(
val
imp_count_
new
User_Contrast
=
sc
.
sql
(
s
"""
|select '${param.date}' as stat_date, count(cid_id) as imp_count_
old
User_Contrast
|from data_feed_exposure je inner join device_id_
old
|on je.device_id = device_id_
old.deciv
e_id
|select '${param.date}' as stat_date, count(cid_id) as imp_count_
new
User_Contrast
|from data_feed_exposure je inner join device_id_
new
|on je.device_id = device_id_
new.devic
e_id
|where je.cid_type = 'diary'
|and je.device_id regexp'1$$'
|and je.device_id not in (select device_id from bl_device_list)
|and je.device_id not in (select device_id from blacklist)
|and je.stat_date ='${param.date}'
"""
.
stripMargin
)
val
clk_count_
old
User_all
=
sc
.
sql
(
val
clk_count_
new
User_all
=
sc
.
sql
(
s
"""
|select '${param.date}' as stat_date, count(cid_id) as clk_count_
old
User_all
|from data_feed_click jd inner join device_id_
old
|on jd.device_id = device_id_
old.deciv
e_id
|select '${param.date}' as stat_date, count(cid_id) as clk_count_
new
User_all
|from data_feed_click jd inner join device_id_
new
|on jd.device_id = device_id_
new.devic
e_id
|where (jd.cid_type = 'diary' or jd.cid_type = 'diary_video')
|and jd.device_id not in (select device_id from bl_device_list)
|and jd.device_id not in (select device_id from blacklist)
|and jd.stat_date ='${param.date}'
"""
.
stripMargin
)
val
imp_count_
old
User_all
=
sc
.
sql
(
val
imp_count_
new
User_all
=
sc
.
sql
(
s
"""
|select '${param.date}' as stat_date, count(cid_id) as imp_count_
old
User_all
|select '${param.date}' as stat_date, count(cid_id) as imp_count_
new
User_all
|from data_feed_exposure je inner join device_id_old
|on je.device_id = device_id_old.decive_id
|where je.cid_type = 'diary'
|and je.device_id not in (select device_id from bl_device_list)
|and je.device_id not in (select device_id from blacklist)
|and je.stat_date ='${param.date}'
"""
.
stripMargin
)
//获取策略命中用户device_id
val
device_id_cover
=
sc
.
sql
(
s
"""
|select distinct(device_id) as device_id
|from merge_queue_table
"""
.
stripMargin
)
device_id_cover
.
createOrReplaceTempView
(
"device_id_cover_older"
)
val
clk_count_oldUser_Cover
=
sc
.
sql
(
s
"""
|select '${param.date}' as stat_date, count(cid_id) as clk_count_oldUser_Cover
|from data_feed_click jd inner join device_id_cover_older
|on jd.device_id = device_id_cover_older.device_id
|where (jd.cid_type = 'diary' or jd.cid_type = 'diary_video')
|and jd.device_id not in (select device_id from bl_device_list)
|and jd.device_id not in (select device_id from blacklist)
|and jd.stat_date ='${param.date}'
"""
.
stripMargin
)
val
imp_count_oldUser_Cover
=
sc
.
sql
(
s
"""
|select '${param.date}' as stat_date, count(cid_id) as imp_count_oldUser_Cover
|from data_feed_exposure je inner join device_id_cover_older
|on je.device_id = device_id_cover_older.device_id
|on je.device_id = device_id_old.device_id
|where je.cid_type = 'diary'
|and je.device_id not in (select device_id from bl_device_list)
|and je.device_id not in (select device_id from blacklist)
|and je.stat_date ='${param.date}'
"""
.
stripMargin
)
val
result3
=
clk_count_newUser_Contrast
.
join
(
imp_count_newUser_Contrast
,
"stat_date"
)
.
join
(
clk_count_newUser_all
,
"stat_date"
)
.
join
(
imp_count_newUser_all
,
"stat_date"
)
result3
.
show
()
val
result1
=
clk_count_oldUser_Contrast
.
join
(
imp_count_oldUser_Contrast
,
"stat_date"
)
.
join
(
clk_count_oldUser_all
,
"stat_date"
)
.
join
(
imp_count_oldUser_all
,
"stat_date"
)
.
join
(
clk_count_oldUser_Cover
,
"stat_date"
)
.
join
(
imp_count_oldUser_Cover
,
"stat_date"
)
result1
.
show
()
GmeiConfig
.
writeToJDBCTable
(
result1
,
"Recommendation_strategy_temp"
,
SaveMode
.
Append
)
GmeiConfig
.
writeToJDBCTable
(
result3
,
"Recommendation_strategy_newOlder"
,
SaveMode
.
Append
)
}
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment