Skip to content
Projects
Groups
Snippets
Help
Loading...
Sign in
Toggle navigation
F
ffm-baseline
Project
Project
Details
Activity
Cycle Analytics
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Charts
Issues
0
Issues
0
List
Board
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Charts
Wiki
Wiki
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Charts
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
ML
ffm-baseline
Commits
17b1f603
Commit
17b1f603
authored
Dec 04, 2018
by
王志伟
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
核对日记本PV
parent
54bac5be
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
35 additions
and
14 deletions
+35
-14
WeafareStat.scala
eda/feededa/src/main/scala/com/gmei/WeafareStat.scala
+1
-0
testt.scala
eda/feededa/src/main/scala/com/gmei/testt.scala
+34
-14
No files found.
eda/feededa/src/main/scala/com/gmei/WeafareStat.scala
View file @
17b1f603
...
...
@@ -206,6 +206,7 @@ object WeafareStat {
val
result5
=
result4
.
withColumn
(
"diary_expoure_meigou_rate"
,
result
.
col
(
"diary_meigou_count"
)/
result
.
col
(
"diary_expoure"
))
result5
.
show
()
GmeiConfig
.
writeToJDBCTable
(
result5
,
"diary_meigou_cvr"
,
SaveMode
.
Append
)
sc
.
stop
()
...
...
eda/feededa/src/main/scala/com/gmei/testt.scala
View file @
17b1f603
...
...
@@ -44,27 +44,47 @@ object testt {
ti
.
tidbMapTable
(
dbName
=
"jerry_prod"
,
tableName
=
"diary_video"
)
ti
.
tidbMapTable
(
dbName
=
"jerry_prod"
,
tableName
=
"data_feed_click"
)
ti
.
tidbMapTable
(
dbName
=
"jerry_prod"
,
tableName
=
"blacklist"
)
ti
.
tidbMapTable
(
dbName
=
"jerry_test"
,
tableName
=
"bl_device_list"
)
ti
.
tidbMapTable
(
dbName
=
"jerry_prod"
,
tableName
=
"data_feed_exposure"
)
val
view_count
=
sc
.
sql
(
s
"""
|select params["business_id"] as diary_id,(params["out"]-params["in"]) as dur_time
|from online.tl_hdfs_maidian_view
|where action="page_view"
|and params["page_name"]="diary_detail"
|and partition_date >='20180901'
//机构id
val
agency_id
=
sc
.
sql
(
s
"""
|SELECT DISTINCT(cl_id) as device_id
|FROM online.ml_hospital_spam_pv_day
|WHERE partition_date >= '20180402'
|AND partition_date <= '20181203'
|AND pv_ratio >= 0.95
|UNION ALL
|SELECT DISTINCT(cl_id) as device_id
|FROM online.ml_hospital_spam_pv_month
|WHERE partition_date >= '20171101'
|AND partition_date <= '20181203'
|AND pv_ratio >= 0.95
"""
.
stripMargin
)
view_count
.
show
()
view_count
.
createOrReplaceTempView
(
"temp"
)
)
// agency_id.show()
agency_id
.
createOrReplaceTempView
(
"agency_id"
)
val
diary_pv
=
sc
.
sql
(
s
"""
|select ov.partition_date, count(params["business_id"]) as diary_pv
|from online.tl_hdfs_maidian_view ov left join agency_id
|on ov.cl_id = agency_id.device_id
|where ov.action="page_view"
|and ov.params["page_name"]="diary_detail"
|and (ov.params["out"]-ov.params["in"])<7200
|and agency_id.device_id is null
|and ov.partition_date >='20181120'
|and ov.cl_id not in (select distinct(device_id) from blacklist)
|group by ov.partition_date order by ov.partition_date
"""
.
stripMargin
)
diary_pv
.
show
()
GmeiConfig
.
writeToJDBCTable
(
view_count
,
"avg"
,
SaveMode
.
Overwrite
)
// GmeiConfig.writeToJDBCTable(view_count, "avg", SaveMode.Overwrite)
val
result
=
view_count
result
.
show
()
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment