Skip to content
Projects
Groups
Snippets
Help
Loading...
Sign in
Toggle navigation
F
ffm-baseline
Project
Project
Details
Activity
Cycle Analytics
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Charts
Issues
0
Issues
0
List
Board
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Charts
Wiki
Wiki
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Charts
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
ML
ffm-baseline
Commits
1623a6dd
Commit
1623a6dd
authored
May 06, 2019
by
王志伟
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
更改时间
parent
4bcf06fd
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
56 additions
and
3 deletions
+56
-3
data_feed_exposure_precise.scala
.../src/main/scala/com/gmei/data_feed_exposure_precise.scala
+56
-3
No files found.
eda/feededa/src/main/scala/com/gmei/data_feed_exposure_precise.scala
View file @
1623a6dd
...
@@ -8,6 +8,10 @@ import org.apache.spark.sql.SaveMode
...
@@ -8,6 +8,10 @@ import org.apache.spark.sql.SaveMode
import
org.apache.log4j.
{
Level
,
Logger
}
import
org.apache.log4j.
{
Level
,
Logger
}
import
scopt.OptionParser
import
scopt.OptionParser
import
com.gmei.lib.AbstractParams
import
com.gmei.lib.AbstractParams
//import com.sun.deploy.uitoolkit.Window
import
org.apache.spark.sql.expressions.Window
import
org.apache.spark.sql.functions.row_number
object
data_feed_exposure_precise
{
object
data_feed_exposure_precise
{
...
@@ -662,7 +666,7 @@ object tag_value {
...
@@ -662,7 +666,7 @@ object tag_value {
val
t2
=
0.5
val
t2
=
0.5
val
t3
=
1.0
val
t3
=
1.0
//
tag
_id到权重映射
//
level
_id到权重映射
val
level1_id
=
sc
.
sql
(
val
level1_id
=
sc
.
sql
(
s
"""
s
"""
|select distinct(level1_id) as level_id,'${t1}' as value
|select distinct(level1_id) as level_id,'${t1}' as value
...
@@ -694,7 +698,7 @@ object tag_value {
...
@@ -694,7 +698,7 @@ object tag_value {
level3_id
.
createOrReplaceTempView
(
"level3_id"
)
level3_id
.
createOrReplaceTempView
(
"level3_id"
)
val
tag
_value
=
sc
.
sql
(
val
level
_value
=
sc
.
sql
(
s
"""
s
"""
|select *
|select *
|from level1_id
|from level1_id
...
@@ -709,10 +713,59 @@ object tag_value {
...
@@ -709,10 +713,59 @@ object tag_value {
// tag_value.show(300)
// tag_value.show(300)
println
(
"开始写入"
)
println
(
"开始写入"
)
GmeiConfig
.
writeToJDBCTable
(
"jdbc:mysql://172.16.40.158:4000/jerry_prod?user=root&password=3SYz54LS9#^9sBvC&rewriteBatchedStatements=true"
,
tag
_value
,
table
=
"tagId_value"
,
SaveMode
.
Overwrite
)
GmeiConfig
.
writeToJDBCTable
(
"jdbc:mysql://172.16.40.158:4000/jerry_prod?user=root&password=3SYz54LS9#^9sBvC&rewriteBatchedStatements=true"
,
level
_value
,
table
=
"tagId_value"
,
SaveMode
.
Overwrite
)
println
(
"写入完成"
)
println
(
"写入完成"
)
//level_id到index映射
val
level_index_temp
=
sc
.
sql
(
s
"""
|select a.tag_id,b.level1_id,b.level2_id,b.level3_id
|from online.tl_hdfs_diary_tags_view a
|left join online.bl_tag_hierarchy_detail b
|on a.tag_id = b.id
|where a.partition_date = '${partition_date}'
|and b.partition_date = '${partition_date}'
"""
.
stripMargin
)
level_index_temp
.
createOrReplaceTempView
(
"level_index_temp"
)
val
temp1
=
sc
.
sql
(
s
"""
|select tag_id,level1_id as level_id
|from level_index_temp
|union all
|select tag_id,level2_id as level_id
|from level_index_temp
|union all
|select tag_id,level3_id as level_id
|from level_index_temp
"""
.
stripMargin
)
temp1
.
createOrReplaceTempView
(
"temp1"
)
val
temp2
=
sc
.
sql
(
s
"""
|select concat_ws(',',tag_id,level_id) as tag_level from temp1
"""
.
stripMargin
)
temp2
.
show
()
// temp2.createOrReplaceTempView("temp2")
val
w
=
Window
.
orderBy
(
"tag_level"
)
val
result
=
temp2
.
select
(
"tag_level"
).
distinct
().
withColumn
(
"index"
,
row_number
().
over
(
w
))
result
.
show
()
}
}
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment