Skip to content
Projects
Groups
Snippets
Help
Loading...
Sign in
Toggle navigation
F
ffm-baseline
Project
Project
Details
Activity
Cycle Analytics
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Charts
Issues
0
Issues
0
List
Board
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Charts
Wiki
Wiki
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Charts
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
ML
ffm-baseline
Commits
2ad622f6
Commit
2ad622f6
authored
May 07, 2019
by
王志伟
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
更改时间
parent
8b35aba5
Show whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
13 additions
and
8 deletions
+13
-8
data_feed_exposure_precise.scala
.../src/main/scala/com/gmei/data_feed_exposure_precise.scala
+13
-8
No files found.
eda/feededa/src/main/scala/com/gmei/data_feed_exposure_precise.scala
View file @
2ad622f6
...
...
@@ -601,6 +601,8 @@ object icon_train_data {
}
object
tag_value
{
Logger
.
getLogger
(
"org.apache.spark"
).
setLevel
(
Level
.
WARN
)
...
...
@@ -653,30 +655,33 @@ object tag_value {
//level_id到权重映射
val
level1_id
=
sc
.
sql
(
s
"""
|select distinct(
level1
_id) as level_id,'${t1}' as value
|select distinct(
tag
_id) as level_id,'${t1}' as value
|from online.bl_tag_hierarchy_detail
|where partition_date = '${partition_date}'
|and level1_id !='0'
|and tag_id !=0
|and tag_type=1
"""
.
stripMargin
)
level1_id
.
createOrReplaceTempView
(
"level1_id"
)
val
level2_id
=
sc
.
sql
(
s
"""
|select distinct(
level2
_id) as level_id,'${t2}' as value
|select distinct(
tag
_id) as level_id,'${t2}' as value
|from online.bl_tag_hierarchy_detail
|where partition_date = '${partition_date}'
|and level2_id !='0'
|and tag_id !=0
|and tag_type=2
"""
.
stripMargin
)
level2_id
.
createOrReplaceTempView
(
"level2_id"
)
val
level3_id
=
sc
.
sql
(
s
"""
|select distinct(
level3
_id) as level_id,'${t3}' as value
|select distinct(
tag
_id) as level_id,'${t3}' as value
|from online.bl_tag_hierarchy_detail
|where partition_date = '${partition_date}'
|and level3_id !='0'
|and tag_id !=0
|and tag_type=3
"""
.
stripMargin
)
level3_id
.
createOrReplaceTempView
(
"level3_id"
)
...
...
@@ -730,7 +735,7 @@ object tag_value {
// temp1.createOrReplaceTempView("temp1")
// import implicit_
val
result
=
temp1
.
select
(
"
level
_id"
).
distinct
().
rdd
.
map
{
x
=>
x
.
toString
().
substring
(
1
,
x
.
toString
().
length
-
1
)}.
zipWithIndex
().
toDF
(
"level_id"
,
"index"
)
val
result
=
temp1
.
select
(
"
tag
_id"
).
distinct
().
rdd
.
map
{
x
=>
x
.
toString
().
substring
(
1
,
x
.
toString
().
length
-
1
)}.
zipWithIndex
().
toDF
(
"level_id"
,
"index"
)
val
test
=
result
.
select
(
result
.
col
(
"level_id"
).
cast
(
DoubleType
).
as
(
"level_id"
),
result
.
col
(
"index"
).
cast
(
DoubleType
).
as
(
"index"
))
// val resDf = spark.createDataFrame(rowRdd)
...
...
@@ -761,7 +766,7 @@ object tag_value {
GmeiConfig
.
writeToJDBCTable
(
"jdbc:mysql://172.16.40.158:4000/jerry_prod?user=root&password=3SYz54LS9#^9sBvC&rewriteBatchedStatements=true"
,
test
,
table
=
"tag_level_index"
,
SaveMode
.
Overwrite
)
println
(
"写入完成"
)
// zhengxing库里面的数据同步到jerry_prod
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment