Skip to content
Projects
Groups
Snippets
Help
Loading...
Sign in
Toggle navigation
F
ffm-baseline
Project
Project
Details
Activity
Cycle Analytics
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Charts
Issues
0
Issues
0
List
Board
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Charts
Wiki
Wiki
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Charts
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
ML
ffm-baseline
Commits
18fc6c48
Commit
18fc6c48
authored
Oct 19, 2019
by
高雅喆
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
改变画像的数据存储格式
parent
b69ad3c9
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
15 additions
and
0 deletions
+15
-0
dist_update_user_portrait_service.py
eda/smart_rank/dist_update_user_portrait_service.py
+15
-0
No files found.
eda/smart_rank/dist_update_user_portrait_service.py
View file @
18fc6c48
...
...
@@ -109,12 +109,20 @@ def get_user_service_portrait(cl_id, all_word_tags, all_tag_tag_type, all_3tag_2
),
axis
=
1
)
gmkv_tag_score_sum
=
tag_score_sum
[[
"tag2"
,
"tag_score"
,
"weight"
]][:
size
]
.
to_dict
(
'record'
)
gmkv_tag_score2_sum
=
tag_score_sum
[[
"tag2"
,
"tag_score"
]][:
size
]
.
to_dict
(
'record'
)
gmkv_tag_score2_sum_dict
=
{
i
[
"tag2"
]:
i
[
"tag_score"
]
for
i
in
gmkv_tag_score2_sum
}
# 写gmkv
gm_kv_cli
=
redis
.
Redis
(
host
=
"172.16.40.135"
,
port
=
5379
,
db
=
2
,
socket_timeout
=
2000
)
cl_id_portrait_key
=
"user:service_portrait_tags:cl_id:"
+
str
(
cl_id
)
tag_id_list_json
=
json
.
dumps
(
gmkv_tag_score_sum
)
gm_kv_cli
.
set
(
cl_id_portrait_key
,
tag_id_list_json
)
gm_kv_cli
.
expire
(
cl_id_portrait_key
,
time
=
30
*
24
*
60
*
60
)
cl_id_portrait_key2
=
"user:service_portrait_tags2:cl_id:"
+
str
(
cl_id
)
tag_id_list_json2
=
json
.
dumps
(
gmkv_tag_score2_sum_dict
)
gm_kv_cli
.
set
(
cl_id_portrait_key2
,
tag_id_list_json2
)
gm_kv_cli
.
expire
(
cl_id_portrait_key2
,
time
=
30
*
24
*
60
*
60
)
# 写tidb,redis同步
stat_date
=
datetime
.
datetime
.
today
()
.
strftime
(
'
%
Y-
%
m-
%
d'
)
replace_sql
=
"""replace into user_service_portrait_tags (stat_date, cl_id, tag_list) values("{stat_date}","{cl_id}","{tag_list}")"""
\
...
...
@@ -175,6 +183,13 @@ if __name__ == '__main__':
gm_kv_cli
.
set
(
hot_search_words_portrait_portrait_key
,
hot_search_words_portrait_json
)
gm_kv_cli
.
expire
(
hot_search_words_portrait_portrait_key
,
time
=
30
*
24
*
60
*
60
)
hot_search_words_portrait_portrait_key2
=
"user:service_coldstart_tags2"
hot_search_words_portrait_dict
=
{
i
[
"id"
]:
10
for
i
in
hot_search_words
}
hot_search_words_portrait_json2
=
json
.
dumps
(
hot_search_words_portrait_dict
)
gm_kv_cli
.
set
(
hot_search_words_portrait_portrait_key2
,
hot_search_words_portrait_json2
)
gm_kv_cli
.
expire
(
hot_search_words_portrait_portrait_key2
,
time
=
30
*
24
*
60
*
60
)
# rdd
sparkConf
=
SparkConf
()
.
set
(
"spark.hive.mapred.supports.subdirectories"
,
"true"
)
\
.
set
(
"spark.hadoop.mapreduce.input.fileinputformat.input.dir.recursive"
,
"true"
)
\
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment