Skip to content
Projects
Groups
Snippets
Help
Loading...
Sign in
Toggle navigation
M
meta_base_code
Project
Project
Details
Activity
Cycle Analytics
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Charts
Issues
0
Issues
0
List
Board
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Charts
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Charts
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
黎涛
meta_base_code
Commits
04a60449
Commit
04a60449
authored
Sep 04, 2020
by
litaolemo
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
update
parent
883cd047
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
25 additions
and
25 deletions
+25
-25
search_strategy_d.py
task/search_strategy_d.py
+25
-25
No files found.
task/search_strategy_d.py
View file @
04a60449
...
@@ -72,9 +72,9 @@ spark.sql("CREATE TEMPORARY FUNCTION is_json AS 'com.gmei.hive.common.udf.UDFJso
...
@@ -72,9 +72,9 @@ spark.sql("CREATE TEMPORARY FUNCTION is_json AS 'com.gmei.hive.common.udf.UDFJso
spark
.
sql
(
"CREATE TEMPORARY FUNCTION arrayMerge AS 'com.gmei.hive.common.udf.UDFArryMerge'"
)
spark
.
sql
(
"CREATE TEMPORARY FUNCTION arrayMerge AS 'com.gmei.hive.common.udf.UDFArryMerge'"
)
task_list
=
[]
task_list
=
[]
task_days
=
2
task_days
=
90
for
t
in
range
(
1
,
task_days
):
for
t
in
range
(
0
,
task_days
):
day_num
=
0
-
t
day_num
=
0
-
t
now
=
(
datetime
.
datetime
.
now
()
+
datetime
.
timedelta
(
days
=
day_num
))
now
=
(
datetime
.
datetime
.
now
()
+
datetime
.
timedelta
(
days
=
day_num
))
last_30_day_str
=
(
now
+
datetime
.
timedelta
(
days
=-
30
))
.
strftime
(
"
%
Y
%
m
%
d"
)
last_30_day_str
=
(
now
+
datetime
.
timedelta
(
days
=-
30
))
.
strftime
(
"
%
Y
%
m
%
d"
)
...
@@ -168,8 +168,8 @@ for t in range(1, task_days):
...
@@ -168,8 +168,8 @@ for t in range(1, task_days):
,t3.channel as channel
,t3.channel as channel
,NVL(t3.search_pv,0) as pv
,NVL(t3.search_pv,0) as pv
,NVL(t3.search_uv,0) as uv
,NVL(t3.search_uv,0) as uv
,if(NVL(t3.search_uv,0) <> 0 ,c
oncat(cast((NVL(t4.hexin_card_click_pv,0)/NVL(t3.search_uv,0)) as decimal(18,2)),'') , '-'
) as search_core_pv
,if(NVL(t3.search_uv,0) <> 0 ,c
ast((NVL(t4.hexin_card_click_pv,0)/NVL(t3.search_uv,0)) as decimal(18,5)) , 0
) as search_core_pv
,if(NVL(t3.search_uv,0) <> 0 ,c
oncat(cast((NVL(t4.neirong_card_click_pv,0)/NVL(t3.search_uv,0)) as decimal(18,2)),'') , '-'
) as search_pv
,if(NVL(t3.search_uv,0) <> 0 ,c
ast((NVL(t4.neirong_card_click_pv,0)/NVL(t3.search_uv,0)) as decimal(18,5)) , 0
) as search_pv
FROM
FROM
(--昨天总搜索量
(--昨天总搜索量
SELECT partition_date,active_type,device_os_type,channel,search_pv,search_uv
SELECT partition_date,active_type,device_os_type,channel,search_pv,search_uv
...
@@ -728,25 +728,25 @@ for t in range(1, task_days):
...
@@ -728,25 +728,25 @@ for t in range(1, task_days):
#
#
# finnal_df.show(1, False)
# finnal_df.show(1, False)
# sql_res = finnal_df.collect()
# sql_res = finnal_df.collect()
#
for res in sql_res:
for
res
in
sql_res
:
#
# print(res)
# print(res)
# device_type = res.device
_type
device_type
=
res
.
device_os
_type
#
active_type = res.active_type
active_type
=
res
.
active_type
#
channel_type = res.channel_type
channel_type
=
res
.
channel_type
# core_pv_division_uv = res.core_pv_division_u
v
core_pv_division_uv
=
res
.
search_core_p
v
# pv_division_uv = res.pv_division_u
v
pv_division_uv
=
res
.
search_p
v
#
pid = hashlib.md5(
pid
=
hashlib
.
md5
(
#
(today_str + device_type + active_type + channel_type).encode("utf8")).hexdigest()
(
today_str
+
device_type
+
active_type
+
channel_type
)
.
encode
(
"utf8"
))
.
hexdigest
()
#
instert_sql = """replace into search_strategy_d(
instert_sql
=
"""replace into search_strategy_d(
#
day_id,device_type,active_type,channel_type,core_pv_division_uv,pv_division_uv,pid
day_id,device_type,active_type,channel_type,core_pv_division_uv,pv_division_uv,pid
#
) VALUES('{day_id}','{device_type}','{active_type}','{channel_type}',{core_pv_division_uv},{pv_division_uv},'{pid}');""".format(
) VALUES('{day_id}','{device_type}','{active_type}','{channel_type}',{core_pv_division_uv},{pv_division_uv},'{pid}');"""
.
format
(
#
day_id=today_str, device_type=device_type,
day_id
=
today_str
,
device_type
=
device_type
,
#
active_type=active_type, channel_type=channel_type, core_pv_division_uv=core_pv_division_uv,pv_division_uv=pv_division_uv,pid=pid
active_type
=
active_type
,
channel_type
=
channel_type
,
core_pv_division_uv
=
core_pv_division_uv
,
pv_division_uv
=
pv_division_uv
,
pid
=
pid
#
#
)
)
#
print(instert_sql)
print
(
instert_sql
)
#
# cursor.execute("set names 'UTF8'")
# cursor.execute("set names 'UTF8'")
#
res = cursor.execute(instert_sql)
res
=
cursor
.
execute
(
instert_sql
)
#
db.commit()
db
.
commit
()
#
print(res)
print
(
res
)
db
.
close
()
db
.
close
()
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment