Skip to content
Projects
Groups
Snippets
Help
Loading...
Sign in
Toggle navigation
F
ffm-baseline
Project
Project
Details
Activity
Cycle Analytics
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Charts
Issues
0
Issues
0
List
Board
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Charts
Wiki
Wiki
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Charts
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
ML
ffm-baseline
Commits
cbbc62f1
Commit
cbbc62f1
authored
Feb 24, 2020
by
张彦钊
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
add
parent
797041b6
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
9 additions
and
7 deletions
+9
-7
make_data.py
make_data.py
+9
-7
No files found.
make_data.py
View file @
cbbc62f1
...
...
@@ -44,11 +44,10 @@ def doctor():
# date_str = (datetime.datetime.now() - datetime.timedelta(days=1)).strftime("%Y%m%d")
# date_tmp = (datetime.datetime.now() - datetime.timedelta(days=1)).strftime("%Y-%m-%d")
sql
=
"select d.doctor_id,d.service_exposure_pv_30,d.service_ctr_30,d.expert_exposure_pv_30,d.expert_pv_30,"
\
"b.merchant_id "
\
"from statistic_doctor_rank_factor d "
\
"left join hippo_merchantrelevance b on d.doctor_id = b.doctor_id "
\
"where d.partition_date = '{}';"
.
format
(
date_str
)
sql
=
"select d.doctor_id,d.service_exposure_pv_30,d.service_ctr_30,d.expert_exposure_pv_30,"
\
"d.expert_pv_30,b.merchant_id from statistic_doctor_rank_factor d "
\
"left join hippo_merchantrelevance b on d.doctor_id = b.doctor_id "
\
"where d.partition_date = '{}';"
.
format
(
date_str
)
db
=
pymysql
.
connect
(
host
=
'172.16.30.143'
,
port
=
3306
,
user
=
'work'
,
passwd
=
'BJQaT9VzDcuPBqkd'
,
db
=
'zhengxing'
)
cursor
=
db
.
cursor
()
...
...
@@ -64,6 +63,7 @@ def doctor():
df
=
df
.
dropna
(
subset
=
[
"merchant_id"
])
print
(
"drop"
)
print
(
df
.
shape
)
print
(
df
.
head
(
6
))
sql
=
"select merchant_id,doctor_discount_30_days,expand_rechange_amount_30,"
\
"service_pv_30,expert_pv_30,organization_pv_30 from statistic_merchant_rank_factor "
\
...
...
@@ -79,6 +79,7 @@ def doctor():
tmp
=
tmp
.
rename
(
columns
=
dict
(
zip
(
list
(
range
(
len
(
name
))),
name
)))
print
(
"tmp"
)
print
(
tmp
.
shape
)
print
(
tmp
.
head
(
6
))
df
[
"merchant_id"
]
=
df
[
"merchant_id"
]
.
astype
(
'int64'
)
df
[
"merchant_id"
]
=
df
[
"merchant_id"
]
.
astype
(
"str"
)
...
...
@@ -123,6 +124,7 @@ def doctor():
df
.
loc
[
df
[
"pv_ad"
]
<
0.01
,
[
"pv_ad"
]]
=
0.01
df
[
"score"
]
=
df
[
"ctr"
]
**
0.5
*
(
df
[
"commission"
]
+
df
[
"pv_ad"
])
print
(
df
.
shape
)
columns
=
[
"doctor_id"
,
"score"
,
"ctr"
,
"commission"
,
"pv_ad"
,
"service_exposure_pv_30"
,
"service_ctr_30"
,
"expert_exposure_pv_30"
,
"expert_pv_30"
,
...
...
@@ -317,9 +319,9 @@ def old():
if
__name__
==
"__main__"
:
#
doctor()
doctor
()
# hospital()
old
()
#
old()
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment