Skip to content
Projects
Groups
Snippets
Help
Loading...
Sign in
Toggle navigation
F
ffm-baseline
Project
Project
Details
Activity
Cycle Analytics
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Charts
Issues
0
Issues
0
List
Board
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Charts
Wiki
Wiki
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Charts
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
ML
ffm-baseline
Commits
6560d5e2
Commit
6560d5e2
authored
Sep 03, 2018
by
张彦钊
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
修改模型训练数据日期
parent
acce07e8
Hide whitespace changes
Inline
Side-by-side
Showing
4 changed files
with
12 additions
and
18 deletions
+12
-18
diaryUpdateOnlineOffline.py
diaryUpdateOnlineOffline.py
+0
-6
testCases.py
local/testCases.py
+7
-7
train.py
train.py
+1
-1
utils.py
utils.py
+4
-4
No files found.
diaryUpdateOnlineOffline.py
View file @
6560d5e2
...
...
@@ -174,7 +174,6 @@ def update_dairy_queue(score_df,predict_score_df,total_video_id):
def
update_sql_dairy_queue
(
queue_name
,
diary_id
,
device_id
,
city_id
):
begin
=
time
.
time
()
if
flag
:
db
=
pymysql
.
connect
(
host
=
QUEUE_ONLINE_HOST
,
port
=
3306
,
user
=
'doris'
,
passwd
=
'o5gbA27hXHHm'
,
db
=
'doris_prod'
)
...
...
@@ -190,8 +189,6 @@ def update_sql_dairy_queue(queue_name, diary_id,device_id, city_id):
cursor
.
execute
(
sql
)
db
.
commit
()
db
.
close
()
over
=
time
.
time
()
print
(
"写入日记队列耗时{}秒"
.
format
(
over
-
begin
))
print
(
"成功写入diary_id"
)
...
...
@@ -219,7 +216,6 @@ def queue_compare(old_list, new_list):
def
get_queue
(
device_id
,
city_id
,
queue_name
):
begin
=
time
.
time
()
if
flag
:
db
=
pymysql
.
connect
(
host
=
QUEUE_ONLINE_HOST
,
port
=
3306
,
user
=
'doris'
,
passwd
=
'o5gbA27hXHHm'
,
db
=
'doris_prod'
)
...
...
@@ -232,8 +228,6 @@ def get_queue(device_id, city_id,queue_name):
"where device_id = '{}' and city_id = '{}';"
.
format
(
queue_name
,
device_id
,
city_id
)
cursor
.
execute
(
sql
)
result
=
cursor
.
fetchall
()
over
=
time
.
time
()
print
(
"获取日记队列耗时{}秒"
.
format
(
over
-
begin
))
df
=
pd
.
DataFrame
(
list
(
result
))
if
df
.
empty
:
print
(
"该用户对应的日记为空"
)
...
...
local/testCases.py
View file @
6560d5e2
...
...
@@ -40,7 +40,7 @@ def get_local_device():
print
(
1
)
def
save_queue
(
id
,
device_id
,
city_id
):
def
save_queue
():
queue_name_list
=
[
"native_queue"
,
"nearby_queue"
,
"nation_queue"
,
"megacity_queue"
]
for
i
in
queue_name_list
:
sql
=
"select {} from device_diary_queue "
\
...
...
@@ -65,10 +65,10 @@ def delete():
sql
=
"delete from device_diary_queue where device_id = '{}' and city_id = '{}';"
.
format
(
device_id
,
city_id
)
cursor
.
execute
(
sql
)
db
.
close
()
print
(
"
shan
"
)
print
(
"
删除成功
"
)
def
insert
(
id
,
device_id
,
city_id
):
def
insert
():
queue_name_list
=
[
"native_queue"
,
"nearby_queue"
,
"nation_queue"
,
"megacity_queue"
]
a
=
{}
for
i
in
queue_name_list
:
...
...
@@ -87,14 +87,14 @@ def insert(id,device_id,city_id):
print
(
"end"
)
if
__name__
==
"__main__"
:
# 先把数据保存下来,调用上面的save函数,
# 先把数据保存下来,调用上面的save函数,
然后调上面delete函数删除数据,然后调insert函数插入数据
id
=
334
device_id
=
'00CA20EB-2719-4518-85CC-60E765AC526F'
city_id
=
'beijing'
insert
(
id
,
device_id
,
city_id
)
save_queue
()
delete
()
insert
()
...
...
train.py
View file @
6560d5e2
...
...
@@ -19,7 +19,7 @@ if __name__ == "__main__":
print
(
"训练模型耗时{}分"
.
format
((
end_train
-
start_train
)
/
60
))
move_file
()
#TODO 如果用自己写的keepProcess文件守护进程,下面在这个函数里删掉重新启动进程那行代码,因为可能会多启动一次进程
#
restart_process()
restart_process
()
...
...
utils.py
View file @
6560d5e2
...
...
@@ -29,11 +29,11 @@ def get_date():
day
=
now
.
day
date
=
datetime
(
year
,
month
,
day
)
data_start_date
=
"2018-07-15"
data_end_date
=
"2018-09-01
"
validation_date
=
"2018-08-3
1"
# data_end_date = "2018-09-02
"
# validation_date = "2018-09-0
1"
# data_start_date = (date - timedelta(days=3)).strftime("%Y-%m-%d")
#
data_end_date = (date - timedelta(days=1)).strftime("%Y-%m-%d")
#
validation_date = (date - timedelta(days=2)).strftime("%Y-%m-%d")
data_end_date
=
(
date
-
timedelta
(
days
=
1
))
.
strftime
(
"
%
Y-
%
m-
%
d"
)
validation_date
=
(
date
-
timedelta
(
days
=
2
))
.
strftime
(
"
%
Y-
%
m-
%
d"
)
# 验证集和测试集的日期必须相差一天,否则切割数据集时会报错
test_date
=
data_end_date
print
(
"data_start_date,data_end_date,validation_date,test_date:"
)
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment