Skip to content
Projects
Groups
Snippets
Help
Loading...
Sign in
Toggle navigation
S
strategy_spider
Project
Project
Details
Activity
Cycle Analytics
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Charts
Issues
0
Issues
0
List
Board
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Charts
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Charts
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
rank
strategy_spider
Commits
8db47ae3
Commit
8db47ae3
authored
Jan 31, 2020
by
段英荣
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
修改爬虫词
parent
4ec7542e
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
6 additions
and
5 deletions
+6
-5
zhihu_login.py
zhihu_login.py
+6
-5
No files found.
zhihu_login.py
View file @
8db47ae3
...
...
@@ -58,7 +58,7 @@ majia_user_list = [
"32269952"
,
"32269956"
,
"32269962"
,
"32269966"
,
"32269973"
,
"32269978"
,
"32269980"
,
"32269982"
,
"32269987"
,
"32269989"
,
"32270003"
,
"32270004"
,
"32270007"
,
"32270012"
,
"32270015"
,
"32270017"
,
"32270020"
,
"32270024"
,
"32270027"
,
"32270031"
,
"32270041"
,
"32270044"
,
"32270047"
,
"32270050"
,
"32270054"
,
"32270055"
,
"32270057"
,
"32270059"
,
"32270063"
,
"32270066"
,
"32269913"
,
"32269918"
,
"32269920"
,
"32269927"
,
"32269933"
,
"32269939"
,
"32269943"
,
"32269948"
,
"32269957"
,
"32269965"
,
"32269972"
,
"32269979"
,
"32269983"
,
"32269988"
,
"32269995"
,
"32270002"
,
"32270005"
,
"32270011"
,
"32270016"
,
"32270022"
,
"32270029"
,
"32270036"
,
"32270040"
,
"32270051"
,
"32270061"
,
"32270065"
,
"32270071"
,
"32270075"
,
"32270081"
,
"32270085"
,
"32270094"
,
"32270096"
,
"32270110"
,
"32270116"
,
"32270121"
,
"32270141"
,
"32270147"
,
"32270152"
,
"32270156"
,
"32270161"
,
"32270114"
,
"32270119"
,
"32270122"
,
"32270125"
,
"32270129"
,
"32270131"
,
"32270133"
,
"32270134"
,
"32270137"
,
"32270167"
,
"32270068"
,
"32270070"
,
"32270076"
,
"32270078"
,
"32270083"
,
"32270087"
,
"32270093"
,
"32270095"
,
"32270099"
,
"32270105"
,
"32269992"
,
"32270018"
,
"32270023"
,
"32270030"
,
"32270034"
,
"32270043"
,
"32270048"
,
"32270052"
,
"32270056"
,
"32270060"
]
g_query_word_
set
=
se
t
()
g_query_word_
list
=
lis
t
()
g_if_get_query_word
=
False
ZHENGXING_HOST
=
"172.16.30.141"
...
...
@@ -569,9 +569,9 @@ def get_query_word():
try
:
# query_word = top_query_list.pop()
global
g_query_word_
se
t
global
g_query_word_
lis
t
global
g_if_get_query_word
if
len
(
g_query_word_
se
t
)
==
0
and
not
g_if_get_query_word
:
if
len
(
g_query_word_
lis
t
)
==
0
and
not
g_if_get_query_word
:
g_if_get_query_word
=
True
offi_query_word_fd
=
open
(
"/data/log/spider/test_service/offi_query_word_from_20190101_20200115.txt"
,
"r"
)
for
line
in
offi_query_word_fd
:
...
...
@@ -583,11 +583,12 @@ def get_query_word():
query_word
,
query_counts
=
line
.
split
(
"
\t
"
)
query_word
=
query_word
.
strip
()
g_query_word_
set
.
ad
d
(
query_word
)
g_query_word_
list
.
appen
d
(
query_word
)
g_query_word_list
.
reverse
()
offi_query_word_fd
.
close
()
ret_word
=
g_query_word_
se
t
.
pop
()
ret_word
=
g_query_word_
lis
t
.
pop
()
except
:
print
(
traceback
.
format_exc
())
mutex_for_get_query_word
.
release
()
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment