Commit 8db47ae3 authored by 段英荣

修改爬虫词

parent 4ec7542e
......@@ -58,7 +58,7 @@ majia_user_list = [
"32269952","32269956","32269962","32269966","32269973","32269978","32269980","32269982","32269987","32269989","32270003","32270004","32270007","32270012","32270015","32270017","32270020","32270024","32270027","32270031","32270041","32270044","32270047","32270050","32270054","32270055","32270057","32270059","32270063","32270066","32269913","32269918","32269920","32269927","32269933","32269939","32269943","32269948","32269957","32269965","32269972","32269979","32269983","32269988","32269995","32270002","32270005","32270011","32270016","32270022","32270029","32270036","32270040","32270051","32270061","32270065","32270071","32270075","32270081","32270085","32270094","32270096","32270110","32270116","32270121","32270141","32270147","32270152","32270156","32270161","32270114","32270119","32270122","32270125","32270129","32270131","32270133","32270134","32270137","32270167","32270068","32270070","32270076","32270078","32270083","32270087","32270093","32270095","32270099","32270105","32269992","32270018","32270023","32270030","32270034","32270043","32270048","32270052","32270056","32270060"
]
g_query_word_set = set()
g_query_word_list = list()
g_if_get_query_word = False
ZHENGXING_HOST = "172.16.30.141"
......@@ -569,9 +569,9 @@ def get_query_word():
try:
# query_word = top_query_list.pop()
global g_query_word_set
global g_query_word_list
global g_if_get_query_word
if len(g_query_word_set) == 0 and not g_if_get_query_word:
if len(g_query_word_list) == 0 and not g_if_get_query_word:
g_if_get_query_word = True
offi_query_word_fd = open("/data/log/spider/test_service/offi_query_word_from_20190101_20200115.txt","r")
for line in offi_query_word_fd:
......@@ -583,11 +583,12 @@ def get_query_word():
query_word,query_counts = line.split("\t")
query_word = query_word.strip()
g_query_word_set.add(query_word)
g_query_word_list.append(query_word)
g_query_word_list.reverse()
offi_query_word_fd.close()
ret_word = g_query_word_set.pop()
ret_word = g_query_word_list.pop()
except:
print(traceback.format_exc())
mutex_for_get_query_word.release()
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment