Commit 77e3344a authored by litaolemo

update

parent 1b54de34
......@@ -14,10 +14,11 @@ Data in es will be update when run this program once.
@author: hanye
"""
from crawler.crawler_sys.site_crawler_by_redis import crawler_douban
from crawler.crawler_sys.site_crawler_by_redis import crawler_toutiao
from crawler.crawler_sys.site_crawler_by_redis import toutiao_article
from crawler.crawler_sys.site_crawler_by_redis import crawler_weibo
from crawler.crawler_sys.site_crawler_by_redis import crawler_douban
# crawler_v_qq, crawler_tudou, crawler_haokan,
# crawler_tencent_news,
# crawler_wangyi_news, crawler_kwai, crawler_douyin,
......
......@@ -26,14 +26,14 @@ from crawler.crawler_sys.utils.trans_strtime_to_timestamp import weibo_parse_tim
# from crawler.crawler_sys.utils.trans_duration_str_to_second import trans_duration
# from crawler.crawler_sys.utils.util_logging import logged
# from crawler.crawler_sys.proxy_pool.func_get_proxy_form_kuaidaili import get_proxy
from crawler.crawler_sys.utils.html_to_str import dehtml
from bs4 import BeautifulSoup
# from crawler.crawler_sys.utils.html_to_str import dehtml
# from bs4 import BeautifulSoup
from write_data_into_es.func_get_releaser_id import *
from write_data_into_es.func_cal_doc_id import cal_doc_id
class Crawler_douban():
def __init__(self, timeout=None, platform='weibo'):
def __init__(self, timeout=None, platform='douban'):
if timeout == None:
self.timeout = 10
else:
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment