update

77e3344a · litaolemo · 1b54de34 · 77e3344a · 77e3344a
Commit 77e3344a authored Jul 27, 2020 by litaolemo
Showing 2 changed files with 5 additions and 4 deletions

update_data_in_target_releasers_multi_process_by_date_from_redis.py crawler_sys/framework/update_data_in_target_releasers_multi_process_by_date_from_redis.py +2 -1

crawler_douban.py crawler_sys/site_crawler_by_redis/crawler_douban.py +3 -3

No files found.
--- a/crawler_sys/framework/update_data_in_target_releasers_multi_process_by_date_from_redis.py
+++ b/crawler_sys/framework/update_data_in_target_releasers_multi_process_by_date_from_redis.py
@@ -14,10 +14,11 @@ Data in es will be update when run this program once.
 @author: hanye
 """
+from crawler.crawler_sys.site_crawler_by_redis import crawler_douban
 from crawler.crawler_sys.site_crawler_by_redis import crawler_toutiao
 from crawler.crawler_sys.site_crawler_by_redis import toutiao_article
 from crawler.crawler_sys.site_crawler_by_redis import crawler_weibo
-from crawler.crawler_sys.site_crawler_by_redis import crawler_douban
 # crawler_v_qq, crawler_tudou, crawler_haokan,
 # crawler_tencent_news,
 # crawler_wangyi_news, crawler_kwai, crawler_douyin,

--- a/crawler_sys/site_crawler_by_redis/crawler_douban.py
+++ b/crawler_sys/site_crawler_by_redis/crawler_douban.py
@@ -26,14 +26,14 @@ from crawler.crawler_sys.utils.trans_strtime_to_timestamp import weibo_parse_tim
 # from crawler.crawler_sys.utils.trans_duration_str_to_second import trans_duration
 # from crawler.crawler_sys.utils.util_logging import logged
 # from crawler.crawler_sys.proxy_pool.func_get_proxy_form_kuaidaili import get_proxy
-from crawler.crawler_sys.utils.html_to_str import dehtml
+# from crawler.crawler_sys.utils.html_to_str import dehtml
-from bs4 import BeautifulSoup
+# from bs4 import BeautifulSoup
 from write_data_into_es.func_get_releaser_id import *
 from write_data_into_es.func_cal_doc_id import cal_doc_id
 class Crawler_douban():
-    def __init__(self, timeout=None, platform='weibo'):
+    def __init__(self, timeout=None, platform='douban'):
        if timeout == None:
            self.timeout = 10
        else: