Commit 32ad8f2c authored by litaolemo

update

parent 138b90ca
...@@ -878,13 +878,15 @@ class Crawler_tudou(): ...@@ -878,13 +878,15 @@ class Crawler_tudou():
if __name__=='__main__': if __name__=='__main__':
test = Crawler_tudou() test = Crawler_tudou()
# url = 'https://video.tudou.com/v/XNDExNjcyNTI0MA==.html' # url = 'https://video.tudou.com/v/XNDExNjcyNTI0MA==.html'
releaser_url = "https://id.tudou.com/i/UNTUzMTU1ODg2OA==" releaser_url = "https://i.youku.com/i/UNzI3OTI2MTkyOA==/videos?spm=a2hzp.8244740.0.0"
# ttt = test.video_page("https://video.tudou.com/v/XNDExNjcyNTI0MA==.html") # ttt = test.video_page("https://video.tudou.com/v/XNDExNjcyNTI0MA==.html")
#releaserUrl=url, output_to_es_raw=True, #releaserUrl=url, output_to_es_raw=True,
# es_index='crawler-data-raw', # es_index='crawler-data-raw',
# doc_type='doc', # doc_type='doc',
# releaser_page_num_max=100) # releaser_page_num_max=100)
test.releaser_page_by_time(1569081600000,1570610953322 ,releaser_url,output_to_es_raw=True,es_index='crawler-data-raw', sacn_Res = test.releaser_page_by_time(1569081600000,1570610953322 ,releaser_url,output_to_es_raw=True,es_index='crawler-data-raw',
doc_type='doc',releaser_page_num_max=4000) doc_type='doc',releaser_page_num_max=4000,allow=20)
for res in sacn_Res:
print(res)
# test.get_releaser_image(releaser_url) # test.get_releaser_image(releaser_url)
# test.get_releaser_follower_num() # test.get_releaser_follower_num()
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment