update

d48a436a · litaolemo · bc21ff8a · d48a436a
Commit d48a436a authored Dec 21, 2020 by litaolemo
Hide whitespace changes
Inline Side-by-side

Showing with 49 additions and 49 deletions

revise_data_from_es.py write_data_into_es/revise_data_from_es.py +49 -49

No files found.
--- a/write_data_into_es/revise_data_from_es.py
+++ b/write_data_into_es/revise_data_from_es.py
@@ -19,15 +19,15 @@ hosts = '172.16.31.17'
 port = 9000
 es2 = elasticsearch.Elasticsearch(hosts=hosts, port=port)

-# es7 = e7.Elasticsearch(hosts="172.16.52.27", port=9200,http_auth=("elastic","gengmei!@#"))
-es7 = e7.Elasticsearch(hosts="172.16.31.17", port=9000)
+es7 = e7.Elasticsearch(hosts="172.16.52.27", port=9200,http_auth=("elastic","gengmei!@#"))
+# NOTE(review): credentials above are hard-coded. Previous endpoint: e7.Elasticsearch(hosts="172.16.31.17", port=9000)


 target_index = 'gm-dbmw-doctor-read'
 target_type = 'doctor'

 from_index = 'gm-dbmw-doctor-read'
-from_type = 'doc'
+from_type = '_doc'


 bulk_all_body = ''
@@ -47,49 +47,49 @@ es7_re = es7.search(index=target_index, doc_type=target_type,
 print(es7_re)
 #
 # q3_total = es2_re['hits']['total']
-# write_into_scan = scan(client=es2,
-#                        query=search_body,
-#                        index=target_index,
-#                        doc_type=target_type,
-#                        scroll='5m',
-#                        request_timeout=100
-#                        )
-#
-# count = 0
-# for one_scan in write_into_scan:
-#     count = count + 1
-#     line = one_scan['_source']
-#     doc_id = one_scan['_id']
-#     try:
-#         if line['facevideo_is_assistant'] == 1:
-#             line['facevideo_is_assistant'] = True
-#         else:
-#             line['facevideo_is_assistant'] = False
-#     except:
-#         pass
-#
-#     bulk_head = '{"index": {"_id":"%s"}}' % doc_id
-#     data_str = json.dumps(line, ensure_ascii=False)
-#
-#     bulk_one_body = bulk_head + '\n' + data_str + '\n'
-#     # print(bulk_one_body)
-#     bulk_all_body += bulk_one_body
-#     # break
-#     if count%500 == 0:
-#
-#          eror_dic=es7.bulk(index=target_index,
-#                 body=bulk_all_body, request_timeout=200)
-#          bulk_all_body=''
-#          if eror_dic['errors'] is True:
-#              print(eror_dic['items'])
-#              print(bulk_all_body)
-#          print(count)
-#
-# if bulk_all_body != '':
-#      eror_dic = es7.bulk(body=bulk_all_body,
-#                         index=target_index,
-#                         request_timeout=200)
-#      if eror_dic['errors'] is True:
-#          print(eror_dic)
-#
-#      bulk_all_body = ''
+# Copy every document matched by search_body from es2 into target_index on
+# es7, sending the bulk index requests in batches of 500 documents.
+write_into_scan = scan(client=es2,
+                       query=search_body,
+                       index=target_index,
+                       doc_type=target_type,
+                       scroll='5m',
+                       request_timeout=100
+                       )
+
+
+def _flush_bulk(body):
+    """Send one newline-delimited bulk payload to es7.
+
+    On a partial failure the per-item results and the payload that caused
+    them are printed; the caller clears its buffer only after this returns.
+    """
+    error_dic = es7.bulk(index=target_index, body=body, request_timeout=200)
+    if error_dic['errors'] is True:
+        print(error_dic['items'])
+        print(body)
+
+
+count = 0
+for one_scan in write_into_scan:
+    count += 1
+    line = one_scan['_source']
+    # Store the flag as a boolean (True only when it equals 1); documents
+    # that lack the field are copied unchanged.
+    if 'facevideo_is_assistant' in line:
+        line['facevideo_is_assistant'] = line['facevideo_is_assistant'] == 1
+
+    # json.dumps escapes the id, so ids containing quotes stay valid JSON.
+    bulk_head = json.dumps({"index": {"_id": one_scan['_id']}}, ensure_ascii=False)
+    data_str = json.dumps(line, ensure_ascii=False)
+    bulk_all_body += bulk_head + '\n' + data_str + '\n'
+
+    if count % 500 == 0:
+        _flush_bulk(bulk_all_body)
+        bulk_all_body = ''
+        print(count)
+
+# Flush the final partial batch, if any documents are still buffered.
+if bulk_all_body:
+    _flush_bulk(bulk_all_body)
+    bulk_all_body = ''