elasticsearch_add_doc.py 810 B

123456789101112131415161718192021222324252627
  1. from elasticsearch import Elasticsearch
  2. from typing import List, Dict
  3. import json
  4. from utils.es import ElasticsearchOperations
  5. def add_law_document(ops):
  6. json_data = None
  7. with open(r"D:\work\03\regulations.json","r",encoding="utf-8") as f:
  8. lines = f.readlines()
  9. json_data = json.loads(''.join(lines))
  10. print(">>> finished process document ")
  11. if json_data:
  12. index = 1
  13. total = len(json_data)
  14. for item in json_data:
  15. es_ops.index_document(item["article_text"],item["meta_data"]['ArticleTitle'])
  16. print(item["meta_data"]['ArticleTitle'],f"processed {index}/{total}")
  17. index = index + 1
  18. # 使用示例
  19. if __name__ == "__main__":
  20. es_ops = ElasticsearchOperations()
  21. add_law_document(es_ops)