查询知识库应用
You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

86 lines
3.3 KiB

  1. # coding:utf8
  2. import os, sys
  3. import io
  4. from jsonpath_ng import jsonpath, parse
  5. import uuid
  6. sys.stdout = io.TextIOWrapper(sys.stdout.buffer, encoding='utf8')  # re-wrap stdout so text written to it is encoded as UTF-8
  7. cur_dir = os.path.dirname(os.path.abspath(__file__)) or os.getcwd()  # directory containing this file; falls back to the current working directory if that is empty
  8. par_dir = os.path.abspath(os.path.join(cur_dir, os.path.pardir))  # parent directory of cur_dir
  9. sys.path.append(cur_dir)  # put both directories on the import path; presumably required by the project imports that follow (text_analysis, log_util) -- TODO confirm
  10. sys.path.append(par_dir)
  11. import json
  12. from django.http import HttpResponse
  13. from text_analysis.tools import to_kafka
  14. from django.views.decorators.csrf import csrf_exempt
  15. from log_util.set_logger import set_logger
  16. from datetime import datetime, timedelta
  17. logging = set_logger('logs/results.log')  # NOTE: this is the object returned by set_logger, not the stdlib `logging` module (the name shadows it); the rest of the file calls .info()/.error() on it
  18. import traceback
  19. import queue
  20. import requests
  21. from text_analysis.tools.tool import parse_data,promptPro
  22. from text_analysis.writeChroma import LangChainChroma
  23. import time
  24. from datetime import datetime
  25. import os
  26. # Task queue: the promptSim view puts parsed request bodies on it and upload() takes them off
  27. global task_queue  # a `global` statement at module scope has no effect; the name is module-level either way
  28. task_queue = queue.Queue()  # unbounded FIFO queue (no maxsize given)
  29. # LC = LangChainChroma()
  30. @csrf_exempt
  31. def promptSim(request):
  32. if request.method == 'POST':
  33. try:
  34. raw_data = json.loads(request.body)
  35. task_queue.put(raw_data)
  36. return HttpResponse(json.dumps({"code": 1, "msg": "请求正常!"}, ensure_ascii=False))
  37. except:
  38. logging.error(traceback.format_exc())
  39. return HttpResponse(json.dumps({"code": 0, "msg": "请求json格式不正确!"}, ensure_ascii=False))
  40. else:
  41. return HttpResponse(json.dumps({"code": 0, "msg": "请求方式错误,改为post请求"}, ensure_ascii=False))
  42. def upload():
  43. while True:
  44. try:
  45. if task_queue.qsize() > 0:
  46. logging.info("取任务队列长度{}".format(task_queue.qsize()))
  47. raw_data = task_queue.get()
  48. output=raw_data["output"]
  49. res_tmp={key: "" for key in output}
  50. if "id" in res_tmp.keys():
  51. res_tmp["id"]=str(uuid.uuid4())
  52. logging.info("任务数据为:{}".format(raw_data))
  53. topn=parse_data(raw_data,raw_data["input"]["topn"])
  54. prompt=parse_data(raw_data,raw_data["input"]["prompt"])
  55. fieldName=parse_data(raw_data,raw_data["input"]["fieldName"])
  56. LC = LangChainChroma()
  57. promptSim=LC.similarity_search(fieldName,prompt,topn)
  58. logging.info("向量数据库搜索的相似上下文:{}".format(promptSim))
  59. #组装,最长字符5W
  60. res=promptPro(prompt,promptSim)
  61. logging.info("生成的上下文:{}".format(res))
  62. res_tmp["promptRes"]=res
  63. res_tmp_json = json.dumps(res_tmp, ensure_ascii=False)
  64. raw_data["result"] = {"successCode": "1", "errorLog": "", "results": res_tmp_json}
  65. logging.info("结果数据为:{}".format(raw_data))
  66. to_kafka.send_kafka(raw_data, logging)
  67. else:
  68. # 暂无任务,进入休眠
  69. time.sleep(10)
  70. except:
  71. raw_data["result"]={}
  72. raw_data["result"]["successCode"] = "0"
  73. raw_data["result"]["errorLog"] = traceback.format_exc()
  74. raw_data["result"]["results"] = json.dumps(res_tmp, ensure_ascii=False)
  75. logging.error(traceback.format_exc())
  76. to_kafka.send_kafka(raw_data, logging)