千问开源大模型
You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

164 lines
7.3 KiB

  1. # coding:utf8
  2. import os, sys
  3. import io
  4. import time
  5. sys.stdout = io.TextIOWrapper(sys.stdout.buffer, encoding='utf8')
  6. cur_dir = os.path.dirname(os.path.abspath(__file__)) or os.getcwd()
  7. par_dir = os.path.abspath(os.path.join(cur_dir, os.path.pardir))
  8. sys.path.append(cur_dir)
  9. sys.path.append(par_dir)
  10. import json
  11. from django.http import HttpResponse
  12. from text_analysis.tools import to_kafka
  13. from text_analysis.cusException import promptLen_Exception
  14. from django.views.decorators.csrf import csrf_exempt
  15. from log_util.set_logger import set_logger
  16. logger = set_logger('logs/results.log')
  17. import traceback
  18. # import queue
  19. import requests
  20. from text_analysis.tools.tool import get_content,parse_gptResult
  21. import uuid
  22. import time
  23. from kazoo.client import KazooClient
  24. from kazoo.protocol.states import EventType
  25. import queue
  26. task_queue = queue.PriorityQueue()
  27. stop_dict={}
  28. from text_analysis.read_config import load_config
  29. config=load_config()
  30. @csrf_exempt
  31. def QwenModel(request):
  32. if request.method == 'POST':
  33. try:
  34. raw_data = json.loads(request.body)
  35. if "trace" in raw_data.keys() and raw_data["trace"]==True:
  36. task_queue.put((-1, time.time(),raw_data))
  37. else:
  38. task_queue.put((1,time.time(), raw_data))
  39. return HttpResponse(json.dumps({"code": 1, "msg": "请求正常!"}, ensure_ascii=False))
  40. except:
  41. logger.error(traceback.format_exc())
  42. return HttpResponse(json.dumps({"code": 0, "msg": "请求json格式不正确!"}, ensure_ascii=False))
  43. else:
  44. return HttpResponse(json.dumps({"code": 0, "msg": "请求方式错误,改为post请求"}, ensure_ascii=False))
  45. def Qwen():
  46. while True:
  47. try:
  48. if task_queue.qsize()>0:
  49. p,t,raw_data = task_queue.get(timeout=1)
  50. logger.info("当前任务队列长度{}".format(task_queue.qsize()+1))
  51. output = raw_data["output"]
  52. res_tmp = {key: "" for key in output}
  53. if "id" in res_tmp.keys():
  54. res_tmp["id"] = str(uuid.uuid4())
  55. res_tmp["isLast"]=1
  56. task_id=raw_data["scenes_id"]
  57. task_version=raw_data["version"]
  58. logger.info("任务数据为:{}".format(raw_data))
  59. logger.info("当前version信息为:{}".format(stop_dict))
  60. if task_id in stop_dict.keys() and task_version!=stop_dict[task_id]["version"]:
  61. logger.info("已暂停任务,数据过滤掉")
  62. continue
  63. data = get_content(raw_data, logger)
  64. prompt_len=len(data["prompt"])
  65. # if len(data["prompt"])>=10000:
  66. # raise promptLen_Exception
  67. # logger.info("请求信息为{},解析后模型请求为{}".format(raw_data,data))
  68. url=config['qwenmodel']['url']
  69. headers = {
  70. "Content-Type": "application/json;charset=UTF-8"
  71. }
  72. payload = json.dumps({
  73. "model":"Qwen2-72B-Instruct-GPTQ-Int4",
  74. "messages": [{"role": "user", "content": data["prompt"]}],
  75. "temperature": float(data["temperature"]),
  76. "top_p": float(data["top_p"]),
  77. "n": int(data["n"])
  78. })
  79. # logger.info("prompt为{}".format(data["prompt"]))
  80. response = requests.request("POST", url, headers=headers, data=payload,timeout=180)
  81. logger.info("Prompt为:{}***Qwen返回值:{}-{}".format(data["prompt"],response,response.text))
  82. d = json.loads(response.text)
  83. if response.status_code==400 and "maximum context length" in d["message"]:
  84. logger.info("文本长度超过模型限制-{}-{}".format(prompt_len, raw_data))
  85. raise promptLen_Exception
  86. result = d['choices'][0]['message']['content']
  87. if result:
  88. #添加 0是文本,1是json格式
  89. fieldType = raw_data["input"]['fieldType']
  90. if fieldType == 0:
  91. res_tmp["content"] = result
  92. res_tmp_json = json.dumps(res_tmp, ensure_ascii=False)
  93. raw_data["result"] = {"successCode": "1", "errorLog": "", "results": res_tmp_json,"status":1,"message":"成功"}
  94. else:
  95. res=parse_gptResult(res_tmp,result)
  96. if res:
  97. res["isLast"] = 1
  98. res_tmp_json = json.dumps(res, ensure_ascii=False)
  99. raw_data["result"] = {"successCode": "1", "errorLog": "", "results": res_tmp_json,"status":1,"message":"成功"}
  100. else:
  101. res_tmp_json = json.dumps(res_tmp, ensure_ascii=False)
  102. raw_data["result"] = {"successCode": "1", "errorLog": "", "results": res_tmp_json, "status": 1,"message": "成功"}
  103. else:
  104. logger.info("模型返回值为空")
  105. res_tmp_json = json.dumps(res_tmp, ensure_ascii=False)
  106. raw_data["result"] = {"successCode": "1", "errorLog": "", "results": res_tmp_json, "status": 1,"message": "成功"}
  107. # logger.info(raw_data)
  108. to_kafka.send_kafka(raw_data, logger)
  109. else:
  110. time.sleep(10)
  111. except queue.Empty:
  112. #从空队列取任务
  113. logger.info("该线程任务队列为空,等待新任务")
  114. except promptLen_Exception:
  115. res_tmp_json = json.dumps(res_tmp, ensure_ascii=False)
  116. raw_data["result"] = {"successCode": "0", "errorLog": "", "results": res_tmp_json, "status": 2,"message": "文本长度超过模型限制"}
  117. to_kafka.send_kafka(raw_data, logger)
  118. except:
  119. res_tmp_json = json.dumps(res_tmp, ensure_ascii=False)
  120. raw_data["result"] = {"successCode": "0", "errorLog": traceback.format_exc(), "results": res_tmp_json,"status":2,"message":"异常"}
  121. logger.info("调用Qwen失败{}-{}".format(raw_data, traceback.format_exc()))
  122. to_kafka.send_kafka(raw_data, logger)
  123. def zk_monitoring():
  124. try:
  125. #线上环境
  126. zk = KazooClient(hosts=config['zookeeper']['zkhost'])
  127. #测试环境
  128. # zk = KazooClient(hosts='172.16.12.55:2181,172.16.12.56:2181,172.16.12.57:2181')
  129. zk.start()
  130. # 设置监听器
  131. @zk.DataWatch(config['zookeeper']['node'])
  132. def watch_node(data, stat, event):
  133. if event is not None and event.type == EventType.CHANGED:
  134. data, stat = zk.get("/analyze")
  135. # logger.info("执行删除操作:{}".format(data))
  136. d = json.loads(data)
  137. id = d["scenes_id"]
  138. stop_dict[id] = {}
  139. stop_dict[id]["version"] = d["version"]
  140. stop_dict[id]["operation"] = d["operation"]
  141. # 保持程序运行以监听节点变化
  142. try:
  143. while True:
  144. time.sleep(1)
  145. except:
  146. logger.info("Stopping...")
  147. # 关闭连接
  148. zk.stop()
  149. zk.close()
  150. except:
  151. logger.error(traceback.format_exc())