语音识别应用
You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

151 lines
6.6 KiB

  1. #coding:utf8
  2. import os, sys
  3. import io
  4. sys.stdout = io.TextIOWrapper(sys.stdout.buffer, encoding='utf8')
  5. cur_dir = os.path.dirname(os.path.abspath(__file__)) or os.getcwd()
  6. par_dir = os.path.abspath(os.path.join(cur_dir, os.path.pardir))
  7. sys.path.append(cur_dir)
  8. sys.path.append(par_dir)
  9. import json
  10. from django.http import HttpResponse
  11. from text_analysis.tools import to_kafka
  12. from django.views.decorators.csrf import csrf_exempt
  13. from log_util.set_logger import set_logger
  14. logging=set_logger('logs/results.log')
  15. import traceback
  16. import queue
  17. import requests
  18. from text_analysis.tools.tool import get_data
  19. import time
  20. from datetime import datetime
  21. import os
  22. #任务队列
  23. global task_queue
  24. task_queue = queue.Queue()
  25. #数据队列
  26. global data_queue
  27. data_queue = queue.Queue()
  28. @csrf_exempt
  29. def ASR(request):
  30. if request.method == 'POST':
  31. try:
  32. raw_data = json.loads(request.body)
  33. task_queue.put(raw_data)
  34. return HttpResponse(json.dumps({"code": 1, "msg": "请求正常!"}, ensure_ascii=False))
  35. except:
  36. logging.error(traceback.format_exc())
  37. return HttpResponse(json.dumps({"code": 0, "msg": "请求json格式不正确!"}, ensure_ascii=False))
  38. else:
  39. return HttpResponse(json.dumps({"code": 0, "msg": "请求方式错误,改为post请求"}, ensure_ascii=False))
  40. def upload():
  41. while True:
  42. try:
  43. if task_queue.qsize() >0:
  44. logging.info("取任务队列长度{}".format(task_queue.qsize()))
  45. raw_data = task_queue.get()
  46. index=raw_data["metadata"]["index"]
  47. datasource=raw_data["metadata"]["admin"]["datasource"]
  48. if datasource not in raw_data["data"].keys():
  49. logging.info("找不到相关数据源!—{}".format(raw_data))
  50. continue
  51. allFile=raw_data["data"][datasource]
  52. currentFile=eval(allFile)[index]
  53. currentFile["content"]=""
  54. file=currentFile["fileUrl"]
  55. if "http" not in file:
  56. file="https://caiji.percent.cn/"+file.lstrip("/")
  57. fileName=currentFile["fileName"]
  58. language=raw_data["metadata"]["admin"]["fromLanguage"]
  59. #从gofast获取视频
  60. myfile = requests.get(file)
  61. starttime = datetime.now().strftime('%Y-%m-%d')
  62. path='inputdata/'+starttime
  63. if not os.path.exists(path):
  64. os.makedirs(path)
  65. with open(path+'/'+fileName, 'wb') as f:
  66. f.write(myfile.content)
  67. logging.info("视频从gofast下载完毕,开始上传-{}".format(fileName))
  68. #访问视频上传接口
  69. url = "https://realtime.pdeepmatrix.com/apis/media/analysis/upload"
  70. data = {'fromLanguage': language}
  71. f=open(path+'/'+fileName, 'rb')
  72. files = {'file': f}
  73. response = requests.post(url, data=data, files=files)
  74. d = json.loads(response.text)
  75. if "code" in d.keys() and d["code"]==200:
  76. #接口返回值data中存放视频获取结果的key
  77. result = d["data"]
  78. raw_data["result"] = {"successCode": "1", "errorLog": "", "results": currentFile,"dataKey":result}
  79. data_queue.put(raw_data)
  80. logging.info("视频上传成功{}".format(raw_data))
  81. # to_kafka.send_kafka(raw_data,logging)
  82. else:
  83. logging.info("视频上传失败{}-{}".format(raw_data,d))
  84. f.close()
  85. #Todo删除视频文件
  86. else:
  87. #暂无任务,进入休眠
  88. time.sleep(10)
  89. except:
  90. logging.error(traceback.format_exc())
  91. def getResult():
  92. while True:
  93. #3秒钟结果获取一次
  94. time.sleep(3)
  95. try:
  96. if data_queue.qsize() >0:
  97. logging.info("取数据队列长度{}".format(data_queue.qsize()))
  98. raw_data = data_queue.get()
  99. # print(raw_data)
  100. #根据视频key访问获取结果接口
  101. dataKey=raw_data["result"]["dataKey"]
  102. url = "https://realtime.pdeepmatrix.com/apis/media/analysis/getResult"
  103. params = {'taskId': dataKey}
  104. response = requests.get(url, params=params)
  105. # print(response.text)
  106. d = json.loads(response.text)
  107. if "code" in d.keys() and d["code"]==200:
  108. results=""
  109. if d["data"]["code"]=="1":
  110. for sentence in d["data"]["sentences"]:
  111. results+=sentence["text"]
  112. raw_data["result"]["results"]["content"] =results
  113. raw_data["result"]["results"]=json.dumps(raw_data["result"]["results"],ensure_ascii=False)
  114. logging.info("视频解析获取结果成功{}".format(raw_data))
  115. to_kafka.send_kafka(raw_data, logging)
  116. elif d["data"]["code"]=="0":
  117. #正在解析中,将任务再次放回数据队列
  118. data_queue.put(raw_data)
  119. logging.info("视频未解析完毕,放回队列等待{}-{}".format(raw_data,d))
  120. else:
  121. #解析失败
  122. raw_data["result"]["successCode"] = "0"
  123. raw_data["result"]["errorLog"] = response.text
  124. raw_data["result"]["results"]=json.dumps(raw_data["result"]["results"],ensure_ascii=False)
  125. logging.info("视频解析获取结果失败,数据{},接口返回值{}".format(raw_data, d))
  126. to_kafka.send_kafka(raw_data, logging)
  127. else:
  128. raw_data["result"]["successCode"] = "0"
  129. raw_data["result"]["errorLog"]=response.text
  130. raw_data["result"]["results"] = json.dumps(raw_data["result"]["results"], ensure_ascii=False)
  131. logging.info("视频解析获取结果失败,数据{},接口返回值{}".format(raw_data,d))
  132. to_kafka.send_kafka(raw_data, logging)
  133. else:
  134. #暂无任务,进入休眠
  135. time.sleep(10)
  136. except:
  137. raw_data["result"]["successCode"]="0"
  138. raw_data["result"]["errorLog"]=traceback.format_exc()
  139. raw_data["result"]["results"]=""
  140. logging.error(traceback.format_exc())
  141. to_kafka.send_kafka(raw_data, logging)