假新闻识别应用
You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

117 lines
5.1 KiB

  1. #coding:utf8
  2. import os, sys
  3. import io
  4. sys.stdout = io.TextIOWrapper(sys.stdout.buffer, encoding='utf8')
  5. cur_dir = os.path.dirname(os.path.abspath(__file__)) or os.getcwd()
  6. par_dir = os.path.abspath(os.path.join(cur_dir, os.path.pardir))
  7. sys.path.append(cur_dir)
  8. sys.path.append(par_dir)
  9. import json
  10. from django.http import HttpResponse
  11. from text_analysis.tools import to_kafka,tool
  12. from text_analysis.tools import pred
  13. from django.views.decorators.csrf import csrf_exempt
  14. from log_util.set_logger import set_logger
  15. logging=set_logger('logs/results.log')
  16. import traceback
  17. import queue
  18. from text_analysis.cusException import userFile_Exception,chainFile_Exception
  19. import requests
  20. import time
  21. from datetime import datetime
  22. import os
  23. import joblib
  24. #任务队列
  25. global task_queue
  26. task_queue = queue.Queue()
  27. @csrf_exempt
  28. def fakeNewIdentification(request):
  29. if request.method == 'POST':
  30. try:
  31. raw_data = json.loads(request.body)
  32. task_queue.put(raw_data)
  33. return HttpResponse(json.dumps({"code": 1, "msg": "请求正常!"}, ensure_ascii=False))
  34. except:
  35. logging.error(traceback.format_exc())
  36. return HttpResponse(json.dumps({"code": 0, "msg": "请求json格式不正确!"}, ensure_ascii=False))
  37. else:
  38. return HttpResponse(json.dumps({"code": 0, "msg": "请求方式错误,改为post请求"}, ensure_ascii=False))
  39. def predict_news(dbConfig):
  40. while True:
  41. if task_queue.qsize() > 0:
  42. try:
  43. logging.info("取任务队列长度{}".format(task_queue.qsize()))
  44. raw_data = task_queue.get()
  45. logging.info("原始数据-{}".format(raw_data))
  46. res = {"successCode": "1", "errorLog": "", "results": {},"status":1,"message":"成功"}
  47. # 账号数据
  48. userData = tool.mysqlData(raw_data, logging,"1",dbConfig)
  49. # if not userData:
  50. # raise userFile_Exception
  51. logging.info("账号数据获取完毕!-长度{}".format(len(userData)))
  52. # 传播链数据
  53. postChain=tool.mysqlData(raw_data, logging,"0",dbConfig)
  54. if not postChain:
  55. raise chainFile_Exception
  56. logging.info("传播链数据获取完毕!-长度{}".format(len(postChain)))
  57. news=pred.predict_news(userData,postChain,logging)
  58. # 结束标识
  59. res['isLast'] = True
  60. for i in range(len(news)):
  61. row_dict = news.iloc[i].to_dict()
  62. row_dict['pageType'] = 'fakeNewsPage'
  63. # postId
  64. row_dict['postId'] = userData[0]['postId']
  65. if i == len(news) - 1:
  66. row_dict["isLast"]=1
  67. res["results"] = json.dumps(row_dict,ensure_ascii=False)
  68. res["status"] = 1
  69. res["message"] = "成功"
  70. raw_data["result"] = res
  71. logging.info("共{}条数据,第{}条数据输出-{}".format(len(news),i+1,raw_data))
  72. to_kafka.send_kafka(raw_data, logging)
  73. except userFile_Exception:
  74. res = {"successCode": "0", "errorLog": "用户数据为空!", "results": {}, "status": 2,"message": "异常"}
  75. results={}
  76. results['pageType'] = 'fakeNewsPage'
  77. results['recognitionResult'] = '用户数据为空'
  78. res['results'] = json.dumps(results)
  79. res["status"] = 2
  80. res["message"] = "用户数据为空"
  81. raw_data["result"] = res
  82. logging.info("该条请求用户数据为空-{}".format(raw_data))
  83. to_kafka.send_kafka(raw_data, logging)
  84. except chainFile_Exception:
  85. res = {"successCode": "0", "errorLog": "关系链数据为空!", "results": {}, "status": 2,"message": "异常"}
  86. results={}
  87. results['pageType'] = 'fakeNewsPage'
  88. results['recognitionResult'] = '关系链数据为空'
  89. res['results'] = json.dumps(results)
  90. res["status"] = 2
  91. res["message"] = "关系链数据为空"
  92. raw_data["result"] = res
  93. logging.info("该条请求关系链数据为空-{}".format(raw_data))
  94. to_kafka.send_kafka(raw_data, logging)
  95. except:
  96. res = {"successCode": "0", "errorLog": "", "results": {}, "status": 2,"message": "异常"}
  97. results={}
  98. results['pageType'] = 'fakeNewsPage'
  99. results['recognitionResult'] = ""
  100. res['results'] = json.dumps(results)
  101. res["status"] = 2
  102. res["message"] = "异常"
  103. raw_data["result"] = res
  104. raw_data["result"]["errorLog"] = traceback.format_exc()
  105. logging.info(traceback.format_exc())
  106. to_kafka.send_kafka(raw_data, logging)
  107. else:
  108. # 暂无任务,进入休眠
  109. time.sleep(10)