Browse Source

海外任务缓存

sitask
zhicheng.zhang 4 weeks ago
parent
commit
0ea71fa1ef
  1. 115
      cl_stream_datasave/src/main/java/com/bfd/mf/datasave/download/Newscontent.java
  2. 4
      cl_stream_datasave/src/main/java/com/bfd/mf/datasave/download/test.java
  3. 79
      cl_stream_datasave/src/main/java/com/bfd/mf/datasave/listen/ListenfastTaskManager.java
  4. 480
      cl_stream_datasave/src/main/java/com/bfd/mf/entity/mysql/SubjectTaskdele.java
  5. 471
      cl_stream_datasave/src/main/java/com/bfd/mf/entity/mysql/SubjectTaskdelone.java
  6. 36
      cl_stream_datasave/src/main/java/com/bfd/mf/entity/mysql/si.java
  7. 172
      cl_stream_datasave/src/main/java/com/bfd/mf/entity/mysql/taskdel.java
  8. 31
      cl_stream_datasave/src/main/java/com/bfd/mf/runstart/DelRunStartDataSave.java
  9. 36
      cl_stream_datasave/src/main/resources/META-INF/MANIFEST.MF
  10. BIN
      cl_stream_datasave/target/cl_stream_datasave-2.0-SNAPSHOT.jar
  11. BIN
      cl_stream_datasave/target/cl_stream_datasave-2.0-SNAPSHOT.jar.original
  12. 36
      cl_stream_datasave/target/classes/META-INF/MANIFEST.MF
  13. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/datasave/download/DownLoadFile.class
  14. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/datasave/download/MyCookieJar.class
  15. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/datasave/download/NewsDownload.class
  16. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/datasave/download/Newscontent.class
  17. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/datasave/download/OkHttpUtils.class
  18. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/datasave/download/ProxyIp.class
  19. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/datasave/download/test.class
  20. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/datasave/kafka/IKafka.class
  21. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/datasave/kafka/ReadKafka.class
  22. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/datasave/listen/DataSaveManager.class
  23. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/datasave/listen/ListenKafkaManager.class
  24. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/datasave/listen/ListenTaskManager.class
  25. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/datasave/listen/ListenfastTaskManager.class
  26. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/datasave/tools/Constants.class
  27. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/datasave/tools/DBConnectionManager$DBConnectionPool.class
  28. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/datasave/tools/DBConnectionManager.class
  29. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/datasave/tools/DBUtil.class
  30. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/datasave/tools/DataCheckUtil.class
  31. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/datasave/tools/DataProcess.class
  32. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/datasave/tools/DateUtil.class
  33. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/datasave/tools/PropertiesUtil.class
  34. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/datasave/tools/ReadLine.class
  35. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/datasave/tools/WriteMethod.class
  36. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/entity/AllKeys.class
  37. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/entity/DataSaveManager.class
  38. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/entity/FieldInfo.class
  39. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/entity/FieldNormaliz.class
  40. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/entity/ReaultInfo.class
  41. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/entity/impl/DataSaveManagerImpl.class
  42. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/entity/mysql/FiledTableInfo.class
  43. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/entity/mysql/SubjectTask.class
  44. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/entity/mysql/SubjectTaskdele.class
  45. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/entity/mysql/SubjectTaskdelone.class
  46. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/entity/mysql/Tasklimit.class
  47. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/entity/mysql/Userlimit.class
  48. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/entity/mysql/cl_task.class
  49. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/entity/mysql/si.class
  50. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/entity/mysql/taskdel.class
  51. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/runstart/DelRunStartDataSave.class
  52. BIN
      cl_stream_datasave/target/classes/com/bfd/mf/runstart/RunStartDataSave.class
  53. BIN
      cl_stream_datasave/target/gxcl_stream_datasave-2.0-SNAPSHOT.jar
  54. 5
      cl_stream_datasave/target/maven-archiver/pom.properties
  55. 36
      cl_stream_datasave/target/maven-status/maven-compiler-plugin/compile/default-compile/createdFiles.lst
  56. 39
      cl_stream_datasave/target/maven-status/maven-compiler-plugin/compile/default-compile/inputFiles.lst
  57. 2
      cl_stream_datasave/target/maven-status/maven-compiler-plugin/testCompile/default-testCompile/createdFiles.lst
  58. 3
      cl_stream_datasave/target/maven-status/maven-compiler-plugin/testCompile/default-testCompile/inputFiles.lst
  59. BIN
      cl_stream_datasave/target/test-classes/CreatIndex.class
  60. BIN
      cl_stream_datasave/target/test-classes/Test1.class

115
cl_stream_datasave/src/main/java/com/bfd/mf/datasave/download/Newscontent.java

@ -0,0 +1,115 @@
package com.bfd.mf.datasave.download;
import com.bfd.crawler.utils.JsonUtils;
import java.util.ArrayList;
import java.util.HashMap;
import java.util.List;
import java.util.Map;
//videoPath == egc
//filePath == ugc
//imagePath == pgc
public class Newscontent {
public static void downloadAndSaveimage(Map<String, Object> resultMap, List<Map<String, String>> imagePathSizevalue){
// = (List<Map<String, String>>) resultMap.get("imagePathSize");
List<String> imagePathlist=new ArrayList<>();
for (Map<String, String> mapurl:imagePathSizevalue){
if(mapurl.containsKey("url")){
imagePathlist.add(mapurl.get("url").toString());
}
}
resultMap.put("imagePathSize",JsonUtils.toJSONString(imagePathSizevalue));
resultMap.put("imagePath",imagePathlist);
resultMap.put("pgc",1);
List<Map<String, Object>> picturepath=new ArrayList<>();
if(resultMap.get("pictureList")!=""){
try {
Map<String,Object> map=JsonUtils.parseObject((String) resultMap.get("pictureList"));
if(!map.isEmpty()){
for (Map.Entry<String, Object> entry : map.entrySet()) {
Map<String,Object> gofastmap=new HashMap<>();
Map<String,Object> revmap= (Map<String, Object>) entry.getValue();
if(revmap.containsKey("uploadImg")&&revmap.get("uploadImg")!=null&&revmap.get("uploadImg")!=""){
gofastmap.put("gofastUrl","/group"+revmap.get("uploadImg").toString().split("/group")[1]);
gofastmap.put("originalUrl",revmap.get("img"));
}
picturepath.add(gofastmap);
}
resultMap.put("srcimagePath",JsonUtils.toJSONString(picturepath));
}
} catch (Exception e) {
e.printStackTrace();
}
}
}
public static void downloadAndSavefile(Map<String, Object> resultMap, List<Map<String, Object>> filePathSize){
//List<Map<String, String>> imagePathSizevalue= (List<Map<String, String>>) resultMap.get("filePathSize");
List<String> imagePathlist=new ArrayList<>();
for (Map<String, Object> mapurl:filePathSize){
if(mapurl.containsKey("url")){
imagePathlist.add(mapurl.get("url").toString());
}
}
resultMap.put("filePathSize",JsonUtils.toJSONString(filePathSize));
resultMap.put("filePath",imagePathlist);
resultMap.put("ugc",1);
if(resultMap.get("forwardUrl")!=""){
try {
List<Map<String, Object>> forwardUrl= (List<Map<String, Object>>) JsonUtils.parseArray((String) resultMap.get("forwardUrl"));
List<Map<String, Object>> anewforwardUrl=new ArrayList<>();
for( Map<String, Object> mapList : forwardUrl ) {
if(mapList.containsKey("gofastUrl")){
mapList.put("gofastUrl","/group"+mapList.get("gofastUrl").toString().split("/group")[1]);
anewforwardUrl.add(mapList);
}else{
anewforwardUrl.add(mapList);
}
}
String reforwardUrl=JsonUtils.toJSONString(anewforwardUrl);
resultMap.put("srcfilePath",reforwardUrl);
} catch (Exception e) {
e.printStackTrace();
}
}
}
public static void downloadAndSavevideo(Map<String, Object> resultMap, List<Map<String, String>> videoPathSize){
// List<Map<String, String>> imagePathSizevalue= (List<Map<String, String>>) resultMap.get("videoPathSize");
List<String> imagePathlist=new ArrayList<>();
for (Map<String, String> mapurl:videoPathSize){
if(mapurl.containsKey("url")){
imagePathlist.add(mapurl.get("url"));
}
}
resultMap.put("videoPathSize",JsonUtils.toJSONString(videoPathSize));
resultMap.put("videoPath",imagePathlist);
resultMap.put("egc",1);
if(resultMap.get("videoUrl")!=""){
try {
List<Map<String, Object>> forwardUrl= (List<Map<String, Object>>) JsonUtils.parseArray((String) resultMap.get("videoUrl"));
List<Map<String, Object>> anewforwardUrl=new ArrayList<>();
for( Map<String, Object> mapList : forwardUrl ) {
if(mapList.containsKey("gofastUrl")){
mapList.put("gofastUrl","/group"+mapList.get("gofastUrl").toString().split("/group")[1]);
anewforwardUrl.add(mapList);
}else{
anewforwardUrl.add(mapList);
}
}
String reforwardUrl=JsonUtils.toJSONString(anewforwardUrl);
resultMap.put("srcvideoPath",reforwardUrl);
} catch (Exception e) {
e.printStackTrace();
}
}
}
}

4
cl_stream_datasave/src/main/java/com/bfd/mf/datasave/download/test.java

@ -0,0 +1,4 @@
package com.bfd.mf.datasave.download;
public class test {
}

79
cl_stream_datasave/src/main/java/com/bfd/mf/datasave/listen/ListenfastTaskManager.java

@ -0,0 +1,79 @@
package com.bfd.mf.datasave.listen;
import com.bfd.mf.datasave.kafka.ReadKafka;
import com.bfd.mf.datasave.tools.DateUtil;
import com.bfd.mf.entity.FieldNormaliz;
import com.bfd.mf.entity.mysql.FiledTableInfo;
import com.bfd.mf.entity.mysql.SubjectTask;
import java.util.List;
import java.util.Map;
import java.util.concurrent.LinkedBlockingDeque;
import java.util.concurrent.SynchronousQueue;
import java.util.concurrent.ThreadPoolExecutor;
import java.util.concurrent.TimeUnit;
public class ListenfastTaskManager implements Runnable {
//private LinkedBlockingDeque<String> queue= new LinkedBlockingDeque<String>(5000);
private LinkedBlockingDeque<String> fastqueue= new LinkedBlockingDeque<String>(5000);
private boolean isRun = true;
private FieldNormaliz fieldNormaliz;
private ThreadPoolExecutor spiderPoolExec ;
private Map<String, List<Map<String,String>>> subject;
private Map<Integer,Map<String,String>> tableInfoMap;
public ListenfastTaskManager(FieldNormaliz fieldNormaliz){
int croePoolsize = 20 ;
int maximumPoolsize = 500;
long keepAliveTime = 0;
this.spiderPoolExec = new ThreadPoolExecutor(croePoolsize, maximumPoolsize, keepAliveTime, TimeUnit.SECONDS, new SynchronousQueue<Runnable>());
this.fieldNormaliz = fieldNormaliz ;
this.subject = SubjectTask.subjectTaskMap;
this.tableInfoMap = FiledTableInfo.tableInfoMap;
String kafkaname = fieldNormaliz.getKafkaName()+"fast" ;
ReadKafka readfaseKafka = new ReadKafka(fastqueue , kafkaname ,12 , fieldNormaliz.getGroupId(), fieldNormaliz.getKafkaSerName(),fieldNormaliz.getEsSerName());
readfaseKafka.read();
}
@Override
public void run() {
while(isRun){
if(this.fastqueue.size() < 1){
DateUtil.sleep(1);
continue;
}
String data = this.fastqueue.poll();
System.out.println(data);
if(data == null) continue ;
if (data.equals("__Exit__")) break ;
this.addTask(data);
}
}
private void addTask(String data){
while ( spiderPoolExec.getPoolSize() >= spiderPoolExec.getMaximumPoolSize() ||
spiderPoolExec.getActiveCount() >= spiderPoolExec.getMaximumPoolSize()) {
try {
Thread.sleep(200);
} catch (InterruptedException e) {
e.printStackTrace();
}
}
System.out.println("现有的线程数"+spiderPoolExec.getActiveCount());
spiderPoolExec.submit(new DataSaveManager(data, fieldNormaliz,subject,tableInfoMap));
}
public void setSwitch(boolean flag){
this.isRun = flag ;
}
public LinkedBlockingDeque<String> getQueue(){
return fastqueue ;
}
}

480
cl_stream_datasave/src/main/java/com/bfd/mf/entity/mysql/SubjectTaskdele.java

@ -0,0 +1,480 @@
package com.bfd.mf.entity.mysql;
//import com.bfd.crawler.utils.JsonUtils;
import com.bfd.crawler.utils.JsonUtils;
import com.bfd.mf.datasave.tools.Constants;
import com.bfd.mf.datasave.tools.DBUtil;
import com.bfd.mf.datasave.tools.DateUtil;
import crawler.open.util.RedisUtil;
import org.apache.log4j.Logger;
import java.text.SimpleDateFormat;
import java.util.*;
import static com.bfd.mf.entity.mysql.Tasklimit.subjectTasktimelimiit;
import static com.bfd.mf.entity.mysql.Userlimit.subjectuserlimiit;
public class SubjectTaskdele implements Runnable {
private static Logger log = Logger.getLogger(SubjectTask.class);
public static Map<String, List<Map<String,String>>> subjectTaskMap = new HashMap<>();
// public static void loadSubjectTask() {
// subjectTaskMap.clear();
// //List<Map<String, Object>> subjectTaskList = DBUtil.getInstance("db_stat").query("select cs.del,ct.external_id, ct.subject_id, ct.id, ct.cid, ct.crawl_data_flag,cs.kafka_switch,cs.kafka_addr,cs.go_fast_addr,cs.kafka_topic,cs.go_fast_switch from cl_subject cs Join cl_task ct on(ct.subject_id=cs.id)where (ct.crawl_status=1 or ct.crawl_status=3) and ct.del=0 ;");ct.app_id=cs.app_id and
// String time=DateUtil.getDate();
// //System.out.println(time);
// //System.out.println("结束时间"+ DateUtil.getcurr());
// List<Map<String, Object>> subjectTaskList = DBUtil.getInstance("db_stat_alltask").query("select ct.crawl_content_key,ct.create_user_id,ct.app_id,cs.del,ct.external_id, ct.subject_id, ct.id, ct.cid, ct.crawl_data_flag,cs.kafka_switch,cs.kafka_addr,cs.go_fast_addr,cs.kafka_topic,cs.go_fast_switch from cl_subject cs Join cl_task ct on(ct.subject_id=cs.id) where (ct.crawl_status=1 ) and ct.del=0 and ct.app_id=cs.app_id and ct.cid!=\"\" and ct.update_time>'"+time+"'order by ct.update_time desc;");
// System.out.println(subjectTaskList.size());
// if(subjectTaskList.size() > 0){
// String key = "";
// for(Map<String, Object> subjectTask : subjectTaskList){ //{subject_id=10222, name=我是张三, task_id=188, id=71, crawl_data_flag=aaa}
// String keytwo = "";
// if( subjectTask.get("cid").equals("Tmall")){
// key = subjectTask.get("cid") + "#####" + subjectTask.get("crawl_data_flag");
// keytwo = "Taobao"+ "#####" + subjectTask.get("crawl_data_flag");
// }
// else if (subjectTask.get("cid").equals("Taobao")){
// key = subjectTask.get("cid") + "#####" + subjectTask.get("crawl_data_flag");
// keytwo = "Tmall"+ "#####" + subjectTask.get("crawl_data_flag");
// }
// else {
// key = subjectTask.get("cid") + "#####" + subjectTask.get("crawl_data_flag");
// }
// Map<String,String> value = new HashMap<>();
// List<Map<String,String>> valueList = new ArrayList<>();
// String v_subject_id = "";
// String v_go_fast_addr = "";
// String v_kafka_switch = "";
// String v_kafka_addr = "";
// String v_task_id = "";
// String v_external_id ="";
// String v_go_fast_switch="";
// String v_kafka_topic="";
// String v_status="";
// String v_del="";
// String v_create_user_id="";
// String v_ocr="0";
// String v_trans="0";
// String v_crawl_content_key="";
// if(null != subjectTask.get("subject_id")) {
// v_subject_id = subjectTask.get("subject_id").toString();
// }
// if(null != subjectTask.get("crawl_content_key")) {
// v_crawl_content_key = subjectTask.get("crawl_content_key").toString();
// }
// if(null != subjectTask.get("go_fast_addr")) {
// v_go_fast_addr = subjectTask.get("go_fast_addr").toString();
// }
// if(null != subjectTask.get("kafka_addr")) {
// v_kafka_addr = subjectTask.get("kafka_addr").toString();
// }
// if(null != subjectTask.get("kafka_switch")){
// v_kafka_switch = subjectTask.get("kafka_switch").toString();
// }
// if(null !=subjectTask.get("id")){
// v_task_id = subjectTask.get("id").toString();
// }
// if(null !=subjectTask.get("external_id")){
// v_external_id = subjectTask.get("external_id").toString();
// }
// if(null !=subjectTask.get("go_fast_switch")){
// v_go_fast_switch = subjectTask.get("go_fast_switch").toString();
// }
// if(null !=subjectTask.get("kafka_topic")){
// v_kafka_topic = subjectTask.get("kafka_topic").toString();
// }
//// if(null !=subjectTask.get("status")){
//// v_status = subjectTask.get("status").toString();
//// }
// if(null !=subjectTask.get("del")){
// v_del = subjectTask.get("del").toString();
// }
// if(null !=subjectTask.get("create_user_id")){
// v_create_user_id = subjectTask.get("create_user_id").toString();
// }
// value.put("subject_id",v_subject_id);
// value.put("go_fast_addr",v_go_fast_addr);
// value.put("export_to_kafka",v_kafka_switch);
// value.put("kafka_addr",v_kafka_addr);
// // value.put("task_id",v_task_id);
// value.put("external_id",v_external_id);
// value.put("go_fast_switch",v_go_fast_switch);
// value.put("kafka_topic",v_kafka_topic);
// // value.put("status",v_status);//专题的状态
// value.put("del",v_del);//专题的状态
// value.put("appid",subjectTask.get("app_id").toString());
// value.put("crawl_content_key",v_crawl_content_key);
// //System.out.print(v_external_id+"external_id");
// String newkey = key.toLowerCase();
// String userkey=newkey+"#####"+subjectTask.get("app_id").toString().toLowerCase();
//
// //组装时间的参数
// if (subjectTasktimelimiit.containsKey(userkey)){
// List<Map<String,String>>timelist=subjectTasktimelimiit.get(userkey);
// if(timelist.size()==1){
// for(Map<String, String> subjectTasktime : timelist){
// value.put("maxtime",subjectTasktime.get("max_time").toString());
// value.put("mintime",subjectTasktime.get("min_time").toString());
// }
// } else{
// for(Map<String, String> subjectTasktime : timelist){
// String subject_id=subjectTasktime.get("subject_id").toString();
// if (v_subject_id.equals(subject_id)){
// value.put("maxtime",subjectTasktime.get("max_time").toString());
// value.put("mintime",subjectTasktime.get("min_time").toString());
// }
// }
// }
//
// }
//// //用户的权限
// if (subjectuserlimiit.containsKey(v_create_user_id)){
// Map<String,Object> permission= (Map<String, Object>) subjectuserlimiit.get(v_create_user_id);
// v_ocr= permission.get("is_ocr").toString();
// v_trans= permission.get("is_trans").toString();
// }
// value.put("is_ocr",v_ocr);
// value.put("is_trans",v_trans);
// //组装相同任务的任务id
// if(subjectTaskMap.containsKey(newkey)){
// valueList = subjectTaskMap.get(newkey);
// for (Map<String, String> valuetask : valueList){
// String task=valuetask.get("task_id")+","+v_task_id;
// valuetask.put("task_id",task);
// value.put("task_id",task);
// }
// valueList.add(value);
// }else{
// value.put("task_id",v_task_id);
// valueList.add(value);
// }
//
// if(keytwo.length()>0){
// String tmallnewkey = keytwo.toLowerCase();
// subjectTaskMap.put(tmallnewkey,valueList);
// }
// String redis=newkey+"$$"+JsonUtils.toJSONString(valueList);
//// try {
//// Constants.getLineQueue().put(redis);
//// } catch (InterruptedException e) {
//// e.printStackTrace();
//// }
//
// // RedisUtil.set(newkey, JsonUtils.toJSONString(valueList), 10);
// // System.out.println("结束时间"+ DateUtil.getcurr());
// subjectTaskMap.put(newkey,valueList);
// //System.out.println(newkey);
// }
// // System.out.println("结束时间"+ DateUtil.getcurr());
//
//
// //System.out.println(subjectTaskMap.size());
// log.info("当天任务的数量" + key + " ; data = " + subjectTaskMap.size());
// // SimpleDateFormat df = new SimpleDateFormat("yyyy-MM-dd HH:mm:ss");//设置日期格式
// //System.out.println(subjectTaskList.size());// new Date()为获取当前系统时间
// //WriteMethod.writeMethod("0621test.txt",JsonUtils.toJSONString(subjectTaskMap));
// // System.out.println(JsonUtils.toJSONString(subjectTaskMap)+"当前时间"+ DateUtil.getcurr());
// }else {
// System.out.println("kong a ");
// }
// }
// public static long updatetime = new Date().getTime()/1000;
@Override
public void run() {
while (true) try {
{
long updatetime = new Date().getTime()/1000-15;
List<Map<String, Object>> subjectTaskendList = DBUtil.getInstance("db_stat_alltask").query("select ct.crawl_content_key,ct.create_user_id,ct.app_id,cs.del,ct.crawl_start_time,ct.crawl_end_time,ct.external_id, ct.subject_id, ct.id, ct.cid, ct.crawl_data_flag,cs.kafka_switch,cs.kafka_addr,cs.go_fast_addr,cs.kafka_topic,cs.go_fast_switch from cl_subject cs Join cl_task ct on(ct.subject_id=cs.id) where ct.del=1 and ct.cid!=\"\" and ct.subject_id ='302681' and ct.cid='Npresidentgov' ;");
if(subjectTaskendList.size()>0){
// System.out.println(JsonUtils.toJSONString(subjectTaskendList));
for(Map<String, Object> subjectendtTask : subjectTaskendList){
String v_subject_id = "";
String v_task_id = ""; String appid="";
if(null != subjectendtTask.get("subject_id")) {
v_subject_id = subjectendtTask.get("subject_id").toString();
}
if(null !=subjectendtTask.get("id")){
v_task_id = subjectendtTask.get("id").toString();
}
if(null !=subjectendtTask.get("app_id")){
appid = subjectendtTask.get("app_id").toString();
}
if(subjectTaskendList.size()>0){
// for(Map<String, Object> subjectTask : subjectTaskList){
String key = "";
key = subjectendtTask.get("cid") + "#####" + subjectendtTask.get("crawl_data_flag");
key= key.toLowerCase();
System.out.println(key);
key= key.toLowerCase();
if(disposeCrawldataflag(key)) {
String getsubjectList = RedisUtil.get(key, 10);
List<Map<String, String>> subjectList = (List<Map<String, String>>) JsonUtils.parseArray(getsubjectList);
List<Map<String, String>> redistList = new ArrayList<>();
for (Map<String, String> redissubjectTask : subjectList) {
String resubject_id = redissubjectTask.get("subject_id").toString();
String reappid = redissubjectTask.get("appid").toString();
String taskid = redissubjectTask.get("task_id").toString();
if (!resubject_id.equals(v_subject_id) || !reappid.equals(appid) || !v_task_id.equals(taskid)) {
redistList.add(redissubjectTask);
}
}
String redis = key + "@#@" + JsonUtils.toJSONString(redistList);
// System.out.println(JsonUtils.toJSONString(redistList));
try {
// System.out.println("写入redis是"+redis);
Constants.getLineQueue().put(redis);
} catch (InterruptedException e) {
e.printStackTrace();
}
}
}
// }
// if(subjectTaskList.size() > 0){
// // System.out.println(subjectTaskendList.size()+"大小啊啊啊啊啊啊啊啊");
// String key = "";
// for(Map<String, Object> subjectTask : subjectTaskList){
// String keytwo = "";
// if( subjectTask.get("cid").equals("Tmall")){
// key = subjectTask.get("cid") + "#####" + subjectTask.get("crawl_data_flag");
// keytwo = "Taobao"+ "#####" + subjectTask.get("crawl_data_flag");
// }
// else if (subjectTask.get("cid").equals("Taobao")){
// key = subjectTask.get("cid") + "#####" + subjectTask.get("crawl_data_flag");
// keytwo = "Tmall"+ "#####" + subjectTask.get("crawl_data_flag");
// }
// else {
// key = subjectTask.get("cid") + "#####" + subjectTask.get("crawl_data_flag");
// }
// Map<String,String> value = new HashMap<>();
// List<Map<String,String>> valueList = new ArrayList<>();
// String v_subject_id = "";
// String v_go_fast_addr = "";
// String v_kafka_switch = "";
// String v_kafka_addr = "";
// String v_task_id = "";
// String v_external_id ="";
// String v_go_fast_switch="";
// String v_kafka_topic="";
// String v_status="";
// String v_del="";
// String v_create_user_id="";
// String v_ocr="0";
// String v_trans="0";
// String v_crawl_content_key="";
// String appid="";
// if(null != subjectTask.get("subject_id")) {
// v_subject_id = subjectTask.get("subject_id").toString();
// }
// if(null != subjectTask.get("crawl_content_key")) {
// v_crawl_content_key = subjectTask.get("crawl_content_key").toString();
// }
// if(null != subjectTask.get("go_fast_addr")) {
// v_go_fast_addr = subjectTask.get("go_fast_addr").toString();
// }
// if(null != subjectTask.get("kafka_addr")) {
// v_kafka_addr = subjectTask.get("kafka_addr").toString();
// }
// if(null != subjectTask.get("kafka_switch")){
// v_kafka_switch = subjectTask.get("kafka_switch").toString();
// }
// if(null !=subjectTask.get("id")){
// v_task_id = subjectTask.get("id").toString();
// }
// if(null !=subjectTask.get("external_id")){
// v_external_id = subjectTask.get("external_id").toString();
// }
// if(null !=subjectTask.get("go_fast_switch")){
// v_go_fast_switch = subjectTask.get("go_fast_switch").toString();
// }
// if(null !=subjectTask.get("kafka_topic")){
// v_kafka_topic = subjectTask.get("kafka_topic").toString();
// }
// // if(null !=subjectTask.get("status")){
// // v_status = subjectTask.get("status").toString();
// // }
// if(null !=subjectTask.get("del")){
// v_del = subjectTask.get("del").toString();
// }
// if(null !=subjectTask.get("create_user_id")){
// v_create_user_id = subjectTask.get("create_user_id").toString();
// }
// if(null !=subjectTask.get("app_id")){
// appid = subjectTask.get("app_id").toString();
// }
//
//
// value.put("subject_id",v_subject_id);
// value.put("go_fast_addr",v_go_fast_addr);
// value.put("export_to_kafka",v_kafka_switch);
// value.put("kafka_addr",v_kafka_addr);
// // value.put("task_id",v_task_id);
// value.put("external_id",v_external_id);
// value.put("go_fast_switch",v_go_fast_switch);
// value.put("kafka_topic",v_kafka_topic);
// // value.put("status",v_status);//专题的状态
// value.put("del",v_del);//专题的状态
// value.put("appid",subjectTask.get("app_id").toString());
// value.put("crawl_content_key",v_crawl_content_key);
// //System.out.print(v_external_id+"external_id");
// String newkey = key.toLowerCase();
// String userkey=newkey+"#####"+subjectTask.get("app_id").toString().toLowerCase();
// //组装时间的参数
// if (subjectTasktimelimiit.containsKey(userkey)){
// List<Map<String,String>>timelist=subjectTasktimelimiit.get(userkey);
// if(timelist.size()==1){
// for(Map<String, String> subjectTasktime : timelist){
// value.put("maxtime",subjectTasktime.get("max_time").toString());
// value.put("mintime",subjectTasktime.get("min_time").toString());
// }
// } else{
// for(Map<String, String> subjectTasktime : timelist){
// String subject_id=subjectTasktime.get("subject_id").toString();
// if (v_subject_id.equals(subject_id)){
// value.put("maxtime",subjectTasktime.get("max_time").toString());
// value.put("mintime",subjectTasktime.get("min_time").toString());
// }
// }
// }
//
// }
// // //用户的权限
// if (subjectuserlimiit.containsKey(v_create_user_id)){
// Map<String,Object> permission= (Map<String, Object>) subjectuserlimiit.get(v_create_user_id);
// v_ocr= permission.get("is_ocr").toString();
// v_trans= permission.get("is_trans").toString();
// }
// value.put("is_ocr",v_ocr);
// value.put("is_trans",v_trans);
// Set keysSet = new HashSet();
//
//
// //组装相同任务的任务id
// if(subjectTaskMap.containsKey(newkey)){
// valueList = subjectTaskMap.get(newkey);
// for (Map<String, String> valuetask : valueList){
// String task=valuetask.get("task_id")+","+v_task_id;
// valuetask.put("task_id",task);
// value.put("task_id",task);
// }
// valueList.add(value);
// }else{
// value.put("task_id",v_task_id);
// valueList.add(value);
// }
//// if(disposeCrawldataflag(newkey)) { //判断redis中的key
//// String getsubjectList=RedisUtil.get(newkey,10);
//// try {
//// List<Map<String, String>> subjectList = (List<Map<String, String>>) JsonUtils.parseArray(getsubjectList);
//// List<Map<String, String>> redistList=new ArrayList<>();
//// for(Map<String, String> redissubjectTask : subjectList){
//// String resubject_id=redissubjectTask.get("subject_id").toString();
//// String reappid=redissubjectTask.get("appid").toString();
//// String maxtime="";
//// if(redissubjectTask.containsKey("maxtime")){
//// maxtime=redissubjectTask.get("maxtime").toString();
//// }
////
//// if(!resubject_id.equals(v_subject_id)&&!reappid.equals(appid)){
//// redistList.add(redissubjectTask);
//// }
//// String keys=resubject_id+reappid+maxtime;
//// int beforeSize = keysSet.size();
//// keysSet.add(keys);
//// int afterSize = keysSet.size();
//// if(afterSize == beforeSize + 1){
//// valueList.add(redissubjectTask);
//// }
//// }
//// valueList.addAll(redistList);
//// } catch (Exception e) {
//// log.error("获取redis中的任务失败"+getsubjectList);
//// }
//// }
// if(keytwo.length()>0){
// String tmallnewkey = keytwo.toLowerCase();
// subjectTaskMap.put(tmallnewkey,valueList);
// }
// subjectTaskMap.put(newkey,valueList);
// //System.out.print(valueList);
// }
// //System.out.print(JsonUtils.toJSONString(subjectTaskMap));
//
// Set keysSet = new HashSet();
// for (String newkey :subjectTaskMap.keySet()){
// List<Map<String, String>> newkeyvalue=subjectTaskMap.get(newkey);
// //System.out.println(JsonUtils.toJSONString(newkeyvalue));
// List<Map<String, String>> setkeyvalue=new ArrayList<>();
// for(Map<String, String> redissubjectTask : newkeyvalue){
// String resubject_id=redissubjectTask.get("subject_id").toString();
// String reappid=redissubjectTask.get("appid").toString();
// String maxtime=redissubjectTask.get("maxtime").toString();
// String keys=resubject_id+reappid+newkey;
// int beforeSize = keysSet.size();
// keysSet.add(keys);
// int afterSize = keysSet.size();
// if(afterSize == beforeSize + 1){
// setkeyvalue.add(redissubjectTask);
// }
// }
// String redis=newkey+"@#@"+JsonUtils.toJSONString(setkeyvalue);
// try {
// Constants.getLineQueue().put(redis);
// } catch (InterruptedException e) {
// e.printStackTrace();
// }
// }
//
// log.info("结束时间"+ DateUtil.getcurr());
// //System.out.println(subjectTaskMap.size());
// log.info("当天任务的数量" + key + " ; data = " + subjectTaskMap.size());
// }else {
// String delkey = subjectendtTask.get("cid") + "#####" + subjectendtTask.get("crawl_data_flag");
// log.info(delkey.toLowerCase()+"====del");
// RedisUtil.del(delkey.toLowerCase(), 10);
// }
}
}
Thread.sleep(1000*86400);
}
} catch (Exception e) {
e.printStackTrace();
}
}
private boolean disposeCrawldataflag(String crawldataflag) {
try{
if (RedisUtil.exists(crawldataflag, 10)) { // 先去 redis中查询是否存在不存直接忽略
String value = RedisUtil.get(crawldataflag,10);
if(null != value && !("").equals(value)) {
return true;
}
} else {
log.error("[datasave] exec >>> 灌数:该 crwaldataflag 在 Redis 中不存在!!! keys = " + crawldataflag + " ; dbindex = " + 10);
return false;
}
return false;
}catch (Exception e){
e.printStackTrace();
return false;
}
}
}

471
cl_stream_datasave/src/main/java/com/bfd/mf/entity/mysql/SubjectTaskdelone.java

@ -0,0 +1,471 @@
package com.bfd.mf.entity.mysql;
//import com.bfd.crawler.utils.JsonUtils;
import com.bfd.crawler.utils.JsonUtils;
import com.bfd.mf.datasave.tools.Constants;
import com.bfd.mf.datasave.tools.DBUtil;
import com.bfd.mf.datasave.tools.DateUtil;
import crawler.open.util.RedisUtil;
import org.apache.log4j.Logger;
import java.util.*;
import static com.bfd.mf.entity.mysql.Tasklimit.subjectTasktimelimiit;
import static com.bfd.mf.entity.mysql.Userlimit.subjectuserlimiit;
public class SubjectTaskdelone implements Runnable {
private static Logger log = Logger.getLogger(SubjectTaskdelone.class);
public static Map<String, List<Map<String,String>>> subjectTaskMap = new HashMap<>();
// public static void loadSubjectTask() {
// subjectTaskMap.clear();
// //List<Map<String, Object>> subjectTaskList = DBUtil.getInstance("db_stat").query("select cs.del,ct.external_id, ct.subject_id, ct.id, ct.cid, ct.crawl_data_flag,cs.kafka_switch,cs.kafka_addr,cs.go_fast_addr,cs.kafka_topic,cs.go_fast_switch from cl_subject cs Join cl_task ct on(ct.subject_id=cs.id)where (ct.crawl_status=1 or ct.crawl_status=3) and ct.del=0 ;");ct.app_id=cs.app_id and
// String time=DateUtil.getDate();
// //System.out.println(time);
// //System.out.println("结束时间"+ DateUtil.getcurr());
// List<Map<String, Object>> subjectTaskList = DBUtil.getInstance("db_stat_alltask").query("select ct.crawl_content_key,ct.create_user_id,ct.app_id,cs.del,ct.external_id, ct.subject_id, ct.id, ct.cid, ct.crawl_data_flag,cs.kafka_switch,cs.kafka_addr,cs.go_fast_addr,cs.kafka_topic,cs.go_fast_switch from cl_subject cs Join cl_task ct on(ct.subject_id=cs.id) where (ct.crawl_status=1 ) and ct.del=0 and ct.app_id=cs.app_id and ct.cid!=\"\" and ct.update_time>'"+time+"'order by ct.update_time desc;");
// System.out.println(subjectTaskList.size());
// if(subjectTaskList.size() > 0){
// String key = "";
// for(Map<String, Object> subjectTask : subjectTaskList){ //{subject_id=10222, name=我是张三, task_id=188, id=71, crawl_data_flag=aaa}
// String keytwo = "";
// if( subjectTask.get("cid").equals("Tmall")){
// key = subjectTask.get("cid") + "#####" + subjectTask.get("crawl_data_flag");
// keytwo = "Taobao"+ "#####" + subjectTask.get("crawl_data_flag");
// }
// else if (subjectTask.get("cid").equals("Taobao")){
// key = subjectTask.get("cid") + "#####" + subjectTask.get("crawl_data_flag");
// keytwo = "Tmall"+ "#####" + subjectTask.get("crawl_data_flag");
// }
// else {
// key = subjectTask.get("cid") + "#####" + subjectTask.get("crawl_data_flag");
// }
// Map<String,String> value = new HashMap<>();
// List<Map<String,String>> valueList = new ArrayList<>();
// String v_subject_id = "";
// String v_go_fast_addr = "";
// String v_kafka_switch = "";
// String v_kafka_addr = "";
// String v_task_id = "";
// String v_external_id ="";
// String v_go_fast_switch="";
// String v_kafka_topic="";
// String v_status="";
// String v_del="";
// String v_create_user_id="";
// String v_ocr="0";
// String v_trans="0";
// String v_crawl_content_key="";
// if(null != subjectTask.get("subject_id")) {
// v_subject_id = subjectTask.get("subject_id").toString();
// }
// if(null != subjectTask.get("crawl_content_key")) {
// v_crawl_content_key = subjectTask.get("crawl_content_key").toString();
// }
// if(null != subjectTask.get("go_fast_addr")) {
// v_go_fast_addr = subjectTask.get("go_fast_addr").toString();
// }
// if(null != subjectTask.get("kafka_addr")) {
// v_kafka_addr = subjectTask.get("kafka_addr").toString();
// }
// if(null != subjectTask.get("kafka_switch")){
// v_kafka_switch = subjectTask.get("kafka_switch").toString();
// }
// if(null !=subjectTask.get("id")){
// v_task_id = subjectTask.get("id").toString();
// }
// if(null !=subjectTask.get("external_id")){
// v_external_id = subjectTask.get("external_id").toString();
// }
// if(null !=subjectTask.get("go_fast_switch")){
// v_go_fast_switch = subjectTask.get("go_fast_switch").toString();
// }
// if(null !=subjectTask.get("kafka_topic")){
// v_kafka_topic = subjectTask.get("kafka_topic").toString();
// }
//// if(null !=subjectTask.get("status")){
//// v_status = subjectTask.get("status").toString();
//// }
// if(null !=subjectTask.get("del")){
// v_del = subjectTask.get("del").toString();
// }
// if(null !=subjectTask.get("create_user_id")){
// v_create_user_id = subjectTask.get("create_user_id").toString();
// }
// value.put("subject_id",v_subject_id);
// value.put("go_fast_addr",v_go_fast_addr);
// value.put("export_to_kafka",v_kafka_switch);
// value.put("kafka_addr",v_kafka_addr);
// // value.put("task_id",v_task_id);
// value.put("external_id",v_external_id);
// value.put("go_fast_switch",v_go_fast_switch);
// value.put("kafka_topic",v_kafka_topic);
// // value.put("status",v_status);//专题的状态
// value.put("del",v_del);//专题的状态
// value.put("appid",subjectTask.get("app_id").toString());
// value.put("crawl_content_key",v_crawl_content_key);
// //System.out.print(v_external_id+"external_id");
// String newkey = key.toLowerCase();
// String userkey=newkey+"#####"+subjectTask.get("app_id").toString().toLowerCase();
//
// //组装时间的参数
// if (subjectTasktimelimiit.containsKey(userkey)){
// List<Map<String,String>>timelist=subjectTasktimelimiit.get(userkey);
// if(timelist.size()==1){
// for(Map<String, String> subjectTasktime : timelist){
// value.put("maxtime",subjectTasktime.get("max_time").toString());
// value.put("mintime",subjectTasktime.get("min_time").toString());
// }
// } else{
// for(Map<String, String> subjectTasktime : timelist){
// String subject_id=subjectTasktime.get("subject_id").toString();
// if (v_subject_id.equals(subject_id)){
// value.put("maxtime",subjectTasktime.get("max_time").toString());
// value.put("mintime",subjectTasktime.get("min_time").toString());
// }
// }
// }
//
// }
//// //用户的权限
// if (subjectuserlimiit.containsKey(v_create_user_id)){
// Map<String,Object> permission= (Map<String, Object>) subjectuserlimiit.get(v_create_user_id);
// v_ocr= permission.get("is_ocr").toString();
// v_trans= permission.get("is_trans").toString();
// }
// value.put("is_ocr",v_ocr);
// value.put("is_trans",v_trans);
// //组装相同任务的任务id
// if(subjectTaskMap.containsKey(newkey)){
// valueList = subjectTaskMap.get(newkey);
// for (Map<String, String> valuetask : valueList){
// String task=valuetask.get("task_id")+","+v_task_id;
// valuetask.put("task_id",task);
// value.put("task_id",task);
// }
// valueList.add(value);
// }else{
// value.put("task_id",v_task_id);
// valueList.add(value);
// }
//
// if(keytwo.length()>0){
// String tmallnewkey = keytwo.toLowerCase();
// subjectTaskMap.put(tmallnewkey,valueList);
// }
// String redis=newkey+"$$"+JsonUtils.toJSONString(valueList);
//// try {
//// Constants.getLineQueue().put(redis);
//// } catch (InterruptedException e) {
//// e.printStackTrace();
//// }
//
// // RedisUtil.set(newkey, JsonUtils.toJSONString(valueList), 10);
// // System.out.println("结束时间"+ DateUtil.getcurr());
// subjectTaskMap.put(newkey,valueList);
// //System.out.println(newkey);
// }
// // System.out.println("结束时间"+ DateUtil.getcurr());
//
//
// //System.out.println(subjectTaskMap.size());
// log.info("当天任务的数量" + key + " ; data = " + subjectTaskMap.size());
// // SimpleDateFormat df = new SimpleDateFormat("yyyy-MM-dd HH:mm:ss");//设置日期格式
// //System.out.println(subjectTaskList.size());// new Date()为获取当前系统时间
// //WriteMethod.writeMethod("0621test.txt",JsonUtils.toJSONString(subjectTaskMap));
// // System.out.println(JsonUtils.toJSONString(subjectTaskMap)+"当前时间"+ DateUtil.getcurr());
// }else {
// System.out.println("kong a ");
// }
// }
// public static long updatetime = new Date().getTime()/1000;
@Override
public void run() {
while (true) try {
{
Userlimit.loaduser();
Tasklimit.loadTask();
// long updatetime = new Date().getTime()/1000-15;
// SimpleDateFormat datetime = new SimpleDateFormat("yyyy-MM-dd HH:mm:ss");
// String now=datetime.format(Calendar.getInstance().getTime());
// System.out.println(updatetime+now);
// long starttime=new Date().getTime()/1000-20L;
// if (disposeCrawldataflag("Tasktimelimiit")){
// starttime= Long.parseLong(RedisUtil.get("Tasktimelimiit",10));
// starttime=starttime-5;
// RedisUtil.set("Tasktimelimiit", String.valueOf(updatetime), 10);
// }else {
// System.out.println("第一次写入");
// RedisUtil.set("Tasktimelimiit", String.valueOf(updatetime), 10);
// }
// System.out.println(System.currentTimeMillis()+"开始mysql执行的时间");
// String sql ="select ct.crawl_content_key,ct.create_user_id,ct.app_id,cs.del,ct.external_id, ct.subject_id, ct.id, ct.cid, ct.crawl_data_flag,cs.kafka_switch,cs.kafka_addr,cs.go_fast_addr,cs.kafka_topic,cs.go_fast_switch from cl_subject cs Join cl_task ct on(ct.subject_id=cs.id) where (ct.crawl_status=1 ) and ct.del=0 and ct.cid!=\"\" and unix_timestamp(ct.start_time)>'"+starttime+"';";
//subject_id=302896 and del=1 and crawl_status =1
List<Map<String, Object>> delsubjectTaskendList = DBUtil.getInstance("db_stat_alltask").query("select ct.crawl_content_key,ct.create_user_id,ct.app_id,cs.del,ct.external_id, ct.subject_id, ct.id, ct.cid, ct.crawl_data_flag,cs.kafka_switch,cs.kafka_addr,cs.go_fast_addr,cs.kafka_topic,cs.go_fast_switch from cl_subject cs Join cl_task ct on(ct.subject_id=cs.id) where (ct.crawl_status=0 ) and ct.del=1 and ct.cid!=\"\" and ct.subject_id=302896 and ct.del=1 and ct.crawl_status =0;");
for(Map<String, Object> delsubjectTask : delsubjectTaskendList){
String cid= (String) delsubjectTask.get("cid");
String crawl_data_flag= (String) delsubjectTask.get("crawl_data_flag");
// System.out.println("sq; si "+sql);
// List<Map<String, Object>> subjectTaskendList = DBUtil.getInstance("db_stat_alltask").query("select ct.crawl_content_key,ct.create_user_id,ct.app_id,cs.del,ct.external_id, ct.subject_id, ct.id, ct.cid, ct.crawl_data_flag,cs.kafka_switch,cs.kafka_addr,cs.go_fast_addr,cs.kafka_topic,cs.go_fast_switch from cl_subject cs Join cl_task ct on(ct.subject_id=cs.id) where (ct.crawl_status=1 ) and ct.del=0 and ct.cid!=\"\" and unix_timestamp(ct.start_time)>'"+starttime+"';");
List<Map<String, Object>> subjectTaskendList = DBUtil.getInstance("db_stat_alltask").query("select ct.crawl_content_key,ct.create_user_id,ct.app_id,cs.del,ct.external_id, ct.subject_id, ct.id, ct.cid, ct.crawl_data_flag,cs.kafka_switch,cs.kafka_addr,cs.go_fast_addr,cs.kafka_topic,cs.go_fast_switch from cl_subject cs Join cl_task ct on(ct.subject_id=cs.id) where (ct.crawl_status=1) and ct.del=0 and ct.cid='"+cid+"' and ct.subject_id!=302896 and ct.crawl_data_flag='"+crawl_data_flag+"';");
System.out.println(System.currentTimeMillis()+"执行mysql任务结束的时间");
subjectTaskMap.clear();
if(subjectTaskendList.size()>0){
String delkey = cid + "#####" + crawl_data_flag;
log.info(delkey.toLowerCase()+"====del");
RedisUtil.del(delkey.toLowerCase(), 10);
Thread.sleep(1000*5);
System.out.println(subjectTaskendList.size()+"任务的大小");
for(Map<String, Object> subjectTask : subjectTaskendList){
String key = "";
String keytwo = "";
if( subjectTask.get("cid").equals("Tmall")){
key = subjectTask.get("cid") + "#####" + subjectTask.get("crawl_data_flag");
keytwo = "Taobao"+ "#####" + subjectTask.get("crawl_data_flag");
}
else if (subjectTask.get("cid").equals("Taobao")){
key = subjectTask.get("cid") + "#####" + subjectTask.get("crawl_data_flag");
keytwo = "Tmall"+ "#####" + subjectTask.get("crawl_data_flag");
}
else {
key = subjectTask.get("cid") + "#####" + subjectTask.get("crawl_data_flag");
}
Map<String,String> value = new HashMap<>();
List<Map<String,String>> valueList = new ArrayList<>();
String v_subject_id = "";
String v_go_fast_addr = "";
String v_kafka_switch = "";
String v_kafka_addr = "";
String v_task_id = "";
String v_external_id ="";
String v_go_fast_switch="";
String v_kafka_topic="";
String v_status="";
String v_del="";
String v_create_user_id="";
String v_ocr="0";
String v_trans="0";
String v_crawl_content_key="";
String appid="";
if(null != subjectTask.get("subject_id")) {
v_subject_id = subjectTask.get("subject_id").toString();
}
if(null != subjectTask.get("crawl_content_key")) {
v_crawl_content_key = subjectTask.get("crawl_content_key").toString();
}
if(null != subjectTask.get("go_fast_addr")) {
v_go_fast_addr = subjectTask.get("go_fast_addr").toString();
}
if(null != subjectTask.get("kafka_addr")) {
v_kafka_addr = subjectTask.get("kafka_addr").toString();
}
if(null != subjectTask.get("kafka_switch")){
v_kafka_switch = subjectTask.get("kafka_switch").toString();
}
if(null !=subjectTask.get("id")){
v_task_id = subjectTask.get("id").toString();
}
if(null !=subjectTask.get("external_id")){
v_external_id = subjectTask.get("external_id").toString();
}
if(null !=subjectTask.get("go_fast_switch")){
v_go_fast_switch = subjectTask.get("go_fast_switch").toString();
}
if(null !=subjectTask.get("kafka_topic")){
v_kafka_topic = subjectTask.get("kafka_topic").toString();
}
if(null !=subjectTask.get("del")){
v_del = subjectTask.get("del").toString();
}
if(null !=subjectTask.get("create_user_id")){
v_create_user_id = subjectTask.get("create_user_id").toString();
}
if(null !=subjectTask.get("app_id")){
appid = subjectTask.get("app_id").toString();
}
value.put("appid", appid);
value.put("subject_id",v_subject_id);
value.put("go_fast_addr",v_go_fast_addr);
value.put("export_to_kafka",v_kafka_switch);
value.put("kafka_addr",v_kafka_addr);
// value.put("task_id",v_task_id);
value.put("external_id",v_external_id);
value.put("go_fast_switch",v_go_fast_switch);
value.put("kafka_topic",v_kafka_topic);
value.put("del",v_del);//专题的状态
value.put("crawl_content_key",v_crawl_content_key);
String newkey = key.toLowerCase();
String userkey=newkey;
//组装时间的参数
try {
if (!subjectTasktimelimiit.containsKey(userkey)) {//如果无最大和最小时间
Tasklimit.loadTask();
}
List<Map<String,String>>timelist=subjectTasktimelimiit.get(userkey);
if(timelist.size()==1){
for(Map<String, String> subjectTasktime : timelist){
value.put("maxtime",subjectTasktime.get("max_time").toString());
value.put("mintime",subjectTasktime.get("min_time").toString());
}
} else{
for(Map<String, String> subjectTasktime : timelist){
String subject_id=subjectTasktime.get("subject_id").toString();
if (v_subject_id.equals(subject_id)){
value.put("maxtime",subjectTasktime.get("max_time").toString());
value.put("mintime",subjectTasktime.get("min_time").toString());
}
}
}
} catch (Exception e) {
System.out.print("获取时间失败了"+subjectTask.get("crawl_data_flag"));
value.put("maxtime", String.valueOf(System.currentTimeMillis()));
value.put("mintime","0");
e.printStackTrace();
}
//
// //用户的权限
if (subjectuserlimiit.containsKey(v_create_user_id)){
Map<String,Object> permission= (Map<String, Object>) subjectuserlimiit.get(v_create_user_id);
v_ocr= permission.get("is_ocr").toString();
v_trans= permission.get("is_trans").toString();
}
value.put("is_ocr",v_ocr);
value.put("is_trans",v_trans);
Set keysSet = new HashSet();
//组装相同任务的任务id
if(subjectTaskMap.containsKey(newkey)){
valueList = subjectTaskMap.get(newkey);
for (Map<String, String> valuetask : valueList){
String task=valuetask.get("task_id")+","+v_task_id;
valuetask.put("task_id",task);
value.put("task_id",task);
}
valueList.add(value);
}else{
value.put("task_id",v_task_id);
valueList.add(value);
}
if(disposeCrawldataflag(newkey)) { //判断redis中的key
String getsubjectList=RedisUtil.get(newkey,10);
try {
List<Map<String, String>> subjectList = (List<Map<String, String>>) JsonUtils.parseArray(getsubjectList);
List<Map<String, String>> redistList=new ArrayList<>();
for(Map<String, String> redissubjectTask : subjectList){
String resubject_id=redissubjectTask.get("subject_id").toString();
// String reappid=redissubjectTask.get("appid").toString();
String maxtime="";
if(redissubjectTask.containsKey("maxtime")){
maxtime=redissubjectTask.get("maxtime").toString();
}
if(!resubject_id.equals(v_subject_id)){
redistList.add(redissubjectTask);
}
String keys=resubject_id+maxtime;
int beforeSize = keysSet.size();
keysSet.add(keys);
int afterSize = keysSet.size();
if(afterSize == beforeSize + 1){
valueList.add(redissubjectTask);
}
}
valueList.addAll(redistList);
} catch (Exception e) {
log.error("获取redis中的任务失败"+getsubjectList);
}
}
if(keytwo.length()>0){
String tmallnewkey = keytwo.toLowerCase();
subjectTaskMap.put(tmallnewkey,valueList);
}
subjectTaskMap.put(newkey,valueList);
//System.out.print(valueList);
//System.out.print(JsonUtils.toJSONString(subjectTaskMap));
Set keysSets = new HashSet();
for (String newkeya :subjectTaskMap.keySet()){
List<Map<String, String>> newkeyvalue=subjectTaskMap.get(newkeya);
List<Map<String, String>> setkeyvalue=new ArrayList<>();
for(Map<String, String> redissubjectTask : newkeyvalue){
String resubject_id=redissubjectTask.get("subject_id").toString();
String reappid=redissubjectTask.get("appid").toString();
String keys=resubject_id+reappid+newkeya;
int beforeSize = keysSets.size();
keysSets.add(keys);
int afterSize = keysSets.size();
if(afterSize == beforeSize + 1){
setkeyvalue.add(redissubjectTask);
}
}
String redis=newkeya+"@#@"+JsonUtils.toJSONString(setkeyvalue);
System.out.println(redis);
try {
Constants.getLineQueue().put(redis);
} catch (InterruptedException e) {
e.printStackTrace();
}
}
System.out.println(System.currentTimeMillis()+"任务组装结束的时间");
log.info("结束时间"+ DateUtil.getcurr());
log.info("当天任务的数量" + key + " ; data = " + subjectTaskMap.size());
// }else {
// String delkey = subjectendtTask.get("cid") + "#####" + subjectendtTask.get("crawl_data_flag");
// log.info(delkey.toLowerCase()+"====del");
// RedisUtil.del(delkey.toLowerCase(), 10);
// }
}
}else {
String delkey = cid + "#####" + crawl_data_flag;
log.info(delkey.toLowerCase()+"====del");
RedisUtil.del(delkey.toLowerCase(), 10);
Thread.sleep(1000*5);
}
}
Thread.sleep(1000*60*60);
}
} catch (Exception e) {
e.printStackTrace();
}
}
private boolean disposeCrawldataflag(String crawldataflag) {
try{
if (RedisUtil.exists(crawldataflag, 10)) { // 先去 redis中查询是否存在不存直接忽略
String value = RedisUtil.get(crawldataflag,10);
if(null != value && !("").equals(value)) {
return true;
}
} else {
log.error("[datasave] exec >>> 灌数:该 crwaldataflag 在 Redis 中不存在!!! keys = " + crawldataflag + " ; dbindex = " + 10);
return false;
}
return false;
}catch (Exception e){
e.printStackTrace();
return false;
}
}
public static void main(String[] args) {
long updatetime = new Date().getTime()/1000-30;
System.out.println(updatetime);
System.out.println(new Date().getTime()/1000);
}
}

36
cl_stream_datasave/src/main/java/com/bfd/mf/entity/mysql/si.java

@ -0,0 +1,36 @@
package com.bfd.mf.entity.mysql;
import com.bfd.mf.datasave.tools.DBUtil;
import java.util.List;
import java.util.Map;
public class si implements Runnable{
@Override
public void run() {
System.out.println("aaa");
List<Map<String, Object>> subjectTaskendList = DBUtil.getInstance("db_stat_alltask").query("SELECT create_user,id,external_id from intelligent_crawl.cl_task ct WHERE (create_user like '%SocialInsightPro%' or create_user like '%SocialInsightTe%' or create_user like '%si-osint%') and crawl_status =1 and del =0 and external_id like '%t_%'");
System.out.println((subjectTaskendList.size()));
if(subjectTaskendList.size()>0){
for(Map<String, Object> subjectendtTask : subjectTaskendList){
String external_id= (String) subjectendtTask.get("external_id");
String create_user= (String) subjectendtTask.get("create_user");
long idin= (long) subjectendtTask.get("id");
int id= Integer.parseInt(external_id.split("t_")[1]);
String sql="update all_task.cl_task set external_id='"+external_id+"',id='"+id+"' where create_user='"+create_user+"'and id='"+idin+"';";
System.out.println(sql);
}
}
}
}

172
cl_stream_datasave/src/main/java/com/bfd/mf/entity/mysql/taskdel.java

@ -0,0 +1,172 @@
package com.bfd.mf.entity.mysql;
import com.bfd.crawler.utils.JsonUtils;
import com.bfd.mf.datasave.tools.Constants;
import com.bfd.mf.datasave.tools.DBUtil;
import com.bfd.mf.datasave.tools.DateUtil;
import crawler.open.util.RedisUtil;
import org.apache.log4j.Logger;
import java.util.*;
import static com.bfd.mf.entity.mysql.Userlimit.subjectuserlimiit;
public class taskdel implements Runnable{
private static Logger log = Logger.getLogger(taskdel.class);
@Override
public void run() {
while (true) {
System.out.println("==========");
long updatetime = new Date().getTime()/1000-15;
List<Map<String, Object>> subjectTaskendList = DBUtil.getInstance("db_stat").query("select ct.crawl_content_key,ct.create_user_id,ct.app_id,cs.del,ct.crawl_start_time,ct.crawl_end_time,ct.external_id, ct.subject_id, ct.id, ct.cid, ct.crawl_data_flag,cs.kafka_switch,cs.kafka_addr,cs.go_fast_addr,cs.kafka_topic,cs.go_fast_switch from cl_subject cs Join cl_task ct on(ct.subject_id=cs.id) where ct.del=1 and ct.cid!=\"\" and ct.cid!='MUZX2WNM84L3ARXNSYN3' and unix_timestamp(ct.update_time)>'"+updatetime+"' ;");
if(subjectTaskendList.size()>0) {
System.out.println(subjectTaskendList);
System.out.println(subjectTaskendList.size() + "任务的大小");
for (Map<String, Object> subjectTask : subjectTaskendList) {
String key = "";
String keytwo = "";
if (subjectTask.get("cid").equals("Tmall")) {
key = subjectTask.get("cid") + "#####" + subjectTask.get("crawl_data_flag");
keytwo = "Taobao" + "#####" + subjectTask.get("crawl_data_flag");
} else if (subjectTask.get("cid").equals("Taobao")) {
key = subjectTask.get("cid") + "#####" + subjectTask.get("crawl_data_flag");
keytwo = "Tmall" + "#####" + subjectTask.get("crawl_data_flag");
} else {
key = subjectTask.get("cid") + "#####" + subjectTask.get("crawl_data_flag");
}
Map<String, String> value = new HashMap<>();
List<Map<String, String>> valueList = new ArrayList<>();
String v_subject_id = "";
String v_go_fast_addr = "";
String v_kafka_switch = "";
String v_kafka_addr = "";
String v_task_id = "";
String v_external_id = "";
String v_go_fast_switch = "";
String v_kafka_topic = "";
String v_status = "";
String v_del = "";
String v_create_user_id = "";
String v_ocr = "0";
String v_trans = "0";
String v_crawl_content_key = "";
String appid = "";
if (null != subjectTask.get("subject_id")) {
v_subject_id = subjectTask.get("subject_id").toString();
}
if (null != subjectTask.get("crawl_content_key")) {
v_crawl_content_key = subjectTask.get("crawl_content_key").toString();
}
if (null != subjectTask.get("go_fast_addr")) {
v_go_fast_addr = subjectTask.get("go_fast_addr").toString();
}
if (null != subjectTask.get("kafka_addr")) {
v_kafka_addr = subjectTask.get("kafka_addr").toString();
}
if (null != subjectTask.get("kafka_switch")) {
v_kafka_switch = subjectTask.get("kafka_switch").toString();
}
if (null != subjectTask.get("id")) {
v_task_id = subjectTask.get("id").toString();
}
if (null != subjectTask.get("external_id")) {
v_external_id = subjectTask.get("external_id").toString();
}
if (null != subjectTask.get("go_fast_switch")) {
v_go_fast_switch = subjectTask.get("go_fast_switch").toString();
}
if (null != subjectTask.get("kafka_topic")) {
v_kafka_topic = subjectTask.get("kafka_topic").toString();
}
if (null != subjectTask.get("del")) {
v_del = subjectTask.get("del").toString();
}
if (null != subjectTask.get("create_user_id")) {
v_create_user_id = subjectTask.get("create_user_id").toString();
}
if (null != subjectTask.get("app_id")) {
appid = subjectTask.get("app_id").toString();
}
value.put("appid", appid);
value.put("subject_id", v_subject_id);
value.put("go_fast_addr", v_go_fast_addr);
value.put("export_to_kafka", v_kafka_switch);
value.put("kafka_addr", v_kafka_addr);
// value.put("task_id",v_task_id);
value.put("external_id", v_external_id);
value.put("go_fast_switch", v_go_fast_switch);
value.put("kafka_topic", v_kafka_topic);
value.put("del", v_del);//专题的状态
value.put("crawl_content_key", v_crawl_content_key);
value.put("maxtime", subjectTask.get("crawl_end_time").toString());
value.put("mintime", subjectTask.get("crawl_start_time").toString());
String newkey = key.toLowerCase();
if (disposeCrawldataflag(newkey)) { //判断redis中的key
String getsubjectList = RedisUtil.get(newkey, 10);
try {
List<Map<String, String>> subjectList = (List<Map<String, String>>) JsonUtils.parseArray(getsubjectList);
List<Map<String, String>> redistList = new ArrayList<>();
for (Map<String, String> redissubjectTask : subjectList) {
String resubject_id = redissubjectTask.get("subject_id").toString();
String reappid = redissubjectTask.get("appid").toString();
String taskid = redissubjectTask.get("task_id").toString();
appid="SI_1";
if (!resubject_id.equals(v_subject_id) || !reappid.equals(appid) || !v_task_id.equals(taskid)) {
redistList.add(redissubjectTask);
}
}
String redis = newkey + "@#@" + JsonUtils.toJSONString(redistList);
if(redistList.size()>0){
try {
System.out.println(newkey+"写入redis是" + JsonUtils.toJSONString(redistList));
RedisUtil.set(newkey, JsonUtils.toJSONString(redistList), 10);
} catch (Exception e) {
e.printStackTrace();
}
}else {
System.out.println("删除redis是" +newkey);
RedisUtil.del(newkey, 10);
}
} catch (Exception e) {
log.error("获取redis中的任务失败" + getsubjectList);
}
}
System.out.println(System.currentTimeMillis() + "任务组装结束的时间");
log.info("结束时间" + DateUtil.getcurr());
log.info("当天任务的数量" + key + " ; data = " + subjectTaskendList.size());
}
}
try {
Thread.sleep(1000*5);
} catch (InterruptedException e) {
e.printStackTrace();
}
}
}
private boolean disposeCrawldataflag(String crawldataflag) {
try{
if (RedisUtil.exists(crawldataflag, 10)) { // 先去 redis中查询是否存在不存直接忽略
String value = RedisUtil.get(crawldataflag,10);
if(null != value && !("").equals(value)) {
return true;
}
} else {
log.error("[datasave] exec >>> 灌数:该 crwaldataflag 在 Redis 中不存在!!! keys = " + crawldataflag + " ; dbindex = " + 10);
return false;
}
return false;
}catch (Exception e){
e.printStackTrace();
return false;
}
}
}

31
cl_stream_datasave/src/main/java/com/bfd/mf/runstart/DelRunStartDataSave.java

@ -0,0 +1,31 @@
package com.bfd.mf.runstart;
import com.bfd.mf.datasave.tools.DBUtil;
import com.bfd.mf.entity.mysql.SubjectTask;
import com.bfd.mf.entity.mysql.taskdel;
import crawler.open.util.RedisUtil;
import org.apache.log4j.PropertyConfigurator;
public class DelRunStartDataSave {
private static String log4jPath = "../etc/log4j.properties";
private static String dbPath = "../etc/db.properties";
private static String redisPath = "../etc/145redis.properties";
static {
PropertyConfigurator.configureAndWatch(log4jPath);
DBUtil.init(dbPath);
RedisUtil.init(redisPath);
}
public static void main(String[] args) {
System.out.println("asdasdad");
for (int i = 0; i < 1; i ++) {
taskdel taskdel = new taskdel();
Thread del = new Thread(taskdel, "taskdel" + i);
del.start();
}
}
}

36
cl_stream_datasave/src/main/resources/META-INF/MANIFEST.MF

@ -0,0 +1,36 @@
Manifest-Version: 1.0
Main-Class: com.bfd.mf.runstart.DelRunStartDataSave
Class-Path: junit-4.13-beta-1.jar zkclient-0.10.jar lucene-core-7.2.1.ja
r netty-codec-4.1.16.Final.jar protobuf-java-3.19.4.jar lucene-spatial-
extras-7.2.1.jar utils-3.0.0.jar fastjson-1.1.22.jar mysql-connector-ja
va-8.0.29.jar netty-resolver-4.1.16.Final.jar lucene-spatial3d-7.2.1.ja
r commons-codec-1.10.jar elasticsearch-core-6.2.3.jar lz4-1.3.0.jar com
mons-lang3-3.1.jar lucene-join-7.2.1.jar reindex-client-6.2.3.jar snake
yaml-1.17.jar netty-codec-http-4.1.16.Final.jar hamcrest-core-1.3.jar l
ucene-misc-7.2.1.jar guava-14.0.1.jar lucene-suggest-7.2.1.jar hppc-0.7
.1.jar lucene-highlighter-7.2.1.jar httpasyncclient-4.1.2.jar netty-com
mon-4.1.16.Final.jar transport-6.2.3.jar log4j-api-2.9.1.jar HdrHistogr
am-2.1.9.jar kafka-0.10.jar compiler-0.9.3.jar lucene-memory-7.2.1.jar
elasticsearch-cli-6.2.3.jar aggs-matrix-stats-client-6.2.3.jar lucene-a
nalyzers-common-7.2.1.jar lucene-sandbox-7.2.1.jar jackson-dataformat-c
bor-2.8.10.jar elastiUtils-0.0.1-SNAPSHOT.jar httpcore-nio-4.4.5.jar co
mmons-logging-1.1.3.jar BfdRedisTools-2.0-1.0.0.jar slf4j-api-1.7.22.ja
r httpcore-4.4.5.jar snappy-java-1.1.2.6.jar jts-1.13.jar commons-pool2
-2.0.jar jodis-0.1.2.jar netty-handler-4.1.16.Final.jar metrics-core-2.
2.0.jar curator-client-2.7.0.jar transport-netty4-client-6.2.3.jar elas
ticsearch-6.2.3.jar httpclient-4.5.2.jar lang-mustache-client-6.2.3.jar
lucene-queryparser-7.2.1.jar jackson-dataformat-smile-2.8.10.jar kafka
_2.10-0.10.2.0.jar commons-lang-2.4.jar rank-eval-client-6.2.3.jar elas
ticsearch-rest-client-6.2.3.jar jackson-core-2.8.1.jar scala-library-2.
10.6.jar t-digest-3.0.jar spatial4j-0.6.jar securesm-1.2.jar curator-re
cipes-2.7.0.jar jedis-2.6.0.jar lucene-queries-7.2.1.jar curator-framew
ork-2.7.0.jar lucene-backward-codecs-7.2.1.jar parent-join-client-6.2.3
.jar jackson-dataformat-yaml-2.8.10.jar okio-1.11.0.jar netty-transport
-4.1.16.Final.jar jopt-simple-5.0.3.jar jackson-annotations-2.8.1.jar j
oda-time-2.9.9.jar zookeeper-3.4.6.jar okhttp-3.6.0.jar netty-buffer-4.
1.16.Final.jar log4j-core-2.9.1.jar slf4j-log4j12-1.7.21.jar jackson-da
tabind-2.8.1.jar lucene-spatial-7.2.1.jar percolator-client-6.2.3.jar n
etty-3.7.0.Final.jar log4j-1.2.17.jar lucene-grouping-7.2.1.jar elastic
search-rest-high-level-client-6.2.3.jar kafka-clients-0.10.2.0.jar jlin
e-0.9.94.jar jna-4.5.1.jar

BIN
cl_stream_datasave/target/cl_stream_datasave-2.0-SNAPSHOT.jar

BIN
cl_stream_datasave/target/cl_stream_datasave-2.0-SNAPSHOT.jar.original

36
cl_stream_datasave/target/classes/META-INF/MANIFEST.MF

@ -0,0 +1,36 @@
Manifest-Version: 1.0
Main-Class: com.bfd.mf.runstart.DelRunStartDataSave
Class-Path: junit-4.13-beta-1.jar zkclient-0.10.jar lucene-core-7.2.1.ja
r netty-codec-4.1.16.Final.jar protobuf-java-3.19.4.jar lucene-spatial-
extras-7.2.1.jar utils-3.0.0.jar fastjson-1.1.22.jar mysql-connector-ja
va-8.0.29.jar netty-resolver-4.1.16.Final.jar lucene-spatial3d-7.2.1.ja
r commons-codec-1.10.jar elasticsearch-core-6.2.3.jar lz4-1.3.0.jar com
mons-lang3-3.1.jar lucene-join-7.2.1.jar reindex-client-6.2.3.jar snake
yaml-1.17.jar netty-codec-http-4.1.16.Final.jar hamcrest-core-1.3.jar l
ucene-misc-7.2.1.jar guava-14.0.1.jar lucene-suggest-7.2.1.jar hppc-0.7
.1.jar lucene-highlighter-7.2.1.jar httpasyncclient-4.1.2.jar netty-com
mon-4.1.16.Final.jar transport-6.2.3.jar log4j-api-2.9.1.jar HdrHistogr
am-2.1.9.jar kafka-0.10.jar compiler-0.9.3.jar lucene-memory-7.2.1.jar
elasticsearch-cli-6.2.3.jar aggs-matrix-stats-client-6.2.3.jar lucene-a
nalyzers-common-7.2.1.jar lucene-sandbox-7.2.1.jar jackson-dataformat-c
bor-2.8.10.jar elastiUtils-0.0.1-SNAPSHOT.jar httpcore-nio-4.4.5.jar co
mmons-logging-1.1.3.jar BfdRedisTools-2.0-1.0.0.jar slf4j-api-1.7.22.ja
r httpcore-4.4.5.jar snappy-java-1.1.2.6.jar jts-1.13.jar commons-pool2
-2.0.jar jodis-0.1.2.jar netty-handler-4.1.16.Final.jar metrics-core-2.
2.0.jar curator-client-2.7.0.jar transport-netty4-client-6.2.3.jar elas
ticsearch-6.2.3.jar httpclient-4.5.2.jar lang-mustache-client-6.2.3.jar
lucene-queryparser-7.2.1.jar jackson-dataformat-smile-2.8.10.jar kafka
_2.10-0.10.2.0.jar commons-lang-2.4.jar rank-eval-client-6.2.3.jar elas
ticsearch-rest-client-6.2.3.jar jackson-core-2.8.1.jar scala-library-2.
10.6.jar t-digest-3.0.jar spatial4j-0.6.jar securesm-1.2.jar curator-re
cipes-2.7.0.jar jedis-2.6.0.jar lucene-queries-7.2.1.jar curator-framew
ork-2.7.0.jar lucene-backward-codecs-7.2.1.jar parent-join-client-6.2.3
.jar jackson-dataformat-yaml-2.8.10.jar okio-1.11.0.jar netty-transport
-4.1.16.Final.jar jopt-simple-5.0.3.jar jackson-annotations-2.8.1.jar j
oda-time-2.9.9.jar zookeeper-3.4.6.jar okhttp-3.6.0.jar netty-buffer-4.
1.16.Final.jar log4j-core-2.9.1.jar slf4j-log4j12-1.7.21.jar jackson-da
tabind-2.8.1.jar lucene-spatial-7.2.1.jar percolator-client-6.2.3.jar n
etty-3.7.0.Final.jar log4j-1.2.17.jar lucene-grouping-7.2.1.jar elastic
search-rest-high-level-client-6.2.3.jar kafka-clients-0.10.2.0.jar jlin
e-0.9.94.jar jna-4.5.1.jar

BIN
cl_stream_datasave/target/classes/com/bfd/mf/datasave/download/DownLoadFile.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/datasave/download/MyCookieJar.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/datasave/download/NewsDownload.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/datasave/download/Newscontent.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/datasave/download/OkHttpUtils.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/datasave/download/ProxyIp.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/datasave/download/test.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/datasave/kafka/IKafka.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/datasave/kafka/ReadKafka.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/datasave/listen/DataSaveManager.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/datasave/listen/ListenKafkaManager.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/datasave/listen/ListenTaskManager.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/datasave/listen/ListenfastTaskManager.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/datasave/tools/Constants.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/datasave/tools/DBConnectionManager$DBConnectionPool.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/datasave/tools/DBConnectionManager.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/datasave/tools/DBUtil.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/datasave/tools/DataCheckUtil.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/datasave/tools/DataProcess.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/datasave/tools/DateUtil.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/datasave/tools/PropertiesUtil.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/datasave/tools/ReadLine.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/datasave/tools/WriteMethod.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/entity/AllKeys.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/entity/DataSaveManager.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/entity/FieldInfo.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/entity/FieldNormaliz.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/entity/ReaultInfo.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/entity/impl/DataSaveManagerImpl.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/entity/mysql/FiledTableInfo.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/entity/mysql/SubjectTask.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/entity/mysql/SubjectTaskdele.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/entity/mysql/SubjectTaskdelone.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/entity/mysql/Tasklimit.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/entity/mysql/Userlimit.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/entity/mysql/cl_task.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/entity/mysql/si.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/entity/mysql/taskdel.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/runstart/DelRunStartDataSave.class

BIN
cl_stream_datasave/target/classes/com/bfd/mf/runstart/RunStartDataSave.class

BIN
cl_stream_datasave/target/gxcl_stream_datasave-2.0-SNAPSHOT.jar

5
cl_stream_datasave/target/maven-archiver/pom.properties

@ -0,0 +1,5 @@
#Generated by Maven
#Mon Oct 31 11:59:19 CST 2022
version=2.0-SNAPSHOT
groupId=com.bfd.mf
artifactId=cl_stream_datasave

36
cl_stream_datasave/target/maven-status/maven-compiler-plugin/compile/default-compile/createdFiles.lst

@ -0,0 +1,36 @@
com/bfd/mf/entity/FieldInfo.class
com/bfd/mf/datasave/tools/DBConnectionManager.class
com/bfd/mf/datasave/tools/Constants.class
com/bfd/mf/entity/FieldNormaliz.class
com/bfd/mf/runstart/RunStartDataSave.class
com/bfd/mf/datasave/tools/DataProcess.class
com/bfd/mf/datasave/kafka/IKafka.class
com/bfd/mf/datasave/listen/ListenKafkaManager.class
com/bfd/mf/entity/mysql/SubjectTask.class
com/bfd/mf/datasave/download/OkHttpUtils.class
com/bfd/mf/datasave/listen/ListenTaskManager.class
com/bfd/mf/datasave/kafka/ReadKafka.class
com/bfd/mf/datasave/listen/DataSaveManager.class
com/bfd/mf/datasave/download/test.class
com/bfd/mf/datasave/download/MyCookieJar.class
com/bfd/mf/datasave/tools/WriteMethod.class
com/bfd/mf/datasave/tools/PropertiesUtil.class
com/bfd/mf/entity/mysql/Userlimit.class
com/bfd/mf/datasave/tools/ReadLine.class
com/bfd/mf/entity/mysql/cl_task.class
com/bfd/mf/datasave/download/ProxyIp.class
com/bfd/mf/entity/impl/DataSaveManagerImpl.class
com/bfd/mf/entity/AllKeys.class
com/bfd/mf/datasave/tools/DBUtil.class
com/bfd/mf/entity/mysql/SubjectTaskdelone.class
com/bfd/mf/datasave/listen/ListenfastTaskManager.class
com/bfd/mf/entity/DataSaveManager.class
com/bfd/mf/datasave/download/NewsDownload.class
com/bfd/mf/entity/mysql/Tasklimit.class
com/bfd/mf/datasave/download/DownLoadFile.class
com/bfd/mf/datasave/tools/DateUtil.class
com/bfd/mf/datasave/tools/DBConnectionManager$DBConnectionPool.class
com/bfd/mf/entity/mysql/FiledTableInfo.class
com/bfd/mf/datasave/download/Newscontent.class
com/bfd/mf/entity/ReaultInfo.class
com/bfd/mf/datasave/tools/DataCheckUtil.class

39
cl_stream_datasave/target/maven-status/maven-compiler-plugin/compile/default-compile/inputFiles.lst

@ -0,0 +1,39 @@
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/datasave/download/MyCookieJar.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/entity/FieldNormaliz.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/entity/mysql/SubjectTask.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/entity/impl/DataSaveManagerImpl.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/datasave/tools/DataCheckUtil.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/datasave/listen/testkongtianyuan.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/datasave/tools/PropertiesUtil.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/entity/DataSaveManager.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/datasave/download/test.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/entity/ReaultInfo.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/datasave/tools/DataProcess.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/datasave/download/ProxyIp.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/datasave/kafka/IKafka.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/entity/mysql/Userlimit.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/datasave/tools/Constants.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/datasave/listen/DataSaveManager_kongtianyuan.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/datasave/tools/DateUtil.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/entity/FieldInfo.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/entity/mysql/FiledTableInfo.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/entity/mysql/cl_task.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/datasave/tools/WriteMethod.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/datasave/download/OkHttpUtils.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/datasave/download/Newscontent.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/datasave/download/DownLoadFile.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/datasave/tools/ReadFile1125.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/datasave/tools/DBConnectionManager.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/datasave/tools/ReadLine.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/datasave/listen/ListenTaskManager.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/datasave/listen/ListenfastTaskManager.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/entity/AllKeys.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/datasave/kafka/ReadKafka.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/entity/mysql/Tasklimit.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/runstart/TaskFileUtils.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/datasave/download/NewsDownload.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/runstart/RunStartDataSave.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/datasave/tools/DBUtil.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/datasave/listen/ListenKafkaManager.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/datasave/listen/DataSaveManager.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/main/java/com/bfd/mf/runstart/GeterExit.java

2
cl_stream_datasave/target/maven-status/maven-compiler-plugin/testCompile/default-testCompile/createdFiles.lst

@ -0,0 +1,2 @@
CreatIndex.class
Test1.class

3
cl_stream_datasave/target/maven-status/maven-compiler-plugin/testCompile/default-testCompile/inputFiles.lst

@ -0,0 +1,3 @@
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/test/java/CreatIndex.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/test/java/AboutMysql.java
/Users/zhichengzhang/Desktop/公司/查询服务/datastreamfast/SocialX_Stream_1.0/cl_stream_datasave/src/test/java/Test1.java

BIN
cl_stream_datasave/target/test-classes/CreatIndex.class

BIN
cl_stream_datasave/target/test-classes/Test1.class

Loading…
Cancel
Save