Browse Source

20210607-v1

崔老师项目版本代码
release-1.0
杜静 4 years ago
parent
commit
27b846360a
  1. 10
      cl_query_data_job/src/main/java/com/bfd/mf/job/service/backtrace/BacktraceService.java
  2. 4
      cl_query_data_job/src/main/java/com/bfd/mf/job/service/query/QueryService.java
  3. 25
      cl_query_data_job/src/main/java/com/bfd/mf/job/service/statistics/StatisticsService.java
  4. 33
      cl_query_data_job/src/main/resources/application.yml
  5. 4
      cl_search_api/src/main/java/com/bfd/mf/common/util/es/EsUtils.java
  6. 10
      cl_search_api/src/main/java/com/bfd/mf/controller/SearchDataController.java
  7. 4
      cl_search_api/src/main/resources/application.yml
  8. 4
      logs/sdkclient_error.log
  9. 0
      logs/sdkclient_error.log.2021-05-12-14

10
cl_query_data_job/src/main/java/com/bfd/mf/job/service/backtrace/BacktraceService.java

@ -53,12 +53,12 @@ public class BacktraceService {
@PostConstruct @PostConstruct
public void init() { public void init() {
// 注册数据查询来源 // 注册数据查询来源
EsUtils.registerCluster(config.esNormalClusterName(), config.esNormalAddress());// 配置文件中的 es-source
// EsUtils.registerCluster(config.esNormalClusterName(), config.esNormalAddress());// 配置文件中的 es-source
EsUtils.registerCluster(config.esMiniClusterName(), config.esMiniAddress()); // 配置文件中的 es-target EsUtils.registerCluster(config.esMiniClusterName(), config.esMiniAddress()); // 配置文件中的 es-target
pRateLimiter = RateLimiter.create(1.0D / config.getPeriodS());
cRateLimiter = RateLimiter.create(1.0D / config.getPeriodS());
dataRateLimiter = RateLimiter.create(config.esMiniBulkRate());
// kafkaProducer = Kafka010Utils.getProducer(config.getBrokerList());
// pRateLimiter = RateLimiter.create(1.0D / config.getPeriodS());
// cRateLimiter = RateLimiter.create(1.0D / config.getPeriodS());
// dataRateLimiter = RateLimiter.create(config.esMiniBulkRate());
// kafkaProducer = Kafka010Utils.getProducer(config.getBrokerList());
} }
/* /*

4
cl_query_data_job/src/main/java/com/bfd/mf/job/service/query/QueryService.java

@ -61,9 +61,9 @@ public class QueryService {
@PostConstruct @PostConstruct
public void init() { public void init() {
// 注册数据查询来源 // 注册数据查询来源
EsUtils.registerCluster(config.esNormalClusterName(), config.esNormalAddress());// 配置文件中的 es-source
// EsUtils.registerCluster(config.esNormalClusterName(), config.esNormalAddress());// 配置文件中的 es-source
EsUtils.registerCluster(config.esMiniClusterName(), config.esMiniAddress()); // 配置文件中的 es-target EsUtils.registerCluster(config.esMiniClusterName(), config.esMiniAddress()); // 配置文件中的 es-target
pRateLimiter = RateLimiter.create(1.0D / config.getPeriodS());
// pRateLimiter = RateLimiter.create(1.0D / config.getPeriodS());
kafkaProducer = Kafka010Utils.getProducer(config.getBrokerList()); kafkaProducer = Kafka010Utils.getProducer(config.getBrokerList());
// cRateLimiter = RateLimiter.create(1.0D / config.getPeriodS()); // cRateLimiter = RateLimiter.create(1.0D / config.getPeriodS());

25
cl_query_data_job/src/main/java/com/bfd/mf/job/service/statistics/StatisticsService.java

@ -38,7 +38,7 @@ public class StatisticsService {
@PostConstruct @PostConstruct
public void init() { public void init() {
// 注册数据查询来源 // 注册数据查询来源
EsUtils.registerCluster(config.esNormalClusterName(), config.esNormalAddress());// 配置文件中的 es-source
// EsUtils.registerCluster(config.esNormalClusterName(), config.esNormalAddress());// 配置文件中的 es-source
EsUtils.registerCluster(config.esMiniClusterName(), config.esMiniAddress()); // 配置文件中的 es-target EsUtils.registerCluster(config.esMiniClusterName(), config.esMiniAddress()); // 配置文件中的 es-target
} }
@ -49,14 +49,14 @@ public class StatisticsService {
LOGGER.info("------------------------------------------------------------------ StatisticsService ------------------------------------------------------"); LOGGER.info("------------------------------------------------------------------ StatisticsService ------------------------------------------------------");
long start = System.currentTimeMillis(); long start = System.currentTimeMillis();
//-------统计134上的总量------------------------------------------------------------------------------------ //-------统计134上的总量------------------------------------------------------------------------------------
String clusterName = config.esNormalClusterName(); // 获得 134 clusterName
statisticsTotal(clusterName);
// String clusterName = config.esNormalClusterName(); // 获得 134 clusterName
//statisticsTotal(clusterName);
long end = System.currentTimeMillis(); long end = System.currentTimeMillis();
LOGGER.info("Statistics Total, took:{} ms.",(end - start)); LOGGER.info("Statistics Total, took:{} ms.",(end - start));
//-------统计147上的 每个任务的总量------------------------------------------------------------------------- //-------统计147上的 每个任务的总量-------------------------------------------------------------------------
start = System.currentTimeMillis(); start = System.currentTimeMillis();
clusterName = config.esMiniClusterName(); // 获得 147 clusterName
String clusterName = config.esMiniClusterName(); // 获得 147 clusterName
statisticsTask(clusterName); statisticsTask(clusterName);
end = System.currentTimeMillis(); end = System.currentTimeMillis();
LOGGER.info("Statistics Task, took:{} ms.",(end - start)); LOGGER.info("Statistics Task, took:{} ms.",(end - start));
@ -71,13 +71,13 @@ public class StatisticsService {
end = System.currentTimeMillis(); end = System.currentTimeMillis();
LOGGER.info("Statistics Subject Normal, took:{} ms.",(end - start)); LOGGER.info("Statistics Subject Normal, took:{} ms.",(end - start));
// 如果是欧莱雅任务的得用这个方式统计呀 // 如果是欧莱雅任务的得用这个方式统计呀
start = System.currentTimeMillis();
List<BigInteger> subjectIds1 = subjectRepository.findAllOlySubjectIds();
for (BigInteger subjectId: subjectIds1) {
statisticsSubject(subjectId,clusterName);
}
end = System.currentTimeMillis();
LOGGER.info("Statistics Subject OLY, took:{} ms.",(end - start));
// start = System.currentTimeMillis();
// List<BigInteger> subjectIds1 = subjectRepository.findAllOlySubjectIds();
// for (BigInteger subjectId: subjectIds1) {
// statisticsSubject(subjectId,clusterName);
// }
// end = System.currentTimeMillis();
// LOGGER.info("Statistics Subject OLY, took:{} ms.",(end - start));
} }
@ -151,7 +151,7 @@ public class StatisticsService {
}else{ }else{
siteTodayCount = 0; siteTodayCount = 0;
} }
switch (i) {
switch (i) { //
case 0: case 0:
subjectCrawlDatFlagMap.put("keyword", siteCount); subjectCrawlDatFlagMap.put("keyword", siteCount);
subjectCrawlDataFlagTodayMap.put("keyword", siteTodayCount); subjectCrawlDataFlagTodayMap.put("keyword", siteTodayCount);
@ -238,6 +238,7 @@ public class StatisticsService {
List<Task> taskList = taskRepository.findAllBydel0(); List<Task> taskList = taskRepository.findAllBydel0();
// 遍历任务List 根据条件组装ES查询语句去对应的索引下查结果然后回写到任务表中 // 遍历任务List 根据条件组装ES查询语句去对应的索引下查结果然后回写到任务表中
for (Task task: taskList) { for (Task task: taskList) {
System.out.println(" 任务ID ===== " + task);
Long taskId = task.getId().longValue(); Long taskId = task.getId().longValue();
String crawlDataFlag = task.getCrawlDataFlag(); String crawlDataFlag = task.getCrawlDataFlag();
String indexNamePre = config.getIndexNamePre(); String indexNamePre = config.getIndexNamePre();

33
cl_query_data_job/src/main/resources/application.yml

@ -6,9 +6,9 @@ logging:
spring: spring:
datasource: datasource:
driver-class-name: com.mysql.jdbc.Driver driver-class-name: com.mysql.jdbc.Driver
username: root
password: Bfd123!@#
url: jdbc:mysql://172.18.1.134:3306/intelligent_crawl?useOldAliasMetadataBehavior=true&characterEncoding=UTF-8&zeroDateTimeBehavior=round
username: crawl
password: crawl
url: jdbc:mysql://172.18.1.181:3306/intelligent_crawl?useOldAliasMetadataBehavior=true&characterEncoding=UTF-8&zeroDateTimeBehavior=round
hikari: hikari:
maximum-pool-size: 10 maximum-pool-size: 10
minimum-idle: 1 minimum-idle: 1
@ -29,14 +29,14 @@ worker:
## 服务的状态,true 为启动 ## 服务的状态,true 为启动
enable-analysis-producer: false enable-analysis-producer: false
enable-analysis-consumer: false enable-analysis-consumer: false
enable-statistics-producer: false
enable-statistics-producer: true
enable-query-producer: false enable-query-producer: false
enable-backtrace-producer: false enable-backtrace-producer: false
enable-rw-oly-producer: false enable-rw-oly-producer: false
enable-up-load-producer: false enable-up-load-producer: false
enable-output-producer: false enable-output-producer: false
enable-taskcount-producer: false enable-taskcount-producer: false
enable-alarm-producer: true
enable-alarm-producer: false
## 启动服务的线程数 ## 启动服务的线程数
statistics-producer-thread-count: 1 statistics-producer-thread-count: 1
query-producer-thread-count: 10 query-producer-thread-count: 10
@ -64,6 +64,29 @@ worker:
uploadZipPath : /opt/nfsdata/uploadFiles/ uploadZipPath : /opt/nfsdata/uploadFiles/
indexNamePre : cl_major_ indexNamePre : cl_major_
# es-normal:
# name: SQ_Normal
# address: 172.16.10.61:9301
# upper: 2000-01-01
# standby: cl_major_*
# es-reply-source:
# name: SQ_Normal
# address: 172.16.10.61:9301
# upper: 2000-01-01
# standby: cl_major_*
# es-mini:
# name: SQ_Normal
# address: 172.16.10.61:9301
# bulk-thread-count: 5
# bulk-rate: 3
# bulk-size: 100
# es-logstash:
# name: SQ_Normal
# address: 172.16.10.61:9301
# upper: 2021-01-01
# standby: logstash-2021.05.13
es-normal: es-normal:
name: SQ_Normal_new name: SQ_Normal_new
address: 172.18.1.134:9301 address: 172.18.1.134:9301

4
cl_search_api/src/main/java/com/bfd/mf/common/util/es/EsUtils.java

@ -183,7 +183,7 @@ public abstract class EsUtils {
.setQuery(boolQueryBuilder) .setQuery(boolQueryBuilder)
.setSearchType(SearchType.DEFAULT) .setSearchType(SearchType.DEFAULT)
.setSize(limit) .setSize(limit)
.setScroll(new TimeValue(20000))
.setScroll(new TimeValue(300000))
.execute() .execute()
.actionGet();//注意:首次搜索并不包含数据 .actionGet();//注意:首次搜索并不包含数据
}catch (Exception e){ }catch (Exception e){
@ -195,7 +195,7 @@ public abstract class EsUtils {
try { try {
searchResponse = client searchResponse = client
.prepareSearchScroll(scrollId) .prepareSearchScroll(scrollId)
.setScroll(new TimeValue(20000))
.setScroll(new TimeValue(300000))
.execute() .execute()
.actionGet(); .actionGet();
} catch (Exception e) { } catch (Exception e) {

10
cl_search_api/src/main/java/com/bfd/mf/controller/SearchDataController.java

@ -34,8 +34,6 @@ public class SearchDataController {
@Autowired @Autowired
private SearchDataService searchDataService; private SearchDataService searchDataService;
@Autowired @Autowired
private SiteRepository siteRepository;
@Autowired
private UpdateService updateService; private UpdateService updateService;
@ -58,13 +56,9 @@ public class SearchDataController {
}else if(subjectId.equals("")){ // 没有专题 }else if(subjectId.equals("")){ // 没有专题
result.put(ESConstant.ALLDOCNUMBER,0L); result.put(ESConstant.ALLDOCNUMBER,0L);
result.put(ESConstant.MONITORLISTS,new ArrayList<>()); result.put(ESConstant.MONITORLISTS,new ArrayList<>());
}else{ // 专题数据导出
//Integer searchType = queryRequest.getSearchType();
// if(searchType == 0) {
// result = searchDataService.exportDataInSubjectIndexTestGroupBy(queryRequest);
// }else{
}else{
// 专题数据导出
result = searchDataService.exportDataInSubjectIndex(queryRequest); result = searchDataService.exportDataInSubjectIndex(queryRequest);
// }
} }
return ResponseWrapper.buildResponse(RTCodeEnum.C_OK, result); return ResponseWrapper.buildResponse(RTCodeEnum.C_OK, result);
}else { }else {

4
cl_search_api/src/main/resources/application.yml

@ -11,8 +11,8 @@ spring:
datasource: datasource:
driver-class-name: com.mysql.jdbc.Driver driver-class-name: com.mysql.jdbc.Driver
username: root username: root
password: bfd123
url: jdbc:mysql://172.26.11.113:3306/intelligent_crawl_item?useOldAliasMetadataBehavior=true&characterEncoding=UTF-8&zeroDateTimeBehavior=round
password: Bfd123!@#
url: jdbc:mysql://172.18.1.134:3306/intelligent_crawl?useOldAliasMetadataBehavior=true&characterEncoding=UTF-8&zeroDateTimeBehavior=round
hikari: hikari:
maximum-pool-size: 10 maximum-pool-size: 10

4
logs/sdkclient_error.log

@ -1,4 +0,0 @@
2021-05-22 17:21:45,031 ERROR [com.bfd.mf.job.util.EMailUtils] EMailUtils:sendEmail error. title:{cid=Nreuters} emailList:[jing.du@percent.cn]
2021-05-22 17:21:45,039 ERROR [com.bfd.mf.job.util.EMailUtils] EMailUtils:sendEmail error. title:{cid=Nrusi} emailList:[jing.du@percent.cn]
2021-05-22 17:21:45,045 ERROR [com.bfd.mf.job.util.EMailUtils] EMailUtils:sendEmail error. title:{cid=Nusadefense} emailList:[jing.du@percent.cn]
2021-05-22 17:21:45,053 ERROR [com.bfd.mf.job.util.EMailUtils] EMailUtils:sendEmail error. title:{cid=Nenotrans} emailList:[jing.du@percent.cn]

0
logs/sdkclient_error.log.2021-05-12-14

Loading…
Cancel
Save