From 8f5cb469b825cce61734c84fd633f0dfc3000ee6 Mon Sep 17 00:00:00 2001 From: guyue <1721849008@qq.com> Date: 星期二, 08 七月 2025 18:50:01 +0800 Subject: [PATCH] 第三方接口请求数据完成 --- src/main/java/com/linghu/controller/CollectController.java | 305 +++++++++++++++++++++++++++----------------------- 1 files changed, 164 insertions(+), 141 deletions(-) diff --git a/src/main/java/com/linghu/controller/CollectController.java b/src/main/java/com/linghu/controller/CollectController.java index 434c9d6..e3bab81 100644 --- a/src/main/java/com/linghu/controller/CollectController.java +++ b/src/main/java/com/linghu/controller/CollectController.java @@ -3,13 +3,18 @@ import java.time.LocalDateTime; import java.time.format.DateTimeFormatter; import java.util.ArrayList; -import java.util.Date; import java.util.List; import java.util.Map; +import java.util.Optional; import java.util.stream.Collectors; import javax.servlet.http.HttpServletRequest; +import com.fasterxml.jackson.core.JsonProcessingException; +import com.fasterxml.jackson.databind.JsonNode; +import com.fasterxml.jackson.databind.ObjectMapper; +import com.linghu.model.dto.*; +import org.springframework.beans.BeanUtils; import org.springframework.beans.factory.annotation.Autowired; import org.springframework.beans.factory.annotation.Value; import org.springframework.core.ParameterizedTypeReference; @@ -21,8 +26,6 @@ import com.baomidou.mybatisplus.core.conditions.query.LambdaQueryWrapper; import com.baomidou.mybatisplus.core.conditions.update.LambdaUpdateWrapper; import com.linghu.model.common.ResponseResult; -import com.linghu.model.dto.HealthResponse; -import com.linghu.model.dto.SearchTaskRequest; import com.linghu.model.entity.Keyword; import com.linghu.model.entity.Question; import com.linghu.model.entity.User; @@ -30,23 +33,19 @@ import com.linghu.service.QuestionService; import com.linghu.service.ReferenceService; import com.linghu.utils.JwtUtils; -import com.linghu.model.dto.SearchTaskResponse; -import com.linghu.model.dto.TaskStatusResponse; -import com.linghu.model.dto.TaskCancelResponse; -import com.linghu.model.dto.TaskListResponse; import io.jsonwebtoken.lang.Collections; import io.swagger.annotations.Api; import io.swagger.annotations.ApiOperation; import reactor.core.publisher.Mono; -import org.springframework.web.bind.annotation.*; +import org.springframework.web.bind.annotation.* ; import org.springframework.http.HttpStatus; -import com.linghu.model.dto.TaskResultResponse; import com.linghu.model.dto.TaskResultResponse.QuestionResult; import com.linghu.model.dto.TaskResultResponse.UserResult; import com.linghu.model.entity.Reference; import java.util.stream.Collectors; +import java.util.stream.IntStream; @RestController @RequestMapping("/collect") @@ -71,25 +70,38 @@ @PostMapping("/search") @ApiOperation(value = "开始采集") - public Mono<ResponseResult<SearchTaskResponse>> createSearchTask( + public Mono<SearchTaskResponse> createSearchTask( @RequestBody SearchTaskRequest searchTaskRequest, - HttpServletRequest request) { + HttpServletRequest request) throws JsonProcessingException { String token = request.getHeader("Authorization"); User user = jwtUtils.parseToken(token); - List<User> users = new ArrayList<>(); - users.add(user); + // 复制到UserDto + UserDto userDto = new UserDto(); + userDto.setName(user.getUser_name()); + userDto.setEmail(user.getUser_email()); + userDto.setPassword(user.getPassword()); + + // List<User> users = new ArrayList<>(); + // users.add(user); + List<UserDto> users = new ArrayList<>(); + users.add(userDto); searchTaskRequest.setUsers(users); + // json格式 + ObjectMapper objectMapper = new ObjectMapper(); + System.out.println(objectMapper.writeValueAsString(searchTaskRequest)); return webClient.post() - .uri(baseUrl + "/search") + .uri(baseUrl + "/api/v1/search") .contentType(MediaType.APPLICATION_JSON) .bodyValue(searchTaskRequest) .retrieve() - .bodyToMono(new ParameterizedTypeReference<ResponseResult<SearchTaskResponse>>() { + .onStatus(HttpStatus::is4xxClientError, response -> response.bodyToMono(String.class) + .flatMap(errorBody -> Mono.error(new RuntimeException(errorBody)))) + .bodyToMono(new ParameterizedTypeReference<SearchTaskResponse>() { }) .flatMap(responseResult -> { // 提取任务ID - SearchTaskResponse taskResponse = responseResult.getData(); + SearchTaskResponse taskResponse = responseResult; if (taskResponse != null && taskResponse.getTask_id() != null) { // 保存任务ID到关键词 LambdaUpdateWrapper<Keyword> updateWrapper = new LambdaUpdateWrapper<>(); @@ -99,10 +111,13 @@ // 可选:更新响应中的其他信息 // taskResponse.setMessage("任务已提交并保存,ID: " + taskResponse.getTaskId()); } - return Mono.just(responseResult); + return Mono.just(taskResponse); }) .onErrorResume(e -> { - return Mono.just(ResponseResult.error("调用失败: " + e.getMessage())); + // return Mono.just(ResponseResult.error("调用失败: " + e.getMessage())); + SearchTaskResponse task = new SearchTaskResponse(); + task.setMessage("调用失败: " + e.getMessage()); + return Mono.just(task); }); } @@ -110,11 +125,11 @@ @GetMapping("/status") public Mono<TaskStatusResponse> getTaskStatus(String taskId) { return webClient.get() - .uri(baseUrl + "/tasks/" + taskId) + .uri(baseUrl + "/api/v1/tasks/" + taskId) .accept(MediaType.APPLICATION_JSON) .retrieve() - .onStatus(HttpStatus::is4xxClientError, response -> response.bodyToMono(String.class) - .flatMap(errorBody -> Mono.error(new RuntimeException("任务不存在: " + errorBody)))) + .onStatus(HttpStatus::is4xxClientError, response -> response.bodyToMono(TaskStatusResponse.class) + .flatMap(errorBody -> Mono.error(new RuntimeException(errorBody.getDetail())))) .bodyToMono(TaskStatusResponse.class) .flatMap(result -> { TaskStatusResponse taskStatusResponse = result; @@ -130,6 +145,15 @@ questionService.updateBatchById(updateQuestions); } return Mono.just(result); + }) + .onErrorResume(e -> { + // 创建一个自定义的错误响应对象 + TaskStatusResponse errorResponse = new TaskStatusResponse(); + errorResponse.setStatus("ERROR"); + errorResponse.setMessage(e.getMessage()); + errorResponse.setDetail(e.getMessage()); + + return Mono.just(errorResponse); }); } @@ -137,20 +161,12 @@ @ApiOperation(value = "取消任务") public Mono<ResponseResult<TaskCancelResponse>> cancelTask(@PathVariable String taskId) { return webClient.post() - .uri(baseUrl + "/tasks/" + taskId + "/cancel") + .uri(baseUrl + "/api/v1/tasks/" + taskId + "/cancel") .contentType(MediaType.APPLICATION_JSON) .bodyValue(Collections.emptyMap()) // 添加空请求体 .retrieve() - .onStatus(HttpStatus::isError, response -> { - if (response.statusCode() == HttpStatus.NOT_FOUND) { - return response.bodyToMono(String.class) - .flatMap(errorBody -> Mono.error(new RuntimeException("任务不存在"))); - } else if (response.statusCode() == HttpStatus.BAD_REQUEST) { - return response.bodyToMono(String.class) - .flatMap(errorBody -> Mono.error(new RuntimeException("任务已经完成,无法取消"))); - } - return response.createException().flatMap(Mono::error); - }) + .onStatus(HttpStatus::isError, response -> response.bodyToMono(TaskCancelResponse.class) + .flatMap(errorBody -> Mono.error(new RuntimeException(errorBody.getDetail())))) .bodyToMono(TaskCancelResponse.class) .map(data -> ResponseResult.success(data)) .onErrorResume(e -> { @@ -165,9 +181,9 @@ @ApiOperation(value = "获取任务结果") @GetMapping("/tasks/{taskId}") - public Mono<ResponseResult<TaskResultResponse>> getTaskResult(@PathVariable String taskId) { + public Mono<TaskResultResponse> getTaskResult(@PathVariable String taskId) { return webClient.get() - .uri(baseUrl + "/tasks/" + taskId + "/result") + .uri(baseUrl + "/api/v1/tasks/" + taskId + "/result") .accept(MediaType.APPLICATION_JSON) .retrieve() .onStatus(HttpStatus::is4xxClientError, response -> { @@ -180,10 +196,9 @@ } return response.createException().flatMap(Mono::error); }) - .bodyToMono(new ParameterizedTypeReference<ResponseResult<TaskResultResponse>>() { - }) + .bodyToMono(TaskResultResponse.class) .flatMap(responseResult -> { - TaskResultResponse result = responseResult.getData(); + TaskResultResponse result = responseResult; if (result != null && result.getResults() != null) { return updateQuestionAndReference(result) .thenReturn(responseResult); @@ -192,77 +207,77 @@ }) .onErrorResume(e -> { System.out.println("获取任务结果失败"); - return Mono.just(ResponseResult.error(e.getMessage())); + TaskResultResponse result = new TaskResultResponse(); + result.setDetail("获取任务结果失败: " + e.getMessage()); + return Mono.just(result); }); } - /* - * private Mono<Void> updateQuestionAndReference(TaskResultResponse result) { - * return Mono.fromRunnable(() -> { - * // 1. 更新关键词状态 - * LambdaUpdateWrapper<Keyword> keywordUpdate = new LambdaUpdateWrapper<>(); - * keywordUpdate.eq(Keyword::getTask_id, result.getTask_id()) - * .set(Keyword::getStatus, "completed"); - * keywordService.update(keywordUpdate); - * - * // 查询关键词ID - * LambdaQueryWrapper<Keyword> keywordQuery = new LambdaQueryWrapper<>(); - * keywordQuery.eq(Keyword::getTask_id, result.getTask_id()); - * Keyword keyword = keywordService.getOne(keywordQuery); - * - * if (keyword == null) { - * System.out.println("未找到关联的关键词,task_id: " + result.getTask_id()); - * return; - * } - * - * // 2. 处理每个用户的问题结果 - * for (UserResult userResult : result.getResults()) { - * for (QuestionResult questionResult : userResult.getQuestions_results()) { - * // 2.1 查询问题ID - * LambdaQueryWrapper<Question> queryWrapper = new LambdaQueryWrapper<>(); - * queryWrapper.eq(Question::getQuestion, questionResult.getQuestion()) - * .eq(Question::getKeyword_id, keyword.getKeyword_id()); - * Question question = questionService.getOne(queryWrapper); - * - * if (question != null) { - * // 更新问题状态 - * LambdaUpdateWrapper<Question> updateWrapper = new LambdaUpdateWrapper<>(); - * updateWrapper.eq(Question::getQuestion_id, question.getQuestion_id()) - * .set(Question::getStatus, questionResult.getStatus()) - * .set(Question::getResponse, questionResult.getResponse()) - * .set(Question::getExtracted_count, questionResult.getExtracted_count()) - * .set(Question::getError, questionResult.getError()) - * .set(Question::getTimestamp, LocalDateTime.parse( - * questionResult.getTimestamp(), - * DateTimeFormatter.ofPattern("yyyy-MM-dd'T'HH:mm:ss.SSSSSS") - * )); - * questionService.update(updateWrapper); - * - * // 2.2 保存引用数据 - * List<Reference> references = questionResult.getReferences().stream() - * .map(ref -> { - * Reference reference = new Reference(); - * reference.setQuestion_id(question.getQuestion_id()); - * reference.setTitle(ref.getTitle()); - * reference.setUrl(ref.getUrl()); - * reference.setDomain(ref.getDomain()); - * reference.setCreate_time(new Date()); - * return reference; - * }) - * .collect(Collectors.toList()); - * - * if (!references.isEmpty()) { - * referenceService.saveBatch(references); - * } - * } else { - * System.out.println("未找到匹配的问题,question " + question.getQuestion()); - * - * } - * } - * } - * }); - * } - */ +// private Mono<Void> updateQuestionAndReference(TaskResultResponse result) { +// return Mono.fromRunnable(() -> { +// // 1. 更新关键词状态 +// LambdaUpdateWrapper<Keyword> keywordUpdate = new LambdaUpdateWrapper<>(); +// keywordUpdate.eq(Keyword::getTask_id, result.getTask_id()) +// .set(Keyword::getStatus, "completed"); +// keywordService.update(keywordUpdate); +// +// // 查询关键词ID +// LambdaQueryWrapper<Keyword> keywordQuery = new LambdaQueryWrapper<>(); +// keywordQuery.eq(Keyword::getTask_id, result.getTask_id()); +// Keyword keyword = keywordService.getOne(keywordQuery); +// +// if (keyword == null) { +// System.out.println("未找到关联的关键词,task_id: " + result.getTask_id()); +// return; +// } +// +// // 2. 处理每个用户的问题结果 +// for (UserResult userResult : result.getResults()) { +// for (QuestionResult questionResult : userResult.getQuestions_results()) { +// // 2.1 查询问题ID +// LambdaQueryWrapper<Question> queryWrapper = new LambdaQueryWrapper<>(); +// queryWrapper.eq(Question::getQuestion, questionResult.getQuestion()) +// .eq(Question::getKeyword_id, keyword.getKeyword_id()); +// Question question = questionService.getOne(queryWrapper); +// +// if (question != null) { +// // 更新问题状态 +// LambdaUpdateWrapper<Question> updateWrapper = new LambdaUpdateWrapper<>(); +// updateWrapper.eq(Question::getQuestion_id, question.getQuestion_id()) +// .set(Question::getStatus, questionResult.getStatus()) +// .set(Question::getResponse, questionResult.getResponse()) +// .set(Question::getExtracted_count, questionResult.getExtracted_count()) +// .set(Question::getError, questionResult.getError()) +// .set(Question::getTimestamp, LocalDateTime.parse( +// questionResult.getTimestamp(), +// DateTimeFormatter.ofPattern("yyyy-MM-dd'T'HH:mm:ss.SSSSSS") +// )); +// questionService.update(updateWrapper); +// +// // 2.2 保存引用数据 +// List<Reference> references = questionResult.getReferences().stream() +// .map(ref -> { +// Reference reference = new Reference(); +// reference.setQuestion_id(question.getQuestion_id()); +// reference.setTitle(ref.getTitle()); +// reference.setUrl(ref.getUrl()); +// reference.setDomain(ref.getDomain()); +// reference.setCreate_time(LocalDateTime.now()); +// return reference; +// }) +// .collect(Collectors.toList()); +// +// if (!references.isEmpty()) { +// referenceService.saveBatch(references); +// } +// } else { +// System.out.println("未找到匹配的问题,question " + question.getQuestion()); +// +// } +// } +// } +// }); +// } private Mono<Void> updateQuestionAndReference(TaskResultResponse result) { return Mono.fromRunnable(() -> { @@ -279,12 +294,11 @@ Keyword keyword = keywordService.getOne(keywordQuery); if (keyword == null) { - // log.error("未找到关联的关键词,task_id: {}", result.getTask_id()); System.out.println("未找到关联的关键词,task_id: " + result.getTask_id()); return; } - // 2. 批量查询所有问题(假设Question有task_id和keyword_id字段) + // 2. 批量查询所有问题 LambdaQueryWrapper<Question> queryWrapper = new LambdaQueryWrapper<>(); queryWrapper.eq(Question::getKeyword_id, keyword.getKeyword_id()); List<Question> questions = questionService.list(queryWrapper); @@ -297,7 +311,7 @@ List<Question> questionsToUpdate = new ArrayList<>(); List<Reference> allReferences = new ArrayList<>(); - // 遍历结果,只收集数据不执行数据库操作 + // 遍历结果 for (UserResult userResult : result.getResults()) { for (QuestionResult questionResult : userResult.getQuestions_results()) { try { @@ -316,55 +330,60 @@ question.setTimestamp( LocalDateTime.parse(questionResult.getTimestamp(), formatter)); } + //更新 +// questionService.updateById(question); questionsToUpdate.add(question); - // 收集引用数据 - List<Reference> references = questionResult.getReferences().stream() - .map(ref -> { - Reference reference = new Reference(); - reference.setQuestion_id(question.getQuestion_id()); - reference.setTitle(ref.getTitle()); - reference.setUrl(ref.getUrl()); - reference.setDomain(ref.getDomain()); - reference.setCreate_time(LocalDateTime.now()); - return reference; - }) - .collect(Collectors.toList()); + // 收集引用数据,处理空集合情况 + List<Reference> references = + Optional.ofNullable(questionResult.getReferences()) + .orElse(Collections.emptyList()) + .stream() + .map(ref -> { + Reference reference = new Reference(); + reference.setQuestion_id(question.getQuestion_id()); + reference.setTitle(ref.getTitle()); + reference.setUrl(ref.getUrl()); + reference.setDomain(ref.getDomain()); + reference.setCreate_time(LocalDateTime.now()); + return reference; + }) + .collect(Collectors.toList()); - allReferences.addAll(references); - } else { - // log.warn("未找到匹配的问题,question: {}, keyword_id: {}", - // questionResult.getQuestion(), keyword.getKeyword_id()); + // 添加到总引用列表 + if (!references.isEmpty()) { + allReferences.addAll(references); + } } } catch (Exception e) { - // log.error("处理问题结果失败,question: {}, error: {}", - // questionResult.getQuestion(), e.getMessage(), e); + System.out.println("处理问题结果失败: " + e.getMessage()); } } } // 4. 批量更新问题 + System.out.println(questionsToUpdate); if (!questionsToUpdate.isEmpty()) { questionService.updateBatchById(questionsToUpdate); - // log.info("成功批量更新 {} 个问题", questionsToUpdate.size()); + System.out.println("成功批量更新 " + questionsToUpdate.size() + " 个问题"); } - // 5. 批量插入引用 + // 5. 批量插入引用,使用流式分批处理 if (!allReferences.isEmpty()) { - // 分批处理,每批1000条记录,避免内存溢出 int batchSize = 1000; - for (int i = 0; i < allReferences.size(); i += batchSize) { - List<Reference> batch = allReferences.subList( - i, Math.min(i + batchSize, allReferences.size())); - referenceService.saveBatch(batch); - } - // log.info("成功批量插入 {} 条引用数据", allReferences.size()); + IntStream.iterate(0, i -> i + batchSize) + .limit((allReferences.size() + batchSize - 1) / batchSize) + .forEach(i -> { + List<Reference> batch = allReferences.subList( + i, Math.min(i + batchSize, allReferences.size())); + referenceService.saveBatch(batch); + }); + System.out.println("成功批量插入 " + allReferences.size() + " 条引用数据"); } } catch (Exception e) { - // log.error("更新问题和引用数据失败,task_id: {}, error: {}", - // result.getTask_id(), e.getMessage(), e); + System.out.println("更新问题和引用数据失败: " + e.getMessage()); throw new RuntimeException("更新问题和引用数据失败", e); } }); @@ -372,15 +391,19 @@ @GetMapping("/tasks/all") @ApiOperation(value = "获取所有任务列表") - public Mono<ResponseResult<TaskListResponse>> getAllTasks() { + public Mono<TaskListResponse> getAllTasks() { return webClient.get() - .uri(baseUrl + "/tasks") + .uri(baseUrl + "/api/v1/tasks") .accept(MediaType.APPLICATION_JSON) .retrieve() - .bodyToMono(new ParameterizedTypeReference<ResponseResult<TaskListResponse>>() { + .bodyToMono(new ParameterizedTypeReference<TaskListResponse>() { }) .onErrorResume(e -> { - return Mono.just(ResponseResult.error("获取任务列表失败: " + e.getMessage())); + TaskListResponse response = new TaskListResponse(); + response.setDetail("获取任务列表失败: " + e.getMessage()); + return Mono.just(response); + + // return Mono.just(ResponseResult.error("获取任务列表失败: " + e.getMessage())); }); } -- Gitblit v1.7.1