增加构建了知识库,同时构建相对应的索引

This commit is contained in:
moon 2025-09-23 17:02:50 +08:00
parent d9ae2a07c1
commit fbad0df5de
11 changed files with 98 additions and 42 deletions

View File

@ -507,7 +507,7 @@
import { useRoute, useRouter } from 'vue-router' import { useRoute, useRouter } from 'vue-router'
import { ref, reactive, computed, onMounted, onUnmounted } from 'vue' import { ref, reactive, computed, onMounted, onUnmounted } from 'vue'
import VueOfficePdf from '@vue-office/pdf' import VueOfficePdf from '@vue-office/pdf'
import { getDatasetDocPage, uploadDocument, deleteDocument, downloadDocument, previewDocumentUrl, renameDocument, createFolder, CreateFolderReq} from '@/api/dataset' import { getDatasetDocPage, uploadDocument, deleteDocument, downloadDocument, previewDocumentUrl, renameDocument, createFolder, CreateFolderReq,deleteFileIndex} from '@/api/dataset'
import {getSegmentList} from "@/api/Segment" import {getSegmentList} from "@/api/Segment"
import DocUpload from './DocUpload.vue' import DocUpload from './DocUpload.vue'
//VueOfficeDocx //VueOfficeDocx
@ -608,7 +608,7 @@ y: 0
// //
const currentParentId = ref<number | undefined>(undefined) const currentParentId = ref<number | undefined>(undefined)
const breadcrumbPath = ref<Array<{id: number, name: string}>>([]) const breadcrumbPath = ref<Array<{id: number, name: string}>>([])
const isScroll = ref(true) const isScroll = ref(false)
// //
interface BreadcrumbItem { interface BreadcrumbItem {
@ -1226,6 +1226,7 @@ try {
// //
await deleteDocument(parseInt(row.id)) await deleteDocument(parseInt(row.id))
// //
ElNotification({ ElNotification({
title: t('vabI18n.knowledge.document.messages.deleteSuccessOk'), title: t('vabI18n.knowledge.document.messages.deleteSuccessOk'),
@ -1407,6 +1408,7 @@ const handleScroll = async (event: Event) => {
isScroll.value = false isScroll.value = false
return return
} }
isScroll.value = true
// //
if (container.scrollHeight - container.scrollTop - container.clientHeight < 10) { if (container.scrollHeight - container.scrollTop - container.clientHeight < 10) {
// //

View File

@ -7,6 +7,7 @@ import com.bjtds.brichat.entity.dify.DatasetDto;
import com.bjtds.brichat.entity.dto.UserBindDatasetDto; import com.bjtds.brichat.entity.dto.UserBindDatasetDto;
import com.bjtds.brichat.entity.dto.UserLinkDatasetDto; import com.bjtds.brichat.entity.dto.UserLinkDatasetDto;
import com.bjtds.brichat.service.DatasetManagerService; import com.bjtds.brichat.service.DatasetManagerService;
import com.bjtds.brichat.service.EsTDatasetFilesService;
import com.bjtds.brichat.service.dify.DifyDatasetApiService; import com.bjtds.brichat.service.dify.DifyDatasetApiService;
import com.bjtds.brichat.util.ResultUtils; import com.bjtds.brichat.util.ResultUtils;
import com.bjtds.common.utils.Pagination; import com.bjtds.common.utils.Pagination;
@ -18,6 +19,7 @@ import org.springframework.http.ResponseEntity;
import org.springframework.web.bind.annotation.*; import org.springframework.web.bind.annotation.*;
import javax.annotation.Resource; import javax.annotation.Resource;
import java.io.IOException;
@Api(tags = "知识库管理") @Api(tags = "知识库管理")
@ -27,6 +29,9 @@ import javax.annotation.Resource;
@RequestMapping("/datasetManage") @RequestMapping("/datasetManage")
public class DatasetManageController { public class DatasetManageController {
@Resource
private EsTDatasetFilesService esTDatasetFilesService;
@Resource @Resource
private DatasetManagerService datasetManagerService; private DatasetManagerService datasetManagerService;
@ -70,6 +75,16 @@ public class DatasetManageController {
@PostMapping("/create") @PostMapping("/create")
public ResultUtils create(@RequestBody DatasetCreateRequest datasetCreateRequest) { public ResultUtils create(@RequestBody DatasetCreateRequest datasetCreateRequest) {
ResponseEntity<DatasetDto>res = difyDatasetApiService.createDataset(datasetCreateRequest.getName(), datasetCreateRequest.getDescription()); ResponseEntity<DatasetDto>res = difyDatasetApiService.createDataset(datasetCreateRequest.getName(), datasetCreateRequest.getDescription());
DatasetDto datasetDto = res.getBody();
String datasetId = datasetDto.getId();
//构建es索引
try {
esTDatasetFilesService.createIndex(datasetId);
log.info("创建es索引成功,知识库id:{}",datasetId);
} catch (IOException e) {
log.error("创建es索引失败,知识库id:{}",datasetId,e);
}
return ResultUtils.success(res.getBody()); return ResultUtils.success(res.getBody());
} }

View File

@ -99,7 +99,7 @@ public class KnowledgeBaseController {
// public ResultUtils createIndex(@RequestParam("documentId") String documentId) throws Exception { // public ResultUtils createIndex(@RequestParam("documentId") String documentId) throws Exception {
// //
// try{ // try{
// esTDatasetFilesImporter.importDocumentId(documentId); // esTDatasetFilesImporter.importDocumentId(Integer.valueOf(documentId));
// return ResultUtils.success("索引创建成功"); // return ResultUtils.success("索引创建成功");
// } catch (IOException e) { // } catch (IOException e) {
// return ResultUtils.error("索引创建失败: " + e.getMessage()); // return ResultUtils.error("索引创建失败: " + e.getMessage());

View File

@ -1,9 +1,13 @@
package com.bjtds.brichat.entity.dto; package com.bjtds.brichat.entity.dto;
import com.alibaba.fastjson.annotation.JSONField; import com.alibaba.fastjson.annotation.JSONField;
import lombok.AllArgsConstructor;
import lombok.Data; import lombok.Data;
import lombok.NoArgsConstructor;
@Data @Data
@NoArgsConstructor
@AllArgsConstructor
public class RecordDto { public class RecordDto {
/**分段信息*/ /**分段信息*/
@JSONField(name = "retrieval") @JSONField(name = "retrieval")

View File

@ -186,6 +186,13 @@ public interface TDatasetFilesMapper {
TDatasetFiles selectByDatasetIdAndDocId(@Param("difyDatasetId") String difyDatasetId, @Param("difyDocId") String difyDocId); TDatasetFiles selectByDatasetIdAndDocId(@Param("difyDatasetId") String difyDatasetId, @Param("difyDocId") String difyDocId);
/**
* 根据文档ID查询文件
*
* @param difyDocId 文档ID
* @return 文件信息
*/
TDatasetFiles selectByDocId( String difyDocId);
} }

View File

@ -171,6 +171,10 @@ public interface DatasetFilesService {
*/ */
void updateByDatasetIdAndDocId(String difyDatasetId, String difyDocId); void updateByDatasetIdAndDocId(String difyDatasetId, String difyDocId);
/**
* 根据文档ID查询文件
*/
TDatasetFiles getFileByDocId(String difyDocId);

View File

@ -455,5 +455,10 @@ public class DatasetFilesServiceImpl implements DatasetFilesService {
} }
} }
@Override
public TDatasetFiles getFileByDocId(String difyDocId) {
return datasetFilesMapper.selectByDocId(difyDocId);
}
} }

View File

@ -59,6 +59,7 @@ public class EsTDatasetFilesServiceImpl implements EsTDatasetFilesService {
} }
} }
// 创建索引 // 创建索引
@Override
public void createIndex(String DatasetId) throws IOException { public void createIndex(String DatasetId) throws IOException {
boolean exists = client.indices().exists(e -> e.index(DatasetId)).value(); boolean exists = client.indices().exists(e -> e.index(DatasetId)).value();
if (!exists) { if (!exists) {

View File

@ -19,6 +19,7 @@ import com.fasterxml.jackson.databind.JsonNode;
import com.fasterxml.jackson.databind.ObjectMapper; import com.fasterxml.jackson.databind.ObjectMapper;
import com.google.common.collect.Lists; import com.google.common.collect.Lists;
import lombok.extern.slf4j.Slf4j; import lombok.extern.slf4j.Slf4j;
import org.checkerframework.checker.units.qual.C;
import org.springframework.beans.factory.annotation.Autowired; import org.springframework.beans.factory.annotation.Autowired;
import org.springframework.beans.factory.annotation.Value; import org.springframework.beans.factory.annotation.Value;
import org.springframework.stereotype.Service; import org.springframework.stereotype.Service;
@ -67,8 +68,8 @@ public class KnowledgeBaseServiceImpl implements KnowledgeBaseService {
@Override @Override
public List<RecordDto> retrieval(KnowledgeBaseDto knowledgeBaseDto) throws Exception { public List<RecordDto> retrieval(KnowledgeBaseDto knowledgeBaseDto) throws Exception {
String datasetPath = difyUrl + Constants.DATABASE_API; String datasetPath = difyUrl + Constants.DATABASE_API;
List<RecordDto> recordDtos = Lists.newArrayList(); List<RecordDto> recordDtos = new ArrayList<>();
List<Object> results = Lists.newArrayList(); List<RecordDto> results = Lists.newArrayList();
List<String> datasetIds =Lists.newArrayList(); List<String> datasetIds =Lists.newArrayList();
if (knowledgeBaseDto.getSelectedKnowledgeBaseIds() != null && !knowledgeBaseDto.getSelectedKnowledgeBaseIds().isEmpty()) { if (knowledgeBaseDto.getSelectedKnowledgeBaseIds() != null && !knowledgeBaseDto.getSelectedKnowledgeBaseIds().isEmpty()) {
@ -84,7 +85,16 @@ public class KnowledgeBaseServiceImpl implements KnowledgeBaseService {
if (knowledgeBaseDto.getSearchMethod().equals("keyword_search")) { if (knowledgeBaseDto.getSearchMethod().equals("keyword_search")) {
List<RecordDto> datasetFiles=esTDatasetFilesService.search(knowledgeBaseDto.getQuery(),datasetIds); List<RecordDto> datasetFiles=esTDatasetFilesService.search(knowledgeBaseDto.getQuery(),datasetIds);
recordDtos.addAll(datasetFiles); recordDtos.addAll(datasetFiles);
return recordDtos; recordDtos.sort((dto1, dto2) -> {
try {
double score1 = Double.parseDouble(dto1.getScore());
double score2 = Double.parseDouble(dto2.getScore());
return Double.compare(score2, score1);
} catch (NumberFormatException e) {
return 0;
}
});
return recordDtos;
} }
// 使用 CompletableFuture 并行查询多个数据集 // 使用 CompletableFuture 并行查询多个数据集
@ -136,7 +146,7 @@ public class KnowledgeBaseServiceImpl implements KnowledgeBaseService {
} }
}); });
results.addAll(recordDtos); results.addAll(recordDtos);
return recordDtos; return results;
} }
@Override @Override

View File

@ -3,13 +3,12 @@ package com.bjtds.brichat.util;
import com.bjtds.brichat.entity.dataset.TDatasetFiles; import com.bjtds.brichat.entity.dataset.TDatasetFiles;
import com.bjtds.brichat.service.DatasetFilesService; import com.bjtds.brichat.service.DatasetFilesService;
import com.bjtds.brichat.service.EsTDatasetFilesService; import com.bjtds.brichat.service.EsTDatasetFilesService;
import io.swagger.models.auth.In;
import lombok.extern.slf4j.Slf4j; import lombok.extern.slf4j.Slf4j;
import org.slf4j.Logger; import org.slf4j.Logger;
import org.slf4j.LoggerFactory; import org.slf4j.LoggerFactory;
import org.springframework.beans.factory.annotation.Autowired; import org.springframework.beans.factory.annotation.Autowired;
import org.springframework.beans.factory.annotation.Qualifier;
import org.springframework.data.redis.core.RedisTemplate;
import org.springframework.data.redis.core.StringRedisTemplate; import org.springframework.data.redis.core.StringRedisTemplate;
import org.springframework.scheduling.annotation.Async; import org.springframework.scheduling.annotation.Async;
import org.springframework.stereotype.Service; import org.springframework.stereotype.Service;
@ -17,6 +16,7 @@ import org.springframework.stereotype.Service;
import java.io.File; import java.io.File;
import java.io.IOException; import java.io.IOException;
import java.util.List; import java.util.List;
@Slf4j @Slf4j
@Service @Service
public class EsTDatasetFilesImporter { public class EsTDatasetFilesImporter {
@ -25,7 +25,6 @@ public class EsTDatasetFilesImporter {
@Autowired @Autowired
private DatasetFilesService datasetFilesService; private DatasetFilesService datasetFilesService;
// private static final Logger log = LoggerFactory.getLogger(EsTDatasetFilesImporter.class);
@Autowired @Autowired
private StringRedisTemplate redisTemplate; private StringRedisTemplate redisTemplate;
@ -63,16 +62,16 @@ public class EsTDatasetFilesImporter {
if (document == null) continue; if (document == null) continue;
String filePath = document.getDifyStoragePath(); String filePath = document.getDifyStoragePath();
if (filePath == null) { if (filePath == null) {
log.info("documentId=" + document.getId() + " 不存在difyStoragePath跳过"); log.warn("documentId=" + document.getId() + " 不存在difyStoragePath跳过");
continue; continue;
} }
File file = new File(filePath); File file = new File(filePath);
if (!file.exists()) { if (!file.exists()) {
log.info(file.getAbsolutePath() + " 不存在,跳过"); log.warn(file.getAbsolutePath() + " 不存在,跳过");
continue; continue;
} }
if(Boolean.TRUE.equals(document.getIsEs())){ if(Boolean.TRUE.equals(document.getIsEs())){
log.info("documentId=" + document.getId() + " 是ES索引文件跳过"); log.warn("documentId=" + document.getId() + " 是ES索引文件跳过");
continue; continue;
} }
@ -83,9 +82,9 @@ public class EsTDatasetFilesImporter {
redisTemplate.opsForValue().set("import:task:" + taskId + ":finished", String.valueOf(finished)); redisTemplate.opsForValue().set("import:task:" + taskId + ":finished", String.valueOf(finished));
document.setIsEs(true); document.setIsEs(true);
datasetFilesService.updateFile(document); datasetFilesService.updateFile(document);
log.info("documentId=" + document.getId() + " 索引构建成功"); log.debug("documentId=" + document.getId() + " 索引构建成功");
} catch (Exception e) { } catch (Exception e) {
log.info("documentId=" + document.getId() + " 索引构建失败: " + e.getMessage()); log.debug("documentId=" + document.getId() + " 索引构建失败: " + e.getMessage());
} }
} }
redisTemplate.opsForValue().set("import:task:" + taskId + ":status", "done"); redisTemplate.opsForValue().set("import:task:" + taskId + ":status", "done");

View File

@ -281,4 +281,13 @@
AND dify_doc_id = #{difyDocId} AND dify_doc_id = #{difyDocId}
AND is_deleted = false AND is_deleted = false
</select> </select>
<!-- 根据文档ID查询文件 -->
<select id="selectByDocId" resultMap="TDatasetFilesResultMap">
SELECT <include refid="Base_Column_List"/>
FROM t_dataset_files
WHERE dify_doc_id = #{difyDocId}
AND is_deleted = false
</select>
</mapper> </mapper>