mirror of
https://github.com/RYDE-WORK/Langchain-Chatchat.git
synced 2026-01-19 21:37:20 +08:00
- 知识库管理中的add_docs/delete_docs/update_docs均支持批量操作,并利用多线程提高效率 - API的重建知识库接口支持多线程 - add_docs可提供参数控制上传文件后是否继续进行向量化 - add_docs/update_docs支持传入自定义docs(以json形式)。后续考虑区分完整或补充式自定义docs - download_doc接口添加`preview`参数,支持下载或预览 - kb_service增加`save_vector_store`方法,便于保存向量库(仅FAISS,其它无操作) - 将document_loader & text_splitter逻辑从KnowledgeFile中抽离出来,为后续对内存文件进行向量化做准备 - KowledgeFile支持docs & splitted_docs的缓存,方便在中间过程做一些自定义 其它: - 将部分错误输出由print改为logger.error
64 lines
2.4 KiB
Python
64 lines
2.4 KiB
Python
import urllib
|
|
from server.utils import BaseResponse, ListResponse
|
|
from server.knowledge_base.utils import validate_kb_name
|
|
from server.knowledge_base.kb_service.base import KBServiceFactory
|
|
from server.db.repository.knowledge_base_repository import list_kbs_from_db
|
|
from configs.model_config import EMBEDDING_MODEL, logger
|
|
from fastapi import Body
|
|
|
|
|
|
async def list_kbs():
|
|
# Get List of Knowledge Base
|
|
return ListResponse(data=list_kbs_from_db())
|
|
|
|
|
|
async def create_kb(knowledge_base_name: str = Body(..., examples=["samples"]),
|
|
vector_store_type: str = Body("faiss"),
|
|
embed_model: str = Body(EMBEDDING_MODEL),
|
|
) -> BaseResponse:
|
|
# Create selected knowledge base
|
|
if not validate_kb_name(knowledge_base_name):
|
|
return BaseResponse(code=403, msg="Don't attack me")
|
|
if knowledge_base_name is None or knowledge_base_name.strip() == "":
|
|
return BaseResponse(code=404, msg="知识库名称不能为空,请重新填写知识库名称")
|
|
|
|
kb = KBServiceFactory.get_service_by_name(knowledge_base_name)
|
|
if kb is not None:
|
|
return BaseResponse(code=404, msg=f"已存在同名知识库 {knowledge_base_name}")
|
|
|
|
kb = KBServiceFactory.get_service(knowledge_base_name, vector_store_type, embed_model)
|
|
try:
|
|
kb.create_kb()
|
|
except Exception as e:
|
|
msg = f"创建知识库出错: {e}"
|
|
logger.error(msg)
|
|
return BaseResponse(code=500, msg=msg)
|
|
|
|
return BaseResponse(code=200, msg=f"已新增知识库 {knowledge_base_name}")
|
|
|
|
|
|
async def delete_kb(
|
|
knowledge_base_name: str = Body(..., examples=["samples"])
|
|
) -> BaseResponse:
|
|
# Delete selected knowledge base
|
|
if not validate_kb_name(knowledge_base_name):
|
|
return BaseResponse(code=403, msg="Don't attack me")
|
|
knowledge_base_name = urllib.parse.unquote(knowledge_base_name)
|
|
|
|
kb = KBServiceFactory.get_service_by_name(knowledge_base_name)
|
|
|
|
if kb is None:
|
|
return BaseResponse(code=404, msg=f"未找到知识库 {knowledge_base_name}")
|
|
|
|
try:
|
|
status = kb.clear_vs()
|
|
status = kb.drop_kb()
|
|
if status:
|
|
return BaseResponse(code=200, msg=f"成功删除知识库 {knowledge_base_name}")
|
|
except Exception as e:
|
|
msg = f"删除知识库时出现意外: {e}"
|
|
logger.error(msg)
|
|
return BaseResponse(code=500, msg=msg)
|
|
|
|
return BaseResponse(code=500, msg=f"删除知识库失败 {knowledge_base_name}")
|