2023-10-09 11:03:41 +00:00
|
|
|
|
# coding=utf-8
|
|
|
|
|
|
"""
|
|
|
|
|
|
@project: maxkb
|
|
|
|
|
|
@Author:虎
|
|
|
|
|
|
@file: document.py
|
|
|
|
|
|
@date:2023/9/22 11:32
|
|
|
|
|
|
@desc:
|
|
|
|
|
|
"""
|
|
|
|
|
|
|
|
|
|
|
|
from drf_yasg.utils import swagger_auto_schema
|
|
|
|
|
|
from rest_framework.decorators import action
|
2023-10-24 12:24:32 +00:00
|
|
|
|
from rest_framework.parsers import MultiPartParser
|
2023-10-09 11:03:41 +00:00
|
|
|
|
from rest_framework.views import APIView
|
|
|
|
|
|
from rest_framework.views import Request
|
|
|
|
|
|
|
|
|
|
|
|
from common.auth import TokenAuth, has_permissions
|
2024-04-26 10:35:46 +00:00
|
|
|
|
from common.constants.permission_constants import Permission, Group, Operate, CompareConstants
|
2023-10-09 11:03:41 +00:00
|
|
|
|
from common.response import result
|
2023-10-24 12:24:32 +00:00
|
|
|
|
from common.util.common import query_params_to_single_dict
|
2024-01-17 08:08:51 +00:00
|
|
|
|
from dataset.serializers.common_serializers import BatchSerializer
|
|
|
|
|
|
from dataset.serializers.document_serializers import DocumentSerializers, DocumentWebInstanceSerializer
|
2024-04-28 06:35:51 +00:00
|
|
|
|
from dataset.swagger_api.document_api import DocumentApi
|
2024-01-17 08:08:51 +00:00
|
|
|
|
|
|
|
|
|
|
|
2024-05-23 10:57:49 +00:00
|
|
|
|
class Template(APIView):
|
|
|
|
|
|
authentication_classes = [TokenAuth]
|
|
|
|
|
|
|
|
|
|
|
|
@action(methods=['GET'], detail=False)
|
|
|
|
|
|
@swagger_auto_schema(operation_summary="获取QA模版",
|
|
|
|
|
|
operation_id="获取QA模版",
|
|
|
|
|
|
manual_parameters=DocumentSerializers.Export.get_request_params_api(),
|
|
|
|
|
|
tags=["知识库/文档"])
|
|
|
|
|
|
def get(self, request: Request):
|
|
|
|
|
|
return DocumentSerializers.Export(data={'type': request.query_params.get('type')}).export(with_valid=True)
|
|
|
|
|
|
|
2024-08-30 10:45:25 +00:00
|
|
|
|
|
2024-08-22 08:52:32 +00:00
|
|
|
|
class TableTemplate(APIView):
|
|
|
|
|
|
authentication_classes = [TokenAuth]
|
|
|
|
|
|
|
|
|
|
|
|
@action(methods=['GET'], detail=False)
|
|
|
|
|
|
@swagger_auto_schema(operation_summary="获取表格模版",
|
|
|
|
|
|
operation_id="获取表格模版",
|
|
|
|
|
|
manual_parameters=DocumentSerializers.Export.get_request_params_api(),
|
|
|
|
|
|
tags=["知识库/文档"])
|
|
|
|
|
|
def get(self, request: Request):
|
|
|
|
|
|
return DocumentSerializers.Export(data={'type': request.query_params.get('type')}).table_export(with_valid=True)
|
|
|
|
|
|
|
2024-05-23 10:57:49 +00:00
|
|
|
|
|
2024-01-17 08:08:51 +00:00
|
|
|
|
class WebDocument(APIView):
|
|
|
|
|
|
authentication_classes = [TokenAuth]
|
|
|
|
|
|
|
|
|
|
|
|
@action(methods=['POST'], detail=False)
|
|
|
|
|
|
@swagger_auto_schema(operation_summary="创建Web站点文档",
|
|
|
|
|
|
operation_id="创建Web站点文档",
|
|
|
|
|
|
request_body=DocumentWebInstanceSerializer.get_request_body_api(),
|
|
|
|
|
|
manual_parameters=DocumentSerializers.Create.get_request_params_api(),
|
|
|
|
|
|
responses=result.get_api_response(DocumentSerializers.Operate.get_response_body_api()),
|
|
|
|
|
|
tags=["知识库/文档"])
|
|
|
|
|
|
@has_permissions(
|
|
|
|
|
|
lambda r, k: Permission(group=Group.DATASET, operate=Operate.MANAGE,
|
|
|
|
|
|
dynamic_tag=k.get('dataset_id')))
|
|
|
|
|
|
def post(self, request: Request, dataset_id: str):
|
|
|
|
|
|
return result.success(
|
|
|
|
|
|
DocumentSerializers.Create(data={'dataset_id': dataset_id}).save_web(request.data, with_valid=True))
|
2023-10-09 11:03:41 +00:00
|
|
|
|
|
|
|
|
|
|
|
2024-05-23 10:57:49 +00:00
|
|
|
|
class QaDocument(APIView):
|
|
|
|
|
|
authentication_classes = [TokenAuth]
|
|
|
|
|
|
parser_classes = [MultiPartParser]
|
|
|
|
|
|
|
|
|
|
|
|
@action(methods=['POST'], detail=False)
|
|
|
|
|
|
@swagger_auto_schema(operation_summary="导入QA并创建文档",
|
|
|
|
|
|
operation_id="导入QA并创建文档",
|
|
|
|
|
|
manual_parameters=DocumentWebInstanceSerializer.get_request_params_api(),
|
|
|
|
|
|
responses=result.get_api_response(DocumentSerializers.Create.get_response_body_api()),
|
|
|
|
|
|
tags=["知识库/文档"])
|
|
|
|
|
|
@has_permissions(
|
|
|
|
|
|
lambda r, k: Permission(group=Group.DATASET, operate=Operate.MANAGE,
|
|
|
|
|
|
dynamic_tag=k.get('dataset_id')))
|
|
|
|
|
|
def post(self, request: Request, dataset_id: str):
|
|
|
|
|
|
return result.success(
|
|
|
|
|
|
DocumentSerializers.Create(data={'dataset_id': dataset_id}).save_qa(
|
|
|
|
|
|
{'file_list': request.FILES.getlist('file')},
|
|
|
|
|
|
with_valid=True))
|
|
|
|
|
|
|
2024-08-30 10:45:25 +00:00
|
|
|
|
|
2024-08-22 08:52:32 +00:00
|
|
|
|
class TableDocument(APIView):
|
|
|
|
|
|
authentication_classes = [TokenAuth]
|
|
|
|
|
|
parser_classes = [MultiPartParser]
|
|
|
|
|
|
|
|
|
|
|
|
@action(methods=['POST'], detail=False)
|
|
|
|
|
|
@swagger_auto_schema(operation_summary="导入表格并创建文档",
|
|
|
|
|
|
operation_id="导入表格并创建文档",
|
|
|
|
|
|
manual_parameters=DocumentWebInstanceSerializer.get_request_params_api(),
|
|
|
|
|
|
responses=result.get_api_response(DocumentSerializers.Create.get_response_body_api()),
|
|
|
|
|
|
tags=["知识库/文档"])
|
|
|
|
|
|
@has_permissions(
|
|
|
|
|
|
lambda r, k: Permission(group=Group.DATASET, operate=Operate.MANAGE,
|
|
|
|
|
|
dynamic_tag=k.get('dataset_id')))
|
|
|
|
|
|
def post(self, request: Request, dataset_id: str):
|
|
|
|
|
|
return result.success(
|
|
|
|
|
|
DocumentSerializers.Create(data={'dataset_id': dataset_id}).save_table(
|
|
|
|
|
|
{'file_list': request.FILES.getlist('file')},
|
|
|
|
|
|
with_valid=True))
|
2024-05-23 10:57:49 +00:00
|
|
|
|
|
2024-08-30 10:45:25 +00:00
|
|
|
|
|
2023-10-09 11:03:41 +00:00
|
|
|
|
class Document(APIView):
|
|
|
|
|
|
authentication_classes = [TokenAuth]
|
|
|
|
|
|
|
|
|
|
|
|
@action(methods=['POST'], detail=False)
|
|
|
|
|
|
@swagger_auto_schema(operation_summary="创建文档",
|
|
|
|
|
|
operation_id="创建文档",
|
2023-10-24 12:24:32 +00:00
|
|
|
|
request_body=DocumentSerializers.Create.get_request_body_api(),
|
|
|
|
|
|
manual_parameters=DocumentSerializers.Create.get_request_params_api(),
|
2023-11-16 05:16:27 +00:00
|
|
|
|
responses=result.get_api_response(DocumentSerializers.Operate.get_response_body_api()),
|
2023-12-18 03:32:29 +00:00
|
|
|
|
tags=["知识库/文档"])
|
2023-10-24 12:24:32 +00:00
|
|
|
|
@has_permissions(
|
|
|
|
|
|
lambda r, k: Permission(group=Group.DATASET, operate=Operate.MANAGE,
|
|
|
|
|
|
dynamic_tag=k.get('dataset_id')))
|
2023-10-09 11:03:41 +00:00
|
|
|
|
def post(self, request: Request, dataset_id: str):
|
2023-10-24 12:24:32 +00:00
|
|
|
|
return result.success(
|
|
|
|
|
|
DocumentSerializers.Create(data={'dataset_id': dataset_id}).save(request.data, with_valid=True))
|
2023-10-09 11:03:41 +00:00
|
|
|
|
|
|
|
|
|
|
@action(methods=['GET'], detail=False)
|
2023-10-24 12:24:32 +00:00
|
|
|
|
@swagger_auto_schema(operation_summary="文档列表",
|
|
|
|
|
|
operation_id="文档列表",
|
|
|
|
|
|
manual_parameters=DocumentSerializers.Query.get_request_params_api(),
|
2023-11-16 05:16:27 +00:00
|
|
|
|
responses=result.get_api_response(DocumentSerializers.Query.get_response_body_api()),
|
2023-12-18 03:32:29 +00:00
|
|
|
|
tags=["知识库/文档"])
|
2023-10-09 11:03:41 +00:00
|
|
|
|
@has_permissions(
|
2023-10-24 12:24:32 +00:00
|
|
|
|
lambda r, k: Permission(group=Group.DATASET, operate=Operate.USE,
|
|
|
|
|
|
dynamic_tag=k.get('dataset_id')))
|
2023-10-09 11:03:41 +00:00
|
|
|
|
def get(self, request: Request, dataset_id: str):
|
2023-10-24 12:24:32 +00:00
|
|
|
|
d = DocumentSerializers.Query(
|
|
|
|
|
|
data={**query_params_to_single_dict(request.query_params), 'dataset_id': dataset_id})
|
|
|
|
|
|
d.is_valid(raise_exception=True)
|
|
|
|
|
|
return result.success(d.list())
|
|
|
|
|
|
|
2024-04-28 06:35:51 +00:00
|
|
|
|
class BatchEditHitHandling(APIView):
|
|
|
|
|
|
authentication_classes = [TokenAuth]
|
|
|
|
|
|
|
|
|
|
|
|
@action(methods=['POST'], detail=False)
|
|
|
|
|
|
@swagger_auto_schema(operation_summary="批量修改文档命中处理方式",
|
|
|
|
|
|
operation_id="批量修改文档命中处理方式",
|
|
|
|
|
|
request_body=
|
|
|
|
|
|
DocumentApi.BatchEditHitHandlingApi.get_request_body_api(),
|
|
|
|
|
|
manual_parameters=DocumentSerializers.Create.get_request_params_api(),
|
|
|
|
|
|
responses=result.get_default_response(),
|
|
|
|
|
|
tags=["知识库/文档"])
|
|
|
|
|
|
@has_permissions(
|
|
|
|
|
|
lambda r, k: Permission(group=Group.DATASET, operate=Operate.MANAGE,
|
|
|
|
|
|
dynamic_tag=k.get('dataset_id')))
|
|
|
|
|
|
def put(self, request: Request, dataset_id: str):
|
|
|
|
|
|
return result.success(
|
|
|
|
|
|
DocumentSerializers.Batch(data={'dataset_id': dataset_id}).batch_edit_hit_handling(request.data))
|
|
|
|
|
|
|
2023-11-17 09:43:35 +00:00
|
|
|
|
class Batch(APIView):
|
|
|
|
|
|
authentication_classes = [TokenAuth]
|
|
|
|
|
|
|
|
|
|
|
|
@action(methods=['POST'], detail=False)
|
|
|
|
|
|
@swagger_auto_schema(operation_summary="批量创建文档",
|
|
|
|
|
|
operation_id="批量创建文档",
|
|
|
|
|
|
request_body=
|
|
|
|
|
|
DocumentSerializers.Batch.get_request_body_api(),
|
|
|
|
|
|
manual_parameters=DocumentSerializers.Create.get_request_params_api(),
|
|
|
|
|
|
responses=result.get_api_array_response(
|
|
|
|
|
|
DocumentSerializers.Operate.get_response_body_api()),
|
2023-12-18 03:32:29 +00:00
|
|
|
|
tags=["知识库/文档"])
|
2023-11-17 09:43:35 +00:00
|
|
|
|
@has_permissions(
|
|
|
|
|
|
lambda r, k: Permission(group=Group.DATASET, operate=Operate.MANAGE,
|
|
|
|
|
|
dynamic_tag=k.get('dataset_id')))
|
|
|
|
|
|
def post(self, request: Request, dataset_id: str):
|
|
|
|
|
|
return result.success(DocumentSerializers.Batch(data={'dataset_id': dataset_id}).batch_save(request.data))
|
|
|
|
|
|
|
2024-01-17 08:08:51 +00:00
|
|
|
|
@action(methods=['POST'], detail=False)
|
|
|
|
|
|
@swagger_auto_schema(operation_summary="批量同步文档",
|
|
|
|
|
|
operation_id="批量同步文档",
|
|
|
|
|
|
request_body=
|
|
|
|
|
|
BatchSerializer.get_request_body_api(),
|
|
|
|
|
|
manual_parameters=DocumentSerializers.Create.get_request_params_api(),
|
|
|
|
|
|
responses=result.get_default_response(),
|
|
|
|
|
|
tags=["知识库/文档"])
|
|
|
|
|
|
@has_permissions(
|
|
|
|
|
|
lambda r, k: Permission(group=Group.DATASET, operate=Operate.MANAGE,
|
|
|
|
|
|
dynamic_tag=k.get('dataset_id')))
|
|
|
|
|
|
def put(self, request: Request, dataset_id: str):
|
|
|
|
|
|
return result.success(DocumentSerializers.Batch(data={'dataset_id': dataset_id}).batch_sync(request.data))
|
|
|
|
|
|
|
|
|
|
|
|
@action(methods=['DELETE'], detail=False)
|
|
|
|
|
|
@swagger_auto_schema(operation_summary="批量删除文档",
|
|
|
|
|
|
operation_id="批量删除文档",
|
|
|
|
|
|
request_body=
|
|
|
|
|
|
BatchSerializer.get_request_body_api(),
|
|
|
|
|
|
manual_parameters=DocumentSerializers.Create.get_request_params_api(),
|
|
|
|
|
|
responses=result.get_default_response(),
|
|
|
|
|
|
tags=["知识库/文档"])
|
|
|
|
|
|
@has_permissions(
|
|
|
|
|
|
lambda r, k: Permission(group=Group.DATASET, operate=Operate.MANAGE,
|
|
|
|
|
|
dynamic_tag=k.get('dataset_id')))
|
|
|
|
|
|
def delete(self, request: Request, dataset_id: str):
|
|
|
|
|
|
return result.success(DocumentSerializers.Batch(data={'dataset_id': dataset_id}).batch_delete(request.data))
|
|
|
|
|
|
|
2024-05-24 03:27:59 +00:00
|
|
|
|
class SyncWeb(APIView):
|
|
|
|
|
|
authentication_classes = [TokenAuth]
|
|
|
|
|
|
|
|
|
|
|
|
@action(methods=['PUT'], detail=False)
|
|
|
|
|
|
@swagger_auto_schema(operation_summary="同步web站点类型",
|
|
|
|
|
|
operation_id="同步web站点类型",
|
|
|
|
|
|
manual_parameters=DocumentSerializers.Operate.get_request_params_api(),
|
|
|
|
|
|
responses=result.get_default_response(),
|
|
|
|
|
|
tags=["知识库/文档"]
|
|
|
|
|
|
)
|
|
|
|
|
|
@has_permissions(
|
|
|
|
|
|
lambda r, k: Permission(group=Group.DATASET, operate=Operate.MANAGE,
|
|
|
|
|
|
dynamic_tag=k.get('dataset_id')))
|
|
|
|
|
|
def put(self, request: Request, dataset_id: str, document_id: str):
|
|
|
|
|
|
return result.success(
|
|
|
|
|
|
DocumentSerializers.Sync(data={'document_id': document_id, 'dataset_id': dataset_id}).sync(
|
|
|
|
|
|
))
|
|
|
|
|
|
|
2023-12-13 10:03:57 +00:00
|
|
|
|
class Refresh(APIView):
|
|
|
|
|
|
authentication_classes = [TokenAuth]
|
|
|
|
|
|
|
|
|
|
|
|
@action(methods=['PUT'], detail=False)
|
|
|
|
|
|
@swagger_auto_schema(operation_summary="刷新文档向量库",
|
|
|
|
|
|
operation_id="刷新文档向量库",
|
|
|
|
|
|
manual_parameters=DocumentSerializers.Operate.get_request_params_api(),
|
|
|
|
|
|
responses=result.get_default_response(),
|
2023-12-18 03:32:29 +00:00
|
|
|
|
tags=["知识库/文档"]
|
2023-12-13 10:03:57 +00:00
|
|
|
|
)
|
|
|
|
|
|
@has_permissions(
|
|
|
|
|
|
lambda r, k: Permission(group=Group.DATASET, operate=Operate.MANAGE,
|
|
|
|
|
|
dynamic_tag=k.get('dataset_id')))
|
|
|
|
|
|
def put(self, request: Request, dataset_id: str, document_id: str):
|
|
|
|
|
|
return result.success(
|
|
|
|
|
|
DocumentSerializers.Operate(data={'document_id': document_id, 'dataset_id': dataset_id}).refresh(
|
|
|
|
|
|
))
|
|
|
|
|
|
|
2024-08-30 10:45:25 +00:00
|
|
|
|
class BatchRefresh(APIView):
|
|
|
|
|
|
authentication_classes = [TokenAuth]
|
|
|
|
|
|
|
2024-09-14 10:36:37 +00:00
|
|
|
|
@action(methods=['PUT'], detail=False)
|
2024-08-30 10:45:25 +00:00
|
|
|
|
@swagger_auto_schema(operation_summary="批量刷新文档向量库",
|
|
|
|
|
|
operation_id="批量刷新文档向量库",
|
|
|
|
|
|
request_body=
|
|
|
|
|
|
DocumentApi.BatchEditHitHandlingApi.get_request_body_api(),
|
|
|
|
|
|
manual_parameters=DocumentSerializers.Create.get_request_params_api(),
|
|
|
|
|
|
responses=result.get_default_response(),
|
|
|
|
|
|
tags=["知识库/文档"])
|
|
|
|
|
|
@has_permissions(
|
|
|
|
|
|
lambda r, k: Permission(group=Group.DATASET, operate=Operate.MANAGE,
|
|
|
|
|
|
dynamic_tag=k.get('dataset_id')))
|
|
|
|
|
|
def put(self, request: Request, dataset_id: str):
|
|
|
|
|
|
return result.success(
|
|
|
|
|
|
DocumentSerializers.Batch(data={'dataset_id': dataset_id}).batch_refresh(request.data))
|
|
|
|
|
|
|
2024-04-26 10:35:46 +00:00
|
|
|
|
class Migrate(APIView):
|
|
|
|
|
|
authentication_classes = [TokenAuth]
|
|
|
|
|
|
|
|
|
|
|
|
@action(methods=['PUT'], detail=False)
|
|
|
|
|
|
@swagger_auto_schema(operation_summary="批量迁移文档",
|
|
|
|
|
|
operation_id="批量迁移文档",
|
|
|
|
|
|
manual_parameters=DocumentSerializers.Migrate.get_request_params_api(),
|
|
|
|
|
|
request_body=DocumentSerializers.Migrate.get_request_body_api(),
|
|
|
|
|
|
responses=result.get_api_response(DocumentSerializers.Operate.get_response_body_api()),
|
|
|
|
|
|
tags=["知识库/文档"]
|
|
|
|
|
|
)
|
|
|
|
|
|
@has_permissions(
|
|
|
|
|
|
lambda r, k: Permission(group=Group.DATASET, operate=Operate.MANAGE,
|
|
|
|
|
|
dynamic_tag=k.get('dataset_id')),
|
|
|
|
|
|
lambda r, k: Permission(group=Group.DATASET, operate=Operate.MANAGE,
|
|
|
|
|
|
dynamic_tag=k.get('target_dataset_id')),
|
|
|
|
|
|
compare=CompareConstants.AND
|
|
|
|
|
|
)
|
|
|
|
|
|
def put(self, request: Request, dataset_id: str, target_dataset_id: str):
|
|
|
|
|
|
return result.success(
|
|
|
|
|
|
DocumentSerializers.Migrate(
|
|
|
|
|
|
data={'dataset_id': dataset_id, 'target_dataset_id': target_dataset_id,
|
|
|
|
|
|
'document_id_list': request.data}).migrate(
|
|
|
|
|
|
|
|
|
|
|
|
))
|
|
|
|
|
|
|
2024-05-27 07:48:24 +00:00
|
|
|
|
class Export(APIView):
|
|
|
|
|
|
authentication_classes = [TokenAuth]
|
|
|
|
|
|
|
|
|
|
|
|
@action(methods=['GET'], detail=False)
|
|
|
|
|
|
@swagger_auto_schema(operation_summary="导出文档",
|
|
|
|
|
|
operation_id="导出文档",
|
|
|
|
|
|
manual_parameters=DocumentSerializers.Operate.get_request_params_api(),
|
|
|
|
|
|
tags=["知识库/文档"])
|
|
|
|
|
|
@has_permissions(
|
|
|
|
|
|
lambda r, k: Permission(group=Group.DATASET, operate=Operate.USE,
|
|
|
|
|
|
dynamic_tag=k.get('dataset_id')))
|
|
|
|
|
|
def get(self, request: Request, dataset_id: str, document_id: str):
|
|
|
|
|
|
return DocumentSerializers.Operate(data={'document_id': document_id, 'dataset_id': dataset_id}).export()
|
|
|
|
|
|
|
2023-10-24 12:24:32 +00:00
|
|
|
|
class Operate(APIView):
|
|
|
|
|
|
authentication_classes = [TokenAuth]
|
|
|
|
|
|
|
|
|
|
|
|
@action(methods=['GET'], detail=False)
|
|
|
|
|
|
@swagger_auto_schema(operation_summary="获取文档详情",
|
|
|
|
|
|
operation_id="获取文档详情",
|
|
|
|
|
|
manual_parameters=DocumentSerializers.Operate.get_request_params_api(),
|
2023-11-16 05:16:27 +00:00
|
|
|
|
responses=result.get_api_response(DocumentSerializers.Operate.get_response_body_api()),
|
2023-12-18 03:32:29 +00:00
|
|
|
|
tags=["知识库/文档"])
|
2023-10-24 12:24:32 +00:00
|
|
|
|
@has_permissions(
|
|
|
|
|
|
lambda r, k: Permission(group=Group.DATASET, operate=Operate.USE,
|
|
|
|
|
|
dynamic_tag=k.get('dataset_id')))
|
|
|
|
|
|
def get(self, request: Request, dataset_id: str, document_id: str):
|
|
|
|
|
|
operate = DocumentSerializers.Operate(data={'document_id': document_id, 'dataset_id': dataset_id})
|
|
|
|
|
|
operate.is_valid(raise_exception=True)
|
|
|
|
|
|
return result.success(operate.one())
|
|
|
|
|
|
|
|
|
|
|
|
@action(methods=['PUT'], detail=False)
|
|
|
|
|
|
@swagger_auto_schema(operation_summary="修改文档",
|
|
|
|
|
|
operation_id="修改文档",
|
|
|
|
|
|
manual_parameters=DocumentSerializers.Operate.get_request_params_api(),
|
|
|
|
|
|
request_body=DocumentSerializers.Operate.get_request_body_api(),
|
2023-11-16 05:16:27 +00:00
|
|
|
|
responses=result.get_api_response(DocumentSerializers.Operate.get_response_body_api()),
|
2023-12-18 03:32:29 +00:00
|
|
|
|
tags=["知识库/文档"]
|
2023-10-24 12:24:32 +00:00
|
|
|
|
)
|
|
|
|
|
|
@has_permissions(
|
|
|
|
|
|
lambda r, k: Permission(group=Group.DATASET, operate=Operate.MANAGE,
|
|
|
|
|
|
dynamic_tag=k.get('dataset_id')))
|
|
|
|
|
|
def put(self, request: Request, dataset_id: str, document_id: str):
|
|
|
|
|
|
return result.success(
|
|
|
|
|
|
DocumentSerializers.Operate(data={'document_id': document_id, 'dataset_id': dataset_id}).edit(
|
|
|
|
|
|
request.data,
|
|
|
|
|
|
with_valid=True))
|
|
|
|
|
|
|
|
|
|
|
|
@action(methods=['DELETE'], detail=False)
|
|
|
|
|
|
@swagger_auto_schema(operation_summary="删除文档",
|
|
|
|
|
|
operation_id="删除文档",
|
|
|
|
|
|
manual_parameters=DocumentSerializers.Operate.get_request_params_api(),
|
2023-11-16 05:16:27 +00:00
|
|
|
|
responses=result.get_default_response(),
|
2023-12-18 03:32:29 +00:00
|
|
|
|
tags=["知识库/文档"])
|
2023-10-24 12:24:32 +00:00
|
|
|
|
@has_permissions(
|
|
|
|
|
|
lambda r, k: Permission(group=Group.DATASET, operate=Operate.MANAGE,
|
|
|
|
|
|
dynamic_tag=k.get('dataset_id')))
|
|
|
|
|
|
def delete(self, request: Request, dataset_id: str, document_id: str):
|
|
|
|
|
|
operate = DocumentSerializers.Operate(data={'document_id': document_id, 'dataset_id': dataset_id})
|
|
|
|
|
|
operate.is_valid(raise_exception=True)
|
|
|
|
|
|
return result.success(operate.delete())
|
|
|
|
|
|
|
2023-11-20 10:53:18 +00:00
|
|
|
|
class SplitPattern(APIView):
|
2024-08-29 02:40:01 +00:00
|
|
|
|
authentication_classes = [TokenAuth]
|
|
|
|
|
|
|
2023-11-20 10:53:18 +00:00
|
|
|
|
@action(methods=['GET'], detail=False)
|
|
|
|
|
|
@swagger_auto_schema(operation_summary="获取分段标识列表",
|
|
|
|
|
|
operation_id="获取分段标识列表",
|
2024-08-29 02:40:01 +00:00
|
|
|
|
tags=["知识库/文档"])
|
2023-11-20 10:53:18 +00:00
|
|
|
|
def get(self, request: Request):
|
|
|
|
|
|
return result.success(DocumentSerializers.SplitPattern.list())
|
|
|
|
|
|
|
2023-10-24 12:24:32 +00:00
|
|
|
|
class Split(APIView):
|
2024-08-29 02:40:01 +00:00
|
|
|
|
authentication_classes = [TokenAuth]
|
2023-10-24 12:24:32 +00:00
|
|
|
|
parser_classes = [MultiPartParser]
|
|
|
|
|
|
|
|
|
|
|
|
@action(methods=['POST'], detail=False)
|
|
|
|
|
|
@swagger_auto_schema(operation_summary="分段文档",
|
|
|
|
|
|
operation_id="分段文档",
|
2023-11-16 05:16:27 +00:00
|
|
|
|
manual_parameters=DocumentSerializers.Split.get_request_params_api(),
|
2024-08-29 02:40:01 +00:00
|
|
|
|
tags=["知识库/文档"])
|
2023-10-24 12:24:32 +00:00
|
|
|
|
def post(self, request: Request):
|
2023-11-20 10:53:18 +00:00
|
|
|
|
split_data = {'file': request.FILES.getlist('file')}
|
|
|
|
|
|
request_data = request.data
|
|
|
|
|
|
if 'patterns' in request.data and request.data.get('patterns') is not None and len(
|
|
|
|
|
|
request.data.get('patterns')) > 0:
|
|
|
|
|
|
split_data.__setitem__('patterns', request_data.getlist('patterns'))
|
|
|
|
|
|
if 'limit' in request.data:
|
|
|
|
|
|
split_data.__setitem__('limit', request_data.get('limit'))
|
|
|
|
|
|
if 'with_filter' in request.data:
|
|
|
|
|
|
split_data.__setitem__('with_filter', request_data.get('with_filter'))
|
2023-10-24 12:24:32 +00:00
|
|
|
|
ds = DocumentSerializers.Split(
|
2023-11-20 10:53:18 +00:00
|
|
|
|
data=split_data)
|
2023-10-24 12:24:32 +00:00
|
|
|
|
ds.is_valid(raise_exception=True)
|
|
|
|
|
|
return result.success(ds.parse())
|
|
|
|
|
|
|
|
|
|
|
|
class Page(APIView):
|
|
|
|
|
|
authentication_classes = [TokenAuth]
|
|
|
|
|
|
|
|
|
|
|
|
@action(methods=['GET'], detail=False)
|
2023-12-18 03:32:29 +00:00
|
|
|
|
@swagger_auto_schema(operation_summary="获取知识库分页列表",
|
|
|
|
|
|
operation_id="获取知识库分页列表",
|
2023-10-24 12:24:32 +00:00
|
|
|
|
manual_parameters=DocumentSerializers.Query.get_request_params_api(),
|
2023-11-16 05:16:27 +00:00
|
|
|
|
responses=result.get_page_api_response(DocumentSerializers.Query.get_response_body_api()),
|
2023-12-18 03:32:29 +00:00
|
|
|
|
tags=["知识库/文档"])
|
2023-10-24 12:24:32 +00:00
|
|
|
|
@has_permissions(
|
|
|
|
|
|
lambda r, k: Permission(group=Group.DATASET, operate=Operate.USE,
|
|
|
|
|
|
dynamic_tag=k.get('dataset_id')))
|
|
|
|
|
|
def get(self, request: Request, dataset_id: str, current_page, page_size):
|
|
|
|
|
|
d = DocumentSerializers.Query(
|
|
|
|
|
|
data={**query_params_to_single_dict(request.query_params), 'dataset_id': dataset_id})
|
|
|
|
|
|
d.is_valid(raise_exception=True)
|
|
|
|
|
|
return result.success(d.page(current_page, page_size))
|