mirror of
https://github.com/infiniflow/ragflow.git
synced 2026-07-04 18:45:38 +08:00
### What problem does this PR solve? Fix: Uploading TSV format documents to the knowledge base did not generate any error messages. ### Type of change - [x] Bug Fix (non-breaking change which fixes an issue)
409 lines
12 KiB
TypeScript
409 lines
12 KiB
TypeScript
import { IRenameTag } from '@/interfaces/database/dataset';
|
|
import {
|
|
IFetchDocumentListRequestBody,
|
|
IFetchKnowledgeListRequestParams,
|
|
} from '@/interfaces/request/knowledge';
|
|
import { ProcessingType } from '@/pages/dataset/dataset-overview/dataset-common';
|
|
import api from '@/utils/api';
|
|
import registerServer from '@/utils/register-server';
|
|
import request from '@/utils/request';
|
|
|
|
const {
|
|
createKb,
|
|
rmKb,
|
|
kbList,
|
|
documentThumbnails,
|
|
documentIngest,
|
|
listTagByKnowledgeIds,
|
|
setMeta,
|
|
getMeta,
|
|
getMetaKeys,
|
|
retrievalTestShare,
|
|
} = api;
|
|
|
|
const methods = {
|
|
createKb: {
|
|
url: createKb,
|
|
method: 'post',
|
|
},
|
|
rmKb: {
|
|
url: rmKb,
|
|
method: 'delete',
|
|
},
|
|
getList: {
|
|
url: kbList,
|
|
method: 'get',
|
|
},
|
|
documentIngest: {
|
|
url: documentIngest,
|
|
method: 'post',
|
|
},
|
|
documentThumbnails: {
|
|
url: documentThumbnails,
|
|
method: 'get',
|
|
},
|
|
setMeta: {
|
|
url: setMeta,
|
|
method: 'post',
|
|
},
|
|
listTagByKnowledgeIds: {
|
|
url: listTagByKnowledgeIds,
|
|
method: 'get',
|
|
},
|
|
getMeta: {
|
|
url: getMeta,
|
|
method: 'get',
|
|
},
|
|
getMetaKeys: {
|
|
url: getMetaKeys,
|
|
method: 'get',
|
|
},
|
|
retrievalTestShare: {
|
|
url: retrievalTestShare,
|
|
method: 'post',
|
|
},
|
|
pipelineRerun: {
|
|
url: api.pipelineRerun,
|
|
method: 'post',
|
|
},
|
|
};
|
|
|
|
const baseKbService = registerServer<keyof typeof methods>(methods, request);
|
|
|
|
const getDatasetId = (params: Record<string, any>) =>
|
|
params.dataset_id || params.kb_id || params.knowledge_id;
|
|
|
|
const getDocumentId = (params: Record<string, any>) =>
|
|
params.document_id || params.doc_id;
|
|
|
|
const mapChunkToLegacy = (chunk: Record<string, any>) => ({
|
|
...chunk,
|
|
chunk_id: chunk.chunk_id || chunk.id,
|
|
content_with_weight: chunk.content_with_weight || chunk.content,
|
|
doc_id: chunk.doc_id || chunk.document_id,
|
|
doc_name: chunk.doc_name || chunk.docnm_kwd,
|
|
image_id: chunk.image_id || chunk.img_id,
|
|
important_kwd: chunk.important_kwd || chunk.important_keywords || [],
|
|
question_kwd: chunk.question_kwd || chunk.questions || [],
|
|
available_int: chunk.available_int ?? (chunk.available === false ? 0 : 1),
|
|
positions: chunk.positions || chunk.position_int || [],
|
|
});
|
|
|
|
const mapDocumentToLegacy = (doc: Record<string, any>) => ({
|
|
...doc,
|
|
chunk_num: doc.chunk_num ?? doc.chunk_count,
|
|
kb_id: doc.kb_id || doc.dataset_id,
|
|
parser_id: doc.parser_id || doc.chunk_method,
|
|
});
|
|
|
|
const mapChunkPayloadToRest = (payload: Record<string, any>) => ({
|
|
content: payload.content ?? payload.content_with_weight,
|
|
important_keywords: payload.important_keywords ?? payload.important_kwd,
|
|
questions: payload.questions ?? payload.question_kwd,
|
|
tag_kwd: payload.tag_kwd,
|
|
tag_feas: payload.tag_feas,
|
|
positions: payload.positions,
|
|
available:
|
|
payload.available ??
|
|
(payload.available_int === undefined
|
|
? undefined
|
|
: payload.available_int === 1),
|
|
image_base64: payload.image_base64,
|
|
});
|
|
|
|
const getAvailableParam = (available?: number) => {
|
|
if (available === undefined) {
|
|
return undefined;
|
|
}
|
|
return available === 1 ? 'true' : 'false';
|
|
};
|
|
|
|
const chunkService = {
|
|
retrievalTest: async (params: Record<string, any>) => {
|
|
const datasetId = params.dataset_id || params.kb_id || params.knowledge_id;
|
|
if (!datasetId) {
|
|
throw new Error(
|
|
'dataset_id (or kb_id/knowledge_id) is required for retrievalTest',
|
|
);
|
|
}
|
|
const datasetIds = Array.isArray(datasetId) ? datasetId : [datasetId];
|
|
const rest = { ...params };
|
|
delete rest.dataset_id;
|
|
delete rest.kb_id;
|
|
delete rest.knowledge_id;
|
|
return request.post(api.retrievalTest, {
|
|
data: { ...rest, dataset_ids: datasetIds },
|
|
});
|
|
},
|
|
chunkList: async (params: Record<string, any>) => {
|
|
const datasetId = getDatasetId(params);
|
|
const documentId = getDocumentId(params);
|
|
const response = await request.get(api.chunkList(datasetId, documentId), {
|
|
params: {
|
|
page: params.page,
|
|
page_size: params.page_size || params.size,
|
|
keywords: params.keywords,
|
|
available: getAvailableParam(params.available_int),
|
|
},
|
|
});
|
|
|
|
if (response.data?.code === 0) {
|
|
response.data.data = {
|
|
...response.data.data,
|
|
chunks: (response.data.data?.chunks || []).map(mapChunkToLegacy),
|
|
doc: mapDocumentToLegacy(response.data.data?.doc || {}),
|
|
};
|
|
}
|
|
|
|
return response;
|
|
},
|
|
createChunk: async (payload: Record<string, any>) => {
|
|
const datasetId = getDatasetId(payload);
|
|
const documentId = getDocumentId(payload);
|
|
const response = await request.post(api.chunkList(datasetId, documentId), {
|
|
data: mapChunkPayloadToRest(payload),
|
|
});
|
|
|
|
if (response.data?.code === 0 && response.data.data?.chunk) {
|
|
response.data.data.chunk = mapChunkToLegacy(response.data.data.chunk);
|
|
}
|
|
|
|
return response;
|
|
},
|
|
setChunk: (payload: Record<string, any>) => {
|
|
const datasetId = getDatasetId(payload);
|
|
const documentId = getDocumentId(payload);
|
|
const chunkId = payload.chunk_id || payload.id;
|
|
return request.patch(api.chunkDetail(datasetId, documentId, chunkId), {
|
|
data: mapChunkPayloadToRest(payload),
|
|
});
|
|
},
|
|
getChunk: async (params: Record<string, any>) => {
|
|
const datasetId = getDatasetId(params);
|
|
const documentId = getDocumentId(params);
|
|
const chunkId = params.chunk_id || params.id;
|
|
const response = await request.get(
|
|
api.chunkDetail(datasetId, documentId, chunkId),
|
|
);
|
|
|
|
if (response.data?.code === 0) {
|
|
response.data.data = mapChunkToLegacy(response.data.data || {});
|
|
}
|
|
|
|
return response;
|
|
},
|
|
switchChunk: (params: Record<string, any>) => {
|
|
const datasetId = getDatasetId(params);
|
|
const documentId = getDocumentId(params);
|
|
return request.patch(api.chunkList(datasetId, documentId), {
|
|
data: {
|
|
chunk_ids: params.chunk_ids || params.chunkIds,
|
|
available_int: params.available_int,
|
|
},
|
|
});
|
|
},
|
|
rmChunk: (params: Record<string, any>) => {
|
|
const datasetId = getDatasetId(params);
|
|
const documentId = getDocumentId(params);
|
|
return request.delete(api.chunkList(datasetId, documentId), {
|
|
data: {
|
|
chunk_ids: params.chunk_ids || params.chunkIds,
|
|
delete_all: params.delete_all,
|
|
},
|
|
});
|
|
},
|
|
};
|
|
|
|
const kbService = {
|
|
...baseKbService,
|
|
...chunkService,
|
|
};
|
|
|
|
export const getKbDetail = async (datasetId: string) => {
|
|
const response = await request.get(api.getKbDetail(datasetId));
|
|
// The /api/v1/datasets/<id> endpoint returns chunk_count/document_count,
|
|
// but legacy consumers (e.g. the GraphRAG/Raptor "magic wand" enable check
|
|
// in dataset/index.tsx) read chunk_num/doc_num. Normalize both shapes.
|
|
if (response.data?.code === 0 && response.data.data) {
|
|
const d = response.data.data;
|
|
response.data.data = {
|
|
...d,
|
|
chunk_num: d.chunk_num ?? d.chunk_count,
|
|
doc_num: d.doc_num ?? d.document_count,
|
|
};
|
|
}
|
|
return response;
|
|
};
|
|
|
|
export const listTag = (knowledgeId: string) =>
|
|
request.get(api.listTag(knowledgeId));
|
|
|
|
export const removeTag = (knowledgeId: string, tags: string[]) =>
|
|
request.delete(api.removeTag(knowledgeId), { data: { tags } });
|
|
|
|
export const renameTag = (
|
|
knowledgeId: string,
|
|
{ fromTag, toTag }: IRenameTag,
|
|
) => request.put(api.renameTag(knowledgeId), { data: { fromTag, toTag } });
|
|
|
|
export function getKnowledgeGraph(knowledgeId: string) {
|
|
return request.get(api.getKnowledgeGraph(knowledgeId));
|
|
}
|
|
|
|
export function deleteKnowledgeGraph(knowledgeId: string) {
|
|
return request.delete(api.knowledgeGraph(knowledgeId));
|
|
}
|
|
|
|
export const listDataset = (params?: IFetchKnowledgeListRequestParams) =>
|
|
request.get(api.kbList, { params });
|
|
|
|
export const updateKb = (datasetId: string, data: Record<string, any>) =>
|
|
request.put(api.updateKb(datasetId), { data });
|
|
|
|
export const runIndex = (datasetId: string, indexType: string) =>
|
|
request.post(api.runIndex(datasetId, indexType));
|
|
|
|
export const traceIndex = (datasetId: string, indexType: string) =>
|
|
request.get(api.traceIndex(datasetId, indexType));
|
|
|
|
// Using RESTful API: GET /api/v1/datasets/{dataset_id}/documents
|
|
export const listDocument = (
|
|
params?: IFetchKnowledgeListRequestParams,
|
|
body?: IFetchDocumentListRequestBody,
|
|
) => {
|
|
if (!params || !params.id) {
|
|
throw new Error('params and params.id are required');
|
|
}
|
|
// Extract page, page_size, and ext.keywords from params
|
|
const { page, page_size, ext } = params;
|
|
// Merge: page, page_size, keywords (from ext), body, and remaining params
|
|
const mergedParams = {
|
|
page,
|
|
page_size,
|
|
keywords: ext?.keywords,
|
|
...body,
|
|
};
|
|
return request.get(api.getDocumentList(params.id), { params: mergedParams });
|
|
};
|
|
|
|
export const documentFilter = (kb_id: string) =>
|
|
request.get(api.getDatasetFilter(kb_id), { params: {} });
|
|
|
|
export const uploadDocument = async (datasetId: string, formData: FormData) => {
|
|
const url = api.documentUpload(datasetId);
|
|
const response = await request.post(url, { data: formData });
|
|
return response.data;
|
|
};
|
|
|
|
export const createDocument = async (datasetId: string, name: string) => {
|
|
const response = await request.post(api.documentCreate(datasetId), {
|
|
data: { name },
|
|
});
|
|
return response.data;
|
|
};
|
|
|
|
export const renameDocument = (
|
|
datasetId: string,
|
|
documentId: string,
|
|
data: { name?: string },
|
|
) => request.patch(api.documentRename(datasetId, documentId), { data });
|
|
|
|
export const changeDocumentParser = (
|
|
datasetId: string,
|
|
documentId: string,
|
|
data: { name?: string },
|
|
) => request.patch(api.documentChangeParser(datasetId, documentId), { data });
|
|
|
|
export const deleteDocument = (datasetId: string, documentIds: string[]) =>
|
|
request.delete(api.documentDelete(datasetId), { data: { ids: documentIds } });
|
|
|
|
export const getMetaDataService = ({
|
|
kb_id,
|
|
doc_ids,
|
|
}: {
|
|
kb_id: string;
|
|
doc_ids?: string[];
|
|
}) =>
|
|
request.get(api.getMetaData(kb_id), {
|
|
params: doc_ids?.length ? { doc_ids: doc_ids.join(',') } : undefined,
|
|
});
|
|
export const updateDocumentsMetadata = ({
|
|
dataset_id,
|
|
selector,
|
|
updates,
|
|
deletes,
|
|
}: {
|
|
dataset_id: string;
|
|
selector?: {
|
|
document_ids?: string[];
|
|
metadata_condition?: any;
|
|
};
|
|
updates?: any[];
|
|
deletes?: any[];
|
|
}) =>
|
|
request.patch(api.updateDocumentsMetadata(dataset_id), {
|
|
data: { selector, updates, deletes },
|
|
});
|
|
|
|
export const updateDocumentMetaDataConfig = ({
|
|
kb_id,
|
|
doc_id,
|
|
data,
|
|
}: {
|
|
kb_id: string;
|
|
doc_id: string;
|
|
data: any;
|
|
}) =>
|
|
request.put(api.documentUpdateMetaDataConfig(kb_id, doc_id), {
|
|
data: { ...data },
|
|
});
|
|
|
|
export const changeDocumentsStatus = ({
|
|
kb_id,
|
|
doc_ids,
|
|
status,
|
|
}: {
|
|
kb_id: string;
|
|
doc_ids?: string[];
|
|
status: number;
|
|
}) =>
|
|
request.post(api.documentChangeStatus(kb_id), { data: { doc_ids, status } });
|
|
|
|
export const listDataPipelineLogDocument = (
|
|
datasetId: string,
|
|
params?: Record<string, any>,
|
|
) => request.get(api.fetchDataPipelineLog(datasetId), { params });
|
|
|
|
export const listPipelineDatasetLogs = (
|
|
datasetId: string,
|
|
params?: Record<string, any>,
|
|
) => request.get(api.fetchPipelineDatasetLogs(datasetId), { params });
|
|
|
|
export const getPipelineDetail = (datasetId: string, logId: string) =>
|
|
request.get(api.getPipelineDetail(datasetId, logId));
|
|
|
|
export const getKnowledgeBasicInfo = (datasetId: string) =>
|
|
request.get(api.getKnowledgeBasicInfo(datasetId));
|
|
|
|
export const checkEmbedding = (datasetId: string, data: Record<string, any>) =>
|
|
request.post(api.checkEmbedding(datasetId), { data });
|
|
|
|
export const kbUpdateMetaData = (
|
|
datasetId: string,
|
|
data: Record<string, any>,
|
|
) => request.put(api.kbUpdateMetaData(datasetId), { data });
|
|
|
|
export function deletePipelineTask({
|
|
kb_id,
|
|
type,
|
|
wipe,
|
|
}: {
|
|
kb_id: string;
|
|
type: ProcessingType;
|
|
wipe?: boolean;
|
|
}) {
|
|
return request.delete(api.unbindPipelineTask(kb_id, type, wipe));
|
|
}
|
|
|
|
export default kbService;
|