Files
ragflow/web/src/interfaces/database/document.ts
Wang Qi 13b422037f Refactor: enhance graphrag - part 2 (#14972)
### What problem does this PR solve?
1. expose batch_chunk_token_size for configuration
2. retrieve chunks when building the subgraph for each doc, instead of retrieving all
docs' chunks at the beginning
3. get all chunks for a document (the limit used to be hard-coded to 10000)
4. delete the unused method run_graphrag

### Type of change

- [x] New Feature (non-breaking change which adds functionality)
- [x] Refactoring

Follow on: #14617
2026-05-18 16:10:21 +08:00

83 lines
1.8 KiB
TypeScript

import { RunningStatus } from '@/constants/knowledge';
/**
 * A single document entry together with its parsing/processing state.
 *
 * NOTE(review): the group headings below are inferred from field names only;
 * confirm exact semantics against the API that produces this payload.
 */
export interface IDocumentInfo {
  // Identity and ownership.
  id: string;
  dataset_id: string;
  name: string;
  nickname: string;
  created_by: string;

  // File attributes.
  location: string;
  size: number;
  suffix: string;
  type: string;
  source_type: string;
  thumbnail: string;
  status: string;

  // Timestamps: each one is exposed as a string (`*_date`) and a number (`*_time`).
  create_date: string;
  create_time: number;
  update_date: string;
  update_time: number;

  // Parsing configuration.
  parser_config: IParserConfig;
  chunk_method: string;
  // parser_id: string;  (disabled in the original declaration; presumably superseded by chunk_method — confirm)
  pipeline_id: string;
  pipeline_name: string;

  // Processing state.
  run: RunningStatus;
  progress: number;
  progress_msg: string;
  process_begin_at?: string;
  process_duration: number;

  // Counters.
  chunk_count: number;
  // chunk_num: number;  (disabled in the original declaration; presumably superseded by chunk_count — confirm)
  token_num: number;

  // Optional free-form metadata keyed by string.
  meta_fields?: Record<string, any>;
}
/**
 * Parser settings attached to a document (see `IDocumentInfo.parser_config`).
 * Every member is optional.
 *
 * NOTE(review): the group headings are inferred from field names only —
 * confirm semantics with the backend parser configuration.
 */
export interface IParserConfig {
  // Chunking and paging.
  chunk_token_num?: number;
  delimiter?: string;
  task_page_size?: number;
  pages?: any[];

  // Layout handling.
  layout_recognize?: string;
  html4excel?: boolean;
  toc_extraction?: boolean;

  // Automatic enrichment.
  auto_keywords?: number;
  auto_questions?: number;
  entity_types?: string[];

  // Image / table context.
  image_context_window?: number;
  image_table_context_window?: number;
  image_context_size?: number;
  table_context_size?: number;

  // MinerU options.
  mineru_parse_method?: 'auto' | 'txt' | 'ocr';
  mineru_formula_enable?: boolean;
  mineru_table_enable?: boolean;
  mineru_lang?: string;

  // Metadata field definitions.
  enable_metadata?: boolean;
  metadata?: {
    key?: string;
    description?: string;
    enum?: string[];
  }[];

  // Nested feature configurations.
  raptor?: Raptor;
  graphrag?: GraphRag;
}
/** RAPTOR section of the parser configuration (see `IParserConfig.raptor`). */
interface Raptor {
  /** Required flag; presumably toggles RAPTOR processing — confirm with backend. */
  use_raptor: boolean;
}
/**
 * GraphRAG section of the parser configuration (see `IParserConfig.graphrag`).
 * Every member is optional.
 *
 * NOTE(review): member meanings are inferred from their names — confirm
 * against the backend GraphRAG settings.
 */
interface GraphRag {
  // Feature switches.
  use_graphrag?: boolean;
  resolution?: boolean;
  community?: boolean;

  // Extraction settings.
  method?: string;
  entity_types?: string[];
  batch_chunk_token_size?: number;
}
/**
 * Filter summary for a document list: three lookup tables with numeric values.
 *
 * NOTE(review): the values look like per-bucket document counts — confirm
 * against the endpoint that returns this structure.
 */
export type IDocumentInfoFilter = {
  /** Two-level table: outer string key -> inner string key -> number. */
  metadata: Record<string, Record<string, number>>;
  /** Numeric key -> number (presumably keyed by run status code). */
  run_status: Record<number, number>;
  /** String key -> number (presumably keyed by file suffix). */
  suffix: Record<string, number>;
};