mirror of
https://github.com/infiniflow/ragflow.git
synced 2026-06-29 15:31:05 +08:00
## Summary Migrate the batch document deletion endpoint from Python to Go. Two modes supported: explicit `ids` list and `delete_all`. ## Changes | File | Change | |------|--------| | `internal/dao/file2document.go` | Add `GetByDocumentID`, `DeleteByDocumentID` | | `internal/dao/file2document_test.go` | 5 new tests | | `internal/dao/kb_test.go` | 2 new tests (`DecreaseDocumentNum`) | | `internal/service/document.go` | Add `deleteDocumentFull` + `DeleteDocuments`, refactor `DeleteDocument` | | `internal/service/document_test.go` | 10 new tests | | `internal/handler/document.go` | Add `documentServiceIface` + `DeleteDocuments` handler | | `internal/handler/document_test.go` | 7 new tests | | `internal/router/router.go` | Register `DELETE /:dataset_id/documents` | | `cmd/server_main.go` | Support `RAGFLOW_DICT_PATH` env var | | `internal/binding/rag_analyzer.go` | Use `-lpcre2-8` dynamic linking | | `internal/dao/database.go` | Skip Error 1091/1138 during migration | | `internal/service/llm.go` | Fix vet warning | ## Per-document cleanup - Delete tasks from DB - Hard-delete document + decrement KB counters - Delete chunks from document engine (nil-guarded) - Delete metadata from document engine (nil-guarded) - Remove file2document mapping + file record + storage blob ## Test Results **24 unit tests all passing** (7 DAO + 10 service + 7 handler) using SQLite :memory: + gin.TestMode. See [test report](docs/test_report_delete_documents.md) for manual integration test results. 🤖 Generated with [Claude Code](https://claude.com/claude-code) Co-Authored-By: Claude Opus 4.8 <noreply@anthropic.com> --------- Co-authored-by: Claude Opus 4.8 <noreply@anthropic.com>
85 lines
2.8 KiB
Go
85 lines
2.8 KiB
Go
//
|
|
// Copyright 2026 The InfiniFlow Authors. All Rights Reserved.
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
// you may not use this file except in compliance with the License.
|
|
// You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
//
|
|
|
|
package dao
|
|
|
|
import (
|
|
"ragflow/internal/entity"
|
|
)
|
|
|
|
// File2DocumentDAO file to document mapping data access object
|
|
type File2DocumentDAO struct{}
|
|
|
|
// NewFile2DocumentDAO create file2document DAO
|
|
func NewFile2DocumentDAO() *File2DocumentDAO {
|
|
return &File2DocumentDAO{}
|
|
}
|
|
|
|
// GetKBInfoByFileID gets knowledge base info by file ID
|
|
func (dao *File2DocumentDAO) GetKBInfoByFileID(fileID string) ([]map[string]interface{}, error) {
|
|
var results []map[string]interface{}
|
|
|
|
rows, err := DB.Model(&entity.File{}).
|
|
Select("knowledgebase.id, knowledgebase.name, file2document.document_id").
|
|
Joins("JOIN file2document ON file2document.file_id = ?", fileID).
|
|
Joins("JOIN document ON document.id = file2document.document_id").
|
|
Joins("JOIN knowledgebase ON knowledgebase.id = document.kb_id").
|
|
Where("file.id = ?", fileID).
|
|
Rows()
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
defer rows.Close()
|
|
|
|
for rows.Next() {
|
|
var kbID, kbName, docID string
|
|
if err := rows.Scan(&kbID, &kbName, &docID); err != nil {
|
|
continue
|
|
}
|
|
results = append(results, map[string]interface{}{
|
|
"kb_id": kbID,
|
|
"kb_name": kbName,
|
|
"document_id": docID,
|
|
})
|
|
}
|
|
|
|
return results, nil
|
|
}
|
|
|
|
// GetByFileID gets file2document mappings by file ID
|
|
func (dao *File2DocumentDAO) GetByFileID(fileID string) ([]*entity.File2Document, error) {
|
|
var mappings []*entity.File2Document
|
|
err := DB.Where("file_id = ?", fileID).Find(&mappings).Error
|
|
return mappings, err
|
|
}
|
|
|
|
// DeleteByFileID deletes file2document mappings by file ID
|
|
func (dao *File2DocumentDAO) DeleteByFileID(fileID string) error {
|
|
return DB.Unscoped().Where("file_id = ?", fileID).Delete(&entity.File2Document{}).Error
|
|
}
|
|
|
|
// GetByDocumentID gets file2document mappings by document ID
|
|
func (dao *File2DocumentDAO) GetByDocumentID(docID string) ([]*entity.File2Document, error) {
|
|
var mappings []*entity.File2Document
|
|
err := DB.Where("document_id = ?", docID).Find(&mappings).Error
|
|
return mappings, err
|
|
}
|
|
|
|
// DeleteByDocumentID deletes file2document mappings by document ID
|
|
func (dao *File2DocumentDAO) DeleteByDocumentID(docID string) error {
|
|
return DB.Unscoped().Where("document_id = ?", docID).Delete(&entity.File2Document{}).Error
|
|
}
|