mirror of
https://github.com/infiniflow/ragflow.git
synced 2026-07-02 00:35:46 +08:00
### What problem does this PR solve? 1. Go ingestion server will connected with admin server with gRPC stream 2. Go ingestion server will be responsible for ingestion tasks ``` RAGFlow(admin)> list ingestors; +-----------------+-----------+----------------------------------+---------------------------+----------+------------+--------------+--------+------------+---------------+ | address | cpu_usage | id | last_heartbeat | name | process_id | rss_usage | status | task_count | vms_usage | +-----------------+-----------+----------------------------------+---------------------------+----------+------------+--------------+--------+------------+---------------+ | 127.0.0.1:58564 | 0 | bdd1870eea2646e0aacb8a2cd3307aa2 | 2026-05-24T18:16:17+08:00 | ingestor | 680152 | 212.72265625 | active | 0 | 2589.12109375 | +-----------------+-----------+----------------------------------+---------------------------+----------+------------+--------------+--------+------------+---------------+ RAGFlow(admin)> start ingestion 'abc'; +----------------------------------+ | task_id | +----------------------------------+ | e714777639ca4760ab427b5f211e81ad | +----------------------------------+ RAGFlow(admin)> stop ingestion 'f7bd39d0a724457eb5fdce6d81699776'; +----------------------------------+ | task_id | +----------------------------------+ | f7bd39d0a724457eb5fdce6d81699776 | +----------------------------------+ RAGFlow(admin)> list tasks; +-----+----------------------------------+-------+------+----------------------------------+---------------------------+------------+------------+ | ETA | assign_to | error | from | id | last_update | start_time | status | +-----+----------------------------------+-------+------+----------------------------------+---------------------------+------------+------------+ | 0 | 17937da188b84f23a5c10bb87588944b | | CLI | eae6431da72a40e796cff3a03008091b | 2026-05-24T19:46:03+08:00 | | COMPLETED | | 0 | 17937da188b84f23a5c10bb87588944b | | CLI | 6cccdd174bd049ecb05a774bbb47593f | 2026-05-24T19:46:03+08:00 | | COMPLETED | | 0 | 17937da188b84f23a5c10bb87588944b | | CLI | ef360d777e57485799adb96b30f2b4b8 | 2026-05-24T19:46:03+08:00 | | CANCELED | | 0 | 17937da188b84f23a5c10bb87588944b | | CLI | bcc5c5448cb64de48b6b6171c36fb790 | 2026-05-24T19:46:03+08:00 | | CANCELED | | 0 | 17937da188b84f23a5c10bb87588944b | | CLI | bfc25384c43a443294fe2da979a38ac2 | 2026-05-24T19:46:03+08:00 | | DISPATCHED | | 0 | 17937da188b84f23a5c10bb87588944b | | CLI | 84960537b85d413b8990a9efd5952d67 | 2026-05-24T19:46:04+08:00 | | DISPATCHED | | 0 | 17937da188b84f23a5c10bb87588944b | | CLI | 3d223c1b51e24b36861a3bfb2f1d58d4 | 2026-05-24T19:46:03+08:00 | | CANCELED | | 0 | 17937da188b84f23a5c10bb87588944b | | CLI | e433b0e356b846c89c301621a3c54494 | 2026-05-24T19:46:03+08:00 | | COMPLETED | | 0 | 17937da188b84f23a5c10bb87588944b | | CLI | 7c93a3880f074ebd8eca14e6b51bb7ef | 2026-05-24T19:46:03+08:00 | | COMPLETED | | 0 | 17937da188b84f23a5c10bb87588944b | | CLI | df2e4ef51aaf4390bff9a23f2692486e | 2026-05-24T19:46:04+08:00 | | DISPATCHED | | 0 | 17937da188b84f23a5c10bb87588944b | | CLI | 7377c53010194ef7a83aa206698d66ff | 2026-05-24T19:46:05+08:00 | | DISPATCHED | | 0 | 17937da188b84f23a5c10bb87588944b | | CLI | df64d1a1f9d348e3a2f174c4d7d69e73 | 2026-05-24T19:46:05+08:00 | | DISPATCHED | | 0 | 17937da188b84f23a5c10bb87588944b | | CLI | b59834512e2847e1bdf13ace04b8a456 | 2026-05-24T19:46:06+08:00 | | DISPATCHED | | 0 | 17937da188b84f23a5c10bb87588944b | | CLI | 0064bb0ab69344028d1ecfda053826f4 | 2026-05-24T19:46:03+08:00 | | QUEUED | +-----+----------------------------------+-------+------+----------------------------------+---------------------------+------------+------------+ ``` ### Type of change - [x] New Feature (non-breaking change which adds functionality) --------- Signed-off-by: Jin Hai <haijin.chn@gmail.com>
588 lines
16 KiB
Go
588 lines
16 KiB
Go
//
|
|
// Copyright 2026 The InfiniFlow Authors. All Rights Reserved.
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
// you may not use this file except in compliance with the License.
|
|
// You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
//
|
|
|
|
package admin
|
|
|
|
import (
|
|
"context"
|
|
"fmt"
|
|
"net"
|
|
"sync"
|
|
"time"
|
|
|
|
"ragflow/internal/common"
|
|
|
|
"google.golang.org/grpc"
|
|
"google.golang.org/grpc/peer"
|
|
)
|
|
|
|
const heartbeatTimeout = 30 * time.Second
|
|
|
|
type IngestionManager struct {
|
|
common.UnimplementedIngestionManagerServer
|
|
mu sync.RWMutex
|
|
|
|
// Registered ingestion servers
|
|
ingestionServers map[string]*IngestorState // ingestor id -> ingestor id
|
|
|
|
taskStates map[string]*TaskState // task_id -> task state
|
|
|
|
// In-memory task queue
|
|
taskQueue chan *pendingTask
|
|
|
|
// Notifies that an ingestor slot may have freed up
|
|
slotFreed chan struct{}
|
|
|
|
grpcServer *grpc.Server // gRPC server instance for graceful shutdown via Stop()
|
|
|
|
ctx context.Context
|
|
cancel context.CancelFunc
|
|
}
|
|
|
|
type TaskState struct {
|
|
taskID string // same as task_id in database
|
|
status string // created, assigned, processing, completed, failed
|
|
comeFrom string // api server id
|
|
assignTo string // ingestor id
|
|
lastUpdate time.Time
|
|
startTime *time.Time
|
|
estimatedRemainingTime time.Duration // estimated cost in seconds to complete the task
|
|
errorMessage string
|
|
}
|
|
|
|
type IngestorState struct {
|
|
ID string
|
|
Info *common.RegisterInfo
|
|
LastHeartbeat time.Time
|
|
Stream common.IngestionManager_ActionServer
|
|
Status string // active, draining
|
|
Address string
|
|
ProcessID int64
|
|
cpuUsage float64
|
|
vmsUsage float64
|
|
rssUsage float64
|
|
}
|
|
|
|
type pendingTask struct {
|
|
Task *common.TaskAssignment
|
|
CreatedAt time.Time
|
|
}
|
|
|
|
var ingestionManager *IngestionManager
|
|
|
|
func GetIngestionManager() *IngestionManager {
|
|
return ingestionManager
|
|
}
|
|
|
|
func NewAdminServer() *IngestionManager {
|
|
ctx, cancel := context.WithCancel(context.Background())
|
|
ingestionManager = &IngestionManager{
|
|
taskStates: make(map[string]*TaskState),
|
|
ingestionServers: make(map[string]*IngestorState),
|
|
taskQueue: make(chan *pendingTask, 10000),
|
|
slotFreed: make(chan struct{}, 100),
|
|
ctx: ctx,
|
|
cancel: cancel,
|
|
}
|
|
go ingestionManager.dispatchLoop()
|
|
//go ingestionManager.heartbeatCheckLoop() no need to check heartbeat timeout
|
|
return ingestionManager
|
|
}
|
|
|
|
// Action handles the bidirectional streaming RPC from ingestion servers
|
|
func (s *IngestionManager) Action(stream common.IngestionManager_ActionServer) error {
|
|
var ingestionServerID string
|
|
var state *IngestorState
|
|
|
|
common.Info("New ingestion_server connection")
|
|
|
|
// Start receive goroutine
|
|
receiveErrorCH := make(chan error, 1)
|
|
go func() {
|
|
for {
|
|
msg, err := stream.Recv()
|
|
if err != nil {
|
|
receiveErrorCH <- err
|
|
return
|
|
}
|
|
s.handleMessage(stream, msg, &ingestionServerID, &state)
|
|
}
|
|
}()
|
|
|
|
// Start send goroutine: send tasks immediately when assigned to this ingestion_server
|
|
sendDone := make(chan struct{})
|
|
go func() {
|
|
defer close(sendDone)
|
|
for {
|
|
select {
|
|
case <-stream.Context().Done():
|
|
return
|
|
case <-s.ctx.Done():
|
|
return
|
|
}
|
|
}
|
|
}()
|
|
|
|
select {
|
|
case err := <-receiveErrorCH:
|
|
// Connection dropped, clean up
|
|
s.cleanupIngestionServer(ingestionServerID)
|
|
return err
|
|
case <-sendDone:
|
|
// Stream context canceled (client disconnect or server shutdown)
|
|
s.cleanupIngestionServer(ingestionServerID)
|
|
return nil
|
|
}
|
|
}
|
|
|
|
func (s *IngestionManager) handleMessage(
|
|
stream common.IngestionManager_ActionServer,
|
|
msg *common.IngestionMessage,
|
|
ingestionServerID *string,
|
|
state **IngestorState,
|
|
) {
|
|
switch msg.MessageType {
|
|
case "REGISTER":
|
|
s.handleRegister(stream, msg, ingestionServerID, state)
|
|
|
|
case "HEARTBEAT":
|
|
s.handleHeartbeat(msg, *ingestionServerID, *state)
|
|
|
|
case "TASK_RESULT":
|
|
s.handleTaskResult(msg, *ingestionServerID, *state)
|
|
|
|
case "TASK_PROGRESS":
|
|
s.handleTaskProgress(msg, *ingestionServerID, *state)
|
|
|
|
default:
|
|
common.Info(fmt.Sprintf("Unknown message type: %s", msg.MessageType))
|
|
err := stream.Send(&common.AdminMessage{
|
|
MessageType: "ERROR",
|
|
ErrorMessage: "unknown message type",
|
|
})
|
|
if err != nil {
|
|
common.Error("Fail to send unknown message", err)
|
|
return
|
|
}
|
|
}
|
|
}
|
|
|
|
func (s *IngestionManager) handleRegister(
|
|
stream common.IngestionManager_ActionServer,
|
|
msg *common.IngestionMessage,
|
|
ingestionServerID *string,
|
|
state **IngestorState,
|
|
) {
|
|
if msg.RegisterInfo == nil {
|
|
err := stream.Send(&common.AdminMessage{
|
|
MessageType: "ERROR",
|
|
ErrorMessage: "missing register info",
|
|
})
|
|
if err != nil {
|
|
common.Error("Fail to send missing register info", err)
|
|
return
|
|
}
|
|
return
|
|
}
|
|
|
|
peerHost, ok := peer.FromContext(stream.Context())
|
|
if !ok {
|
|
err := stream.Send(&common.AdminMessage{
|
|
MessageType: "ERROR",
|
|
ErrorMessage: "peer not found in context",
|
|
})
|
|
if err != nil {
|
|
common.Error("Fail to send 'peer not found' message", err)
|
|
return
|
|
}
|
|
return
|
|
}
|
|
clientAddr := peerHost.Addr.String()
|
|
|
|
*ingestionServerID = msg.IngestorId
|
|
*state = &IngestorState{
|
|
ID: msg.IngestorId,
|
|
Info: msg.RegisterInfo,
|
|
LastHeartbeat: time.Now().Truncate(time.Second),
|
|
Stream: stream,
|
|
Status: "active",
|
|
Address: clientAddr,
|
|
}
|
|
|
|
s.mu.Lock()
|
|
s.ingestionServers[*ingestionServerID] = *state
|
|
s.mu.Unlock()
|
|
|
|
err := stream.Send(&common.AdminMessage{
|
|
MessageType: "ACK",
|
|
AckInfo: &common.AckInfo{
|
|
TaskId: "",
|
|
Success: true,
|
|
Message: "registered successfully",
|
|
},
|
|
})
|
|
if err != nil {
|
|
common.Error("Fail to send ACK message", err)
|
|
return
|
|
}
|
|
|
|
common.Info(fmt.Sprintf("Ingestor %s registered, max_concurrency=%d, supported_types=%v",
|
|
*ingestionServerID, msg.RegisterInfo.MaxConcurrency, msg.RegisterInfo.SupportedDocTypes))
|
|
}
|
|
|
|
func (s *IngestionManager) handleHeartbeat(msg *common.IngestionMessage, ingestorID string, state *IngestorState) {
|
|
if state == nil {
|
|
return
|
|
}
|
|
|
|
state.LastHeartbeat = time.Now().Truncate(time.Second)
|
|
|
|
if msg.HeartbeatInfo != nil {
|
|
|
|
lastUpdateTime := time.Now().Truncate(time.Second)
|
|
s.mu.Lock()
|
|
ingestorState := s.ingestionServers[msg.IngestorId]
|
|
ingestorState.LastHeartbeat = lastUpdateTime
|
|
if ingestorState.Status == "timeout" {
|
|
ingestorState.Status = "active"
|
|
common.Info(fmt.Sprintf("Ingestor %s recovered from timeout, status set to active", msg.IngestorId))
|
|
}
|
|
ingestorState.ProcessID = msg.HeartbeatInfo.ProcessId
|
|
ingestorState.cpuUsage = float64(msg.HeartbeatInfo.CpuUsage)
|
|
ingestorState.vmsUsage = float64(msg.HeartbeatInfo.VmsUsage) / 1024 / 1024 // in MB
|
|
ingestorState.rssUsage = float64(msg.HeartbeatInfo.RssUsage) / 1024 / 1024 // in MB
|
|
|
|
// Delete expired terminal tasks from currentTasks
|
|
for _, taskID := range msg.HeartbeatInfo.DeleteTaskIds {
|
|
delete(s.taskStates, taskID)
|
|
}
|
|
|
|
for _, ingestorTaskState := range msg.HeartbeatInfo.TaskStates {
|
|
localTaskState := s.taskStates[ingestorTaskState.TaskId]
|
|
if localTaskState == nil {
|
|
startTime := time.Unix(0, ingestorTaskState.StartTime)
|
|
localTaskState = &TaskState{
|
|
taskID: ingestorTaskState.TaskId,
|
|
comeFrom: ingestorTaskState.ComeFrom,
|
|
startTime: &startTime,
|
|
}
|
|
}
|
|
localTaskState.estimatedRemainingTime = time.Duration(ingestorTaskState.EstimatedRemainingTimeSeconds)
|
|
localTaskState.lastUpdate = lastUpdateTime
|
|
localTaskState.status = ingestorTaskState.Status
|
|
localTaskState.errorMessage = ingestorTaskState.ErrorMessage
|
|
localTaskState.assignTo = msg.IngestorId
|
|
}
|
|
s.mu.Unlock()
|
|
|
|
common.Debug(fmt.Sprintf("Heartbeat from %s", ingestorID))
|
|
}
|
|
}
|
|
|
|
func (s *IngestionManager) handleTaskResult(msg *common.IngestionMessage, ingestorID string, state *IngestorState) {
|
|
if msg.TaskResult == nil {
|
|
return
|
|
}
|
|
|
|
result := msg.TaskResult
|
|
common.Info(fmt.Sprintf("Task result from %s: task=%s, status=%s, message=%s", ingestorID, result.TaskId, result.Status, result.ErrorMessage))
|
|
|
|
// Signal that a slot may have freed up for pending tasks
|
|
select {
|
|
case s.slotFreed <- struct{}{}:
|
|
default:
|
|
}
|
|
}
|
|
|
|
func (s *IngestionManager) handleTaskProgress(msg *common.IngestionMessage, ingestorID string, state *IngestorState) {
|
|
if msg.TaskProgress == nil {
|
|
return
|
|
}
|
|
|
|
progress := msg.TaskProgress
|
|
common.Info(fmt.Sprintf("Task progress from %s: task=%s, progress=%d%%, detail=%s",
|
|
ingestorID, progress.TaskId, progress.Progress, progress.Info))
|
|
}
|
|
|
|
// SubmitTask is for API Server to call (non-gRPC, for testing only)
|
|
func (s *IngestionManager) SubmitTask(task *common.TaskAssignment) {
|
|
s.taskQueue <- &pendingTask{
|
|
Task: task,
|
|
CreatedAt: time.Now().Truncate(time.Second),
|
|
}
|
|
common.Info(fmt.Sprintf("Task %s submitted to queue", task.TaskId))
|
|
|
|
// Wake up dispatchLoop if it's blocked waiting for a slot
|
|
select {
|
|
case s.slotFreed <- struct{}{}:
|
|
default:
|
|
}
|
|
}
|
|
|
|
// dispatchLoop pulls tasks from the queue and assigns them to available ingestors.
|
|
// Runs in a background goroutine.
|
|
func (s *IngestionManager) dispatchLoop() {
|
|
for {
|
|
select {
|
|
case <-s.ctx.Done():
|
|
return
|
|
case pending := <-s.taskQueue:
|
|
go s.tryAssign(pending.Task)
|
|
}
|
|
}
|
|
}
|
|
|
|
// heartbeatCheckLoop periodically checks all registered ingestors for heartbeat timeout.
|
|
// If an ingestor's LastHeartbeat is older than heartbeatTimeout, its status is set to "timeout".
|
|
func (s *IngestionManager) heartbeatCheckLoop() {
|
|
ticker := time.NewTicker(heartbeatTimeout / 3)
|
|
defer ticker.Stop()
|
|
|
|
for {
|
|
select {
|
|
case <-s.ctx.Done():
|
|
return
|
|
case <-ticker.C:
|
|
s.checkHeartbeats()
|
|
}
|
|
}
|
|
}
|
|
|
|
func (s *IngestionManager) checkHeartbeats() {
|
|
s.mu.Lock()
|
|
defer s.mu.Unlock()
|
|
|
|
now := time.Now().Truncate(time.Second)
|
|
for id, state := range s.ingestionServers {
|
|
if now.Sub(state.LastHeartbeat) > heartbeatTimeout {
|
|
if state.Status != "timeout" {
|
|
state.Status = "timeout"
|
|
common.Info(fmt.Sprintf("Ingestor %s heartbeat timeout, marked as timeout", id))
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
func (s *IngestionManager) SelectIngestorForTask(task *common.TaskAssignment) *IngestorState {
|
|
s.mu.Lock()
|
|
defer s.mu.Unlock()
|
|
|
|
switch task.TaskType {
|
|
case "start_ingestion_task":
|
|
for _, ingestor := range s.ingestionServers {
|
|
if ingestor.Status == "active" {
|
|
s.taskStates[task.TaskId] = &TaskState{
|
|
taskID: task.TaskId,
|
|
status: "DISPATCHED",
|
|
comeFrom: "CLI",
|
|
startTime: nil,
|
|
lastUpdate: time.Now().Truncate(time.Second),
|
|
assignTo: ingestor.ID,
|
|
}
|
|
return ingestor
|
|
}
|
|
}
|
|
case "cancel_ingestion_task":
|
|
taskState := s.taskStates[task.TaskId]
|
|
if taskState != nil {
|
|
switch taskState.status {
|
|
case "COMPLETED":
|
|
return nil
|
|
case "DISPATCHED":
|
|
{
|
|
taskState.status = "CANCELING"
|
|
return s.ingestionServers[taskState.assignTo]
|
|
}
|
|
default:
|
|
return s.ingestionServers[taskState.assignTo]
|
|
}
|
|
}
|
|
|
|
case "shutdown_ingestor":
|
|
return s.ingestionServers[task.AssignedTo]
|
|
}
|
|
|
|
return nil
|
|
}
|
|
|
|
// tryAssign repeatedly tries to find an available ingestor and assign the task.
|
|
// Blocks until either the task is assigned or the context is canceled.
|
|
func (s *IngestionManager) tryAssign(task *common.TaskAssignment) {
|
|
for {
|
|
|
|
target := s.SelectIngestorForTask(task)
|
|
if target != nil {
|
|
task.AssignedTo = target.ID
|
|
s.assignToIngestor(task, target)
|
|
return
|
|
}
|
|
|
|
if task.TaskType == "start_ingestion_task" {
|
|
// Receives a start ingestion task, save and change the states
|
|
s.mu.Lock()
|
|
s.taskStates[task.TaskId] = &TaskState{
|
|
taskID: task.TaskId,
|
|
status: "pending",
|
|
comeFrom: task.ComeFrom,
|
|
lastUpdate: time.Now().Truncate(time.Second),
|
|
startTime: nil,
|
|
}
|
|
s.mu.Unlock()
|
|
} else {
|
|
// shutdown ingestor or cancel task
|
|
common.Info("Task is completed, canceled, or ingestor is shutdown")
|
|
return
|
|
}
|
|
|
|
// No ingestor available, wait for a slot to free up
|
|
select {
|
|
case <-s.ctx.Done():
|
|
return
|
|
case <-s.slotFreed:
|
|
// A slot might be free, retry
|
|
case <-time.After(2 * time.Second):
|
|
// Periodic retry as fallback
|
|
}
|
|
}
|
|
}
|
|
|
|
func (s *IngestionManager) assignToIngestor(task *common.TaskAssignment, state *IngestorState) {
|
|
err := state.Stream.Send(&common.AdminMessage{
|
|
MessageType: "TASK_ASSIGNMENT",
|
|
TaskAssignment: task,
|
|
})
|
|
if err != nil {
|
|
common.Info(fmt.Sprintf("Failed to assign task %s to ingestor %s: %v", task.TaskId, state.ID, err))
|
|
// Re-queue the task
|
|
s.taskQueue <- &pendingTask{Task: task, CreatedAt: time.Now().Truncate(time.Second)}
|
|
return
|
|
}
|
|
common.Info(fmt.Sprintf("Assigned task %s to ingestion_server %s", task.TaskId, state.ID))
|
|
}
|
|
|
|
func (s *IngestionManager) cleanupIngestionServer(ingestorID string) {
|
|
s.mu.Lock()
|
|
defer s.mu.Unlock()
|
|
|
|
if ingestorID == "" {
|
|
// Client disconnected before REGISTER completed — nothing to clean up
|
|
common.Info("Unregistered ingestion server disconnected")
|
|
return
|
|
}
|
|
|
|
if _, exists := s.ingestionServers[ingestorID]; exists {
|
|
delete(s.ingestionServers, ingestorID)
|
|
common.Info(fmt.Sprintf("Ingestor %s cleaned up", ingestorID))
|
|
|
|
// Clean the tasks handled by this ingestor
|
|
var tasksToDelete []string
|
|
for _, taskState := range s.taskStates {
|
|
if taskState.assignTo == ingestorID {
|
|
tasksToDelete = append(tasksToDelete, taskState.taskID)
|
|
}
|
|
}
|
|
for _, taskID := range tasksToDelete {
|
|
delete(s.taskStates, taskID)
|
|
}
|
|
}
|
|
}
|
|
|
|
func (s *IngestionManager) ListIngestors() ([]map[string]interface{}, error) {
|
|
s.mu.Lock()
|
|
defer s.mu.Unlock()
|
|
|
|
var result []map[string]interface{}
|
|
for ingestorID, state := range s.ingestionServers {
|
|
|
|
var taskCount int64
|
|
for _, task := range s.taskStates {
|
|
if task.assignTo == ingestorID {
|
|
taskCount++
|
|
}
|
|
}
|
|
|
|
result = append(result, map[string]interface{}{
|
|
"id": ingestorID,
|
|
"name": state.Info.Name,
|
|
"address": state.Address,
|
|
"last_heartbeat": state.LastHeartbeat,
|
|
"task_count": taskCount,
|
|
"status": state.Status,
|
|
"cpu_usage": state.cpuUsage,
|
|
"rss_usage": state.rssUsage,
|
|
"vms_usage": state.vmsUsage,
|
|
"process_id": state.ProcessID,
|
|
})
|
|
}
|
|
return result, nil
|
|
}
|
|
|
|
func (s *IngestionManager) ListIngestionTasks() ([]map[string]interface{}, error) {
|
|
|
|
var result []map[string]interface{}
|
|
|
|
s.mu.Lock()
|
|
defer s.mu.Unlock()
|
|
for index, taskState := range s.taskStates {
|
|
common.Info(fmt.Sprintf("Task %s: %s", index, taskState.taskID))
|
|
result = append(result, map[string]interface{}{
|
|
"id": taskState.taskID,
|
|
"status": taskState.status,
|
|
"from": taskState.comeFrom,
|
|
"assign_to": taskState.assignTo,
|
|
"last_update": taskState.lastUpdate,
|
|
"start_time": taskState.startTime,
|
|
"ETA": taskState.estimatedRemainingTime,
|
|
"error": taskState.errorMessage,
|
|
})
|
|
}
|
|
|
|
return result, nil
|
|
}
|
|
|
|
// Start starts the admin service
|
|
func (s *IngestionManager) Start(port string) error {
|
|
lis, err := net.Listen("tcp", port)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
s.grpcServer = grpc.NewServer()
|
|
common.RegisterIngestionManagerServer(s.grpcServer, s)
|
|
|
|
return s.grpcServer.Serve(lis)
|
|
}
|
|
|
|
// Stop gracefully shuts down the admin service
|
|
func (s *IngestionManager) Stop() {
|
|
common.Info("Stopping RAGFlow ingestion manager...")
|
|
|
|
// Notify all goroutines to exit
|
|
s.cancel()
|
|
|
|
// Gracefully stop gRPC server (stop accepting new connections, wait for in-flight requests)
|
|
if s.grpcServer != nil {
|
|
s.grpcServer.GracefulStop()
|
|
}
|
|
|
|
// Close the task queue
|
|
s.mu.Lock()
|
|
close(s.taskQueue)
|
|
s.mu.Unlock()
|
|
|
|
common.Info("RAGFlow ingestion manager stopped")
|
|
}
|