mirror of
https://github.com/infiniflow/ragflow.git
synced 2026-06-30 16:01:58 +08:00
Ports the agent canvas subsystem from Python to Go.
## What's included
### Canvas Engine (Phase 0/1)
- State engine, scheduler, variable resolver, Redis checkpoint store,
cancel protocol
- **209 tests** across canvas / component / io packages
### 22 Components (P0–P4)
| Tier | Components |
|---|---|
| P0 T1+T2+T3 | LLM, Agent, ExitLoop, Switch, Categorize, Begin,
Message, Invoke |
| P1 T3 | VariableAggregator, VariableAssigner, StringTransform,
ListOperations, DataOperations |
| P2 T3 | Iteration, IterationItem, Loop, LoopItem |
| P3 T3 | UserFillUp, Fillup |
| P4 T5 | Browser, ExcelProcessor, DocsGenerator |
### DSL v2 Schema (Phase 2.5)
- Typed v2 in-memory model with v1-to-v2 auto-detect converter
- v1 legacy field stripping per plan §2.11.7
### HTTP Endpoints & Bug Fixes (Plans PR1–PR3)
- **DELETE SQL bug fix**: gorm v2 `Where("id = ?", id).Delete(...)`
pattern
- **CreateAgent validation**: title/DSL required, duplicate check, 103
envelope
- **13 new endpoints**: templates, prompts, tags, sessions CRUD,
chat/completions (SSE + non-stream stubs), rerun, test_db_connection,
logs, webhook/logs
- **756 Go unit tests** (745 → 756, +18)
- **17 → 0 Python integration test failures** (test_agents.py +
test_session_management/)
### Tools
21 eino tools: HTTPHelper, search tools, financial/data tools, mandatory
stubs
### Infrastructure
OTel observability, NATS message queue, DeepDoc gRPC client, SSRF
guards, IDOR mitigation
278 lines
8.7 KiB
Go
278 lines
8.7 KiB
Go
//
|
|
// Copyright 2026 The InfiniFlow Authors. All Rights Reserved.
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
// you may not use this file except in compliance with the License.
|
|
// You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
//
|
|
|
|
// Package runtime holds the per-run shared state for canvas components.
|
|
//
|
|
// CanvasState lives here (not in the canvas package) so that the
|
|
// builder-side (canvas) and the implementation-side (component) can
|
|
// both depend on it without forming an import cycle. The canvas
|
|
// package owns DSL types and topology building; the component package
|
|
// owns the registered component implementations; both read/write
|
|
// CanvasState through this package.
|
|
//
|
|
// Concurrency: a single sync.RWMutex guards every map in CanvasState
|
|
// (plan §2.5 — "start simple"). Helper methods (GetVar / SetVar /
|
|
// ReadVars / Snapshot / etc.) lock internally; callers should not
|
|
// acquire OutputsLock unless they have a specific reason to extend a
|
|
// critical section.
|
|
package runtime
|
|
|
|
import (
	"encoding/json"
	"fmt"
	"strconv"
	"strings"
	"sync"
	"sync/atomic"
)
|
|
|
|
// CanvasState is the per-run shared state bag that all components read/write
// through eino's StatePreHandler / StatePostHandler (compose/state.go).
//
// Fields mirror Python agent/canvas.py:43-95 with these mappings:
//   - Outputs    : cpn_id -> param_name -> resolved value (variable source)
//   - Sys        : sys.* namespace (query, user_id, conversation_turns, files)
//   - Env        : env.* namespace (deployment-time constants)
//   - Path       : entry-point sequence (Begin nodes)
//   - History    : conversation history (chat-flow agents)
//   - Retrieval  : aggregate retrieval result (chunks, doc_aggs)
//   - Globals    : cross-canvas-instance globals; also holds the "__item__" and
//     "__index__" entries that back the "item" / "index" variable aliases
//   - CancelFlag : set when cancel signal received; nodes may poll
//   - RunID      : unique per-run identifier (used by RunTracker + CheckPointStore)
//   - TaskID     : task identifier supplied to NewCanvasState alongside RunID;
//     it is only stored here, nothing in this file reads it
//
// The unexported mu is the lock taken by the helper methods (GetVar, SetVar,
// ReadVars, Snapshot, RecordOutput). Because the struct contains a mutex it
// must be shared by pointer and never copied by value.
type CanvasState struct {
	mu         sync.RWMutex
	Outputs    map[string]map[string]any
	Sys        map[string]any
	Env        map[string]any
	Path       []string
	History    []map[string]any
	Retrieval  map[string]any
	Globals    map[string]any
	CancelFlag *atomic.Bool
	RunID      string
	TaskID     string
}
|
|
|
|
// NewCanvasState returns a zero-valued CanvasState with all maps allocated.
|
|
// The atomic CancelFlag is allocated eagerly so nodes can safely poll it
|
|
// even before any cancel signal has been wired.
|
|
func NewCanvasState(runID, taskID string) *CanvasState {
|
|
return &CanvasState{
|
|
Outputs: make(map[string]map[string]any),
|
|
Sys: make(map[string]any),
|
|
Env: make(map[string]any),
|
|
Path: []string{},
|
|
History: []map[string]any{},
|
|
Retrieval: make(map[string]any),
|
|
Globals: make(map[string]any),
|
|
CancelFlag: &atomic.Bool{},
|
|
RunID: runID,
|
|
TaskID: taskID,
|
|
}
|
|
}
|
|
|
|
// GetVar resolves a variable reference to its current value.
|
|
//
|
|
// Supported forms (matches plan §2.5 + agent/canvas.py:168-239):
|
|
//
|
|
// "cpn_id@param" — Outputs[cpn_id][param]
|
|
// "cpn_id@param.path" — dot-path traversal on Outputs[cpn_id][param]
|
|
// "sys.x" — Sys["x"] (also "sys.x.path")
|
|
// "env.x" — Env["x"] (also "env.x.path")
|
|
// "item" — iteration alias (Phase 2; nil if unset)
|
|
// "index" — iteration alias (Phase 2; nil if unset)
|
|
//
|
|
// An unknown cpn_id returns (nil, nil) — mirrors Python's "treat as literal"
|
|
// fallback (canvas.py:494-495).
|
|
func (s *CanvasState) GetVar(ref string) (any, error) {
|
|
if ref == "" {
|
|
return nil, fmt.Errorf("canvas: empty variable reference")
|
|
}
|
|
s.mu.RLock()
|
|
defer s.mu.RUnlock()
|
|
return getVarLocked(s, ref)
|
|
}
|
|
|
|
// SetVar writes Outputs[cpnID][param] = v. Nested keys separated by "." are
|
|
// auto-created (mirrors Python's set_variable_param_value at
|
|
// canvas.py:261-271). The lock is held for the entire walk to keep
|
|
// "walk + assign" atomic under concurrent writers.
|
|
func (s *CanvasState) SetVar(cpnID, param string, v any) {
|
|
s.mu.Lock()
|
|
defer s.mu.Unlock()
|
|
setVarLocked(s.Outputs, cpnID, param, v)
|
|
}
|
|
|
|
// ReadVars resolves a list of {{...}} references against the current state
|
|
// and returns them keyed by the original ref string. Intended for parameter
|
|
// binding: a component declares its input parameter references once, this
|
|
// resolves them in one locked pass.
|
|
//
|
|
// Empty / unresolvable refs map to nil (caller decides on nil-handling).
|
|
// The first error is returned and short-circuits the rest, but partial
|
|
// results are NOT used by callers — discard on err.
|
|
func (s *CanvasState) ReadVars(refs []string) (map[string]any, error) {
|
|
out := make(map[string]any, len(refs))
|
|
s.mu.RLock()
|
|
defer s.mu.RUnlock()
|
|
for _, ref := range refs {
|
|
v, err := getVarLocked(s, ref)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
out[ref] = v
|
|
}
|
|
return out, nil
|
|
}
|
|
|
|
// Snapshot returns a shallow copy of every cpn's outputs map. It is the
|
|
// snapshot that StatePreHandler exposes to component bodies. Shallow is
|
|
// fine: components only re-read primitive values from this snapshot
|
|
// during one execution; a deeper copy would just cost allocations.
|
|
//
|
|
// The lock is held only for the duration of the copy; callers may pass
|
|
// the returned map around freely.
|
|
func (s *CanvasState) Snapshot() map[string]map[string]any {
|
|
s.mu.RLock()
|
|
defer s.mu.RUnlock()
|
|
out := make(map[string]map[string]any, len(s.Outputs))
|
|
for k, v := range s.Outputs {
|
|
cp := make(map[string]any, len(v))
|
|
for kk, vv := range v {
|
|
cp[kk] = vv
|
|
}
|
|
out[k] = cp
|
|
}
|
|
return out
|
|
}
|
|
|
|
// RecordOutput stores payload under Outputs[cpnID][bucket]. Used by the
|
|
// StatePostHandler to persist a node's result so downstream nodes can
|
|
// resolve {{cpnID@bucket.x}} references against it.
|
|
func (s *CanvasState) RecordOutput(cpnID, bucket string, payload any) {
|
|
if cpnID == "" {
|
|
return
|
|
}
|
|
s.mu.Lock()
|
|
defer s.mu.Unlock()
|
|
b, ok := s.Outputs[cpnID]
|
|
if !ok {
|
|
b = make(map[string]any)
|
|
s.Outputs[cpnID] = b
|
|
}
|
|
b[bucket] = payload
|
|
}
|
|
|
|
// getVarLocked is the lock-free inner GetVar. Caller must hold s.mu (read or
|
|
// write) for the entire call.
|
|
func getVarLocked(s *CanvasState, ref string) (any, error) {
|
|
switch {
|
|
case ref == "item":
|
|
return s.Globals["__item__"], nil
|
|
case ref == "index":
|
|
return s.Globals["__index__"], nil
|
|
case strings.HasPrefix(ref, "sys."):
|
|
return dotTraverse(s.Sys, strings.TrimPrefix(ref, "sys.")), nil
|
|
case strings.HasPrefix(ref, "env."):
|
|
return dotTraverse(s.Env, strings.TrimPrefix(ref, "env.")), nil
|
|
case strings.Contains(ref, "@"):
|
|
idx := strings.Index(ref, "@")
|
|
cpnID, tail := ref[:idx], ref[idx+1:]
|
|
outputs, ok := s.Outputs[cpnID]
|
|
if !ok {
|
|
return nil, nil
|
|
}
|
|
return dotTraverse(outputs, tail), nil
|
|
default:
|
|
return nil, fmt.Errorf("canvas: invalid variable reference %q", ref)
|
|
}
|
|
}
|
|
|
|
// setVarLocked performs the SetVar write without taking any lock; the caller
// must hold the state's write lock.
//
// param is split on "." into path segments. The component's parameter map is
// created if missing, every segment but the last is descended into (a segment
// that is absent or not a map[string]any is replaced by a fresh map), and the
// last segment receives v.
func setVarLocked(outputs map[string]map[string]any, cpnID, param string, v any) {
	node, exists := outputs[cpnID]
	if !exists {
		node = make(map[string]any)
		outputs[cpnID] = node
	}

	// strings.Split never returns an empty slice here, so there is always a
	// final segment to assign to.
	segments := strings.Split(param, ".")
	leaf := len(segments) - 1

	for _, seg := range segments[:leaf] {
		child, isMap := node[seg].(map[string]any)
		if !isMap {
			child = make(map[string]any)
			node[seg] = child
		}
		node = child
	}
	node[segments[leaf]] = v
}
|
|
|
|
// dotTraverse walks a dot-path inside a generic Go value. The path is split
|
|
// on "." and dispatched by intermediate type, mirroring Python's
|
|
// get_variable_param_value precedence (canvas.py:212-239):
|
|
//
|
|
// 1. nil → return nil
|
|
// 2. string → try json.Unmarshal, then continue on the parsed value
|
|
// 3. map[string]any → index by key
|
|
// 4. []any → index by int (cast failure → nil)
|
|
// 5. else → return nil
|
|
//
|
|
// The empty path returns the root value as-is.
|
|
func dotTraverse(root any, path string) any {
|
|
if path == "" {
|
|
return root
|
|
}
|
|
parts := strings.Split(path, ".")
|
|
cur := root
|
|
for _, p := range parts {
|
|
cur = step(cur, p)
|
|
if cur == nil {
|
|
return nil
|
|
}
|
|
}
|
|
return cur
|
|
}
|
|
|
|
// step applies a single path segment to cur and returns the selected child,
// or nil when the segment cannot be applied.
//
// Dispatch is by the dynamic type of cur:
//   - nil: nil.
//   - map[string]any: the value stored under key (nil when absent).
//   - string: the string may be a JSON-encoded object or list; if it decodes,
//     the segment is applied to the decoded value, otherwise the result is nil.
//   - []any: key must be a base-10 integer (surrounding whitespace allowed)
//     that is a valid index; non-numeric keys, keys with trailing characters
//     such as "1abc" or "1.5", negative indexes and indexes past the end all
//     give nil.
//   - any other type: nil.
func step(cur any, key string) any {
	switch v := cur.(type) {
	case nil:
		return nil
	case map[string]any:
		return v[key]
	case string:
		// Strings can be JSON-encoded dicts/lists; decode and retry.
		var parsed any
		if err := json.Unmarshal([]byte(v), &parsed); err != nil {
			return nil
		}
		return step(parsed, key)
	case []any:
		// strconv.Atoi requires the whole key to be a number. fmt.Sscanf with
		// "%d" would stop at the first non-digit and silently accept "1abc".
		idx, err := strconv.Atoi(strings.TrimSpace(key))
		if err != nil || idx < 0 || idx >= len(v) {
			return nil
		}
		return v[idx]
	default:
		return nil
	}
}
|