mirror of
https://github.com/infiniflow/ragflow.git
synced 2026-06-29 15:31:05 +08:00
### What problem does this PR solve? Http API based on onnx model. pdf_parser.py to golang ### Type of change - [x] Refactoring
239 lines
6.6 KiB
Go
239 lines
6.6 KiB
Go
package parser
|
||
|
||
import (
|
||
"context"
|
||
"image"
|
||
"testing"
|
||
)
|
||
|
||
// mockRotationDoc implements DocAnalyzer with deterministic OCR results per angle.
|
||
// The mock tracks the call sequence: evaluateTableOrientation tests angles in
|
||
// order 0°, 90°, 180°, 270°. Each call to OCRDetect increments an internal
|
||
// counter and returns data for the corresponding angle.
|
||
type mockRotationDoc struct {
|
||
// angle → {regions count, average confidence, error}
|
||
angles map[int]struct {
|
||
regions int
|
||
avgConf float64
|
||
err error
|
||
}
|
||
callSeq int // incremented per OCRDetect call, selects the angle's data
|
||
}
|
||
|
||
var rotationOrder = []int{0, 90, 180, 270}
|
||
|
||
func (m *mockRotationDoc) DLA(_ context.Context, _ image.Image) ([]DLARegion, error) { return nil, nil }
|
||
func (m *mockRotationDoc) TSR(_ context.Context, _ image.Image) ([]TSRCell, error) { return nil, nil }
|
||
func (m *mockRotationDoc) OCR(_ image.Image) (string, error) { return "", nil }
|
||
func (m *mockRotationDoc) Health() bool { return true }
|
||
func (m *mockRotationDoc) ModelType() ModelType { return ModelSaas }
|
||
|
||
func (m *mockRotationDoc) currentAngle() int {
|
||
idx := m.callSeq % len(rotationOrder)
|
||
return rotationOrder[idx]
|
||
}
|
||
|
||
func (m *mockRotationDoc) OCRDetect(_ context.Context, img image.Image) ([]OCRBox, error) {
|
||
defer func() { m.callSeq++ }()
|
||
angle := m.currentAngle()
|
||
cfg, ok := m.angles[angle]
|
||
if !ok {
|
||
cfg = m.angles[0] // fallback to 0° config
|
||
}
|
||
if cfg.err != nil {
|
||
return nil, cfg.err
|
||
}
|
||
if cfg.regions == 0 {
|
||
return nil, nil
|
||
}
|
||
w, h := img.Bounds().Dx(), img.Bounds().Dy()
|
||
boxes := make([]OCRBox, cfg.regions)
|
||
step := w / (cfg.regions + 1)
|
||
for i := 0; i < cfg.regions; i++ {
|
||
x := step * (i + 1)
|
||
boxes[i] = OCRBox{
|
||
X0: float64(x), Y0: float64(h / 4),
|
||
X1: float64(x + 20), Y1: float64(h / 4),
|
||
X2: float64(x + 20), Y2: float64(h * 3 / 4),
|
||
X3: float64(x), Y3: float64(h * 3 / 4),
|
||
}
|
||
}
|
||
return boxes, nil
|
||
}
|
||
|
||
func (m *mockRotationDoc) OCRRecognizeBatch(_ context.Context, cropped []image.Image) ([][]OCRText, []error) {
|
||
results := make([][]OCRText, len(cropped))
|
||
errs := make([]error, len(cropped))
|
||
for i, img := range cropped {
|
||
results[i], errs[i] = m.OCRRecognize(context.Background(), img)
|
||
}
|
||
return results, errs
|
||
}
|
||
|
||
func (m *mockRotationDoc) OCRRecognize(_ context.Context, _ image.Image) ([]OCRText, error) {
|
||
angle := rotationOrder[(m.callSeq-1)%len(rotationOrder)] // use angle from last Detect call
|
||
cfg, ok := m.angles[angle]
|
||
if !ok {
|
||
cfg = m.angles[0]
|
||
}
|
||
if cfg.err != nil {
|
||
return nil, cfg.err
|
||
}
|
||
if cfg.regions == 0 {
|
||
return nil, nil
|
||
}
|
||
texts := make([]OCRText, cfg.regions)
|
||
for i := 0; i < cfg.regions; i++ {
|
||
texts[i] = OCRText{Text: "X", Confidence: cfg.avgConf}
|
||
}
|
||
return texts, nil
|
||
}
|
||
|
||
func makeTestTableImage() image.Image {
|
||
return image.NewRGBA(image.Rect(0, 0, 200, 100))
|
||
}
|
||
|
||
func TestEvaluateTableOrientation(t *testing.T) {
|
||
t.Run("normal table 0° wins", func(t *testing.T) {
|
||
doc := &mockRotationDoc{
|
||
angles: map[int]struct {
|
||
regions int
|
||
avgConf float64
|
||
err error
|
||
}{
|
||
0: {regions: 10, avgConf: 0.9},
|
||
},
|
||
}
|
||
angle, _, scores := evaluateTableOrientation(context.Background(), makeTestTableImage(), doc)
|
||
if angle != 0 {
|
||
t.Errorf("expected 0°, got %d° (scores: %v)", angle, scores)
|
||
}
|
||
})
|
||
|
||
t.Run("90° rotated table wins", func(t *testing.T) {
|
||
doc := &mockRotationDoc{
|
||
angles: map[int]struct {
|
||
regions int
|
||
avgConf float64
|
||
err error
|
||
}{
|
||
0: {regions: 2, avgConf: 0.2},
|
||
90: {regions: 10, avgConf: 0.9},
|
||
180: {regions: 2, avgConf: 0.2},
|
||
270: {regions: 2, avgConf: 0.2},
|
||
},
|
||
}
|
||
angle, _, scores := evaluateTableOrientation(context.Background(), makeTestTableImage(), doc)
|
||
if angle != 90 {
|
||
t.Errorf("expected 90°, got %d° (scores: %v)", angle, scores)
|
||
}
|
||
})
|
||
|
||
t.Run("180° rotated table wins", func(t *testing.T) {
|
||
doc := &mockRotationDoc{
|
||
angles: map[int]struct {
|
||
regions int
|
||
avgConf float64
|
||
err error
|
||
}{
|
||
0: {regions: 1, avgConf: 0.1},
|
||
90: {regions: 1, avgConf: 0.1},
|
||
180: {regions: 8, avgConf: 0.85},
|
||
270: {regions: 1, avgConf: 0.1},
|
||
},
|
||
}
|
||
angle, _, scores := evaluateTableOrientation(context.Background(), makeTestTableImage(), doc)
|
||
if angle != 180 {
|
||
t.Errorf("expected 180°, got %d° (scores: %v)", angle, scores)
|
||
}
|
||
})
|
||
|
||
t.Run("270° rotated table wins", func(t *testing.T) {
|
||
doc := &mockRotationDoc{
|
||
angles: map[int]struct {
|
||
regions int
|
||
avgConf float64
|
||
err error
|
||
}{
|
||
0: {regions: 1, avgConf: 0.1},
|
||
90: {regions: 1, avgConf: 0.1},
|
||
180: {regions: 1, avgConf: 0.1},
|
||
270: {regions: 9, avgConf: 0.88},
|
||
},
|
||
}
|
||
angle, _, scores := evaluateTableOrientation(context.Background(), makeTestTableImage(), doc)
|
||
if angle != 270 {
|
||
t.Errorf("expected 270°, got %d° (scores: %v)", angle, scores)
|
||
}
|
||
})
|
||
|
||
t.Run("threshold protection — 0° keeps when diff too small", func(t *testing.T) {
|
||
// Region-count scoring: 8 vs 9 is too close (< 1.4×) → 0° wins.
|
||
doc := &mockRotationDoc{
|
||
angles: map[int]struct {
|
||
regions int
|
||
avgConf float64
|
||
err error
|
||
}{
|
||
0: {regions: 8},
|
||
90: {regions: 9},
|
||
},
|
||
}
|
||
angle, _, _ := evaluateTableOrientation(context.Background(), makeTestTableImage(), doc)
|
||
if angle != 0 {
|
||
t.Errorf("expected 0° (threshold protection), got %d°", angle)
|
||
}
|
||
})
|
||
|
||
t.Run("threshold pass — 90° wins when region count is clearly higher", func(t *testing.T) {
|
||
// 0° has few regions AND 90° has ≥1.4× more → 90° wins.
|
||
doc := &mockRotationDoc{
|
||
angles: map[int]struct {
|
||
regions int
|
||
avgConf float64
|
||
err error
|
||
}{
|
||
0: {regions: 4},
|
||
90: {regions: 10},
|
||
},
|
||
}
|
||
angle, _, _ := evaluateTableOrientation(context.Background(), makeTestTableImage(), doc)
|
||
if angle != 90 {
|
||
t.Errorf("expected 90° (threshold passed), got %d°", angle)
|
||
}
|
||
})
|
||
|
||
t.Run("all angles fail OCR → fallback 0°", func(t *testing.T) {
|
||
doc := &mockRotationDoc{
|
||
angles: map[int]struct {
|
||
regions int
|
||
avgConf float64
|
||
err error
|
||
}{
|
||
0: {err: errMockOCR},
|
||
90: {err: errMockOCR},
|
||
180: {err: errMockOCR},
|
||
270: {err: errMockOCR},
|
||
},
|
||
}
|
||
angle, img, scores := evaluateTableOrientation(context.Background(), makeTestTableImage(), doc)
|
||
if angle != 0 {
|
||
t.Errorf("expected 0° fallback, got %d°", angle)
|
||
}
|
||
if img == nil {
|
||
t.Error("expected non-nil fallback image")
|
||
}
|
||
for _, s := range scores {
|
||
if s != 0 {
|
||
t.Error("all scores should be 0 on OCR failure")
|
||
}
|
||
}
|
||
})
|
||
}
|
||
|
||
var errMockOCR = &mockError{"mock OCR failure"}
|
||
|
||
type mockError struct{ msg string }
|
||
|
||
func (e *mockError) Error() string { return e.msg }
|