mirror of
https://github.com/infiniflow/ragflow.git
synced 2026-06-29 23:41:12 +08:00
## Summary
This PR re-enables the Go test steps in CI that were previously
commented out, and fixes all compilation errors that have accumulated in
`internal/entity/models/` since the `ListModels` return type was changed
from `[]string` to `[]ListModelResponse`.
## Changes
### CI (`.github/workflows/tests.yml`)
- Re-enable **Prepare test resources** step (clones resource repo with
WordNet data)
- Re-enable **Test Go packages** step (runs `go test ./internal/...`)
- Fix resource path race condition by using
`/tmp/resource-${GITHUB_RUN_ID}` instead of `/tmp/resource`
- Exclude `/cli` package from Go tests (contains `main` redeclarations)
### Test fixes (16 model provider test files)
All errors were caused by the upstream change from `[]string` to
`[]ListModelResponse` in the `ListModels` interface:
- Add `joinModelNames` test helper to extract `.Name` from
`[]ListModelResponse` slices
- `strings.Join(models, ",")` → `joinModelNames(models, ",")` (11 files)
- `ids[i] != "..."` → `ids[i].Name != "..."` (cometapi, mistral)
- `got[i] != want[i]` → `got[i].Name != want[i]` (bedrock)
- `[]string` return types → `[]ListModelResponse` (google)
### Pre-existing bugs in model_test.go
Bugs introduced by the upstream `entity/` → `entity/models/` directory
rename:
- Add missing `pm := GetProviderManager()` calls in 3 test functions
- Fix `InitProviderManager` signature (`_, err :=` → `err :=`)
- Fix `MaxTokens` `*int` dereference (6 comparisons)
- Fix `readProviderConfig` relative path (3 levels up instead of 2)
### model.go
- Add `findRepoRoot()` to make `conf/all_models.json` resolution work
from any CWD, fixing `TestSiliconFlowProviderConfigLoadsLatestProModels`
### Test validation
```bash
go build ./internal/... # ✅
go test ./internal/entity/models/... -count=1 # ✅ all pass
```
🤖 Generated with [Claude Code](https://claude.com/claude-code)
Co-authored-by: Claude Opus 4.8 <noreply@anthropic.com>
663 lines
21 KiB
Go
663 lines
21 KiB
Go
package models
|
|
|
|
import (
|
|
"encoding/json"
|
|
"io"
|
|
"net/http"
|
|
"net/http/httptest"
|
|
"strings"
|
|
"testing"
|
|
)
|
|
|
|
// newGPUStackServer starts an httptest server that checks the request path
// and the "Bearer test-key" Authorization header before delegating to handler.
// POST requests must also carry a Content-Type starting with application/json
// and a body that json.Unmarshal can decode into a map; the decoded map is
// passed to handler. Any other method invokes handler with a nil body. A
// failed check is reported via t.Errorf and handler is not called.
func newGPUStackServer(t *testing.T, expectedPath string, handler func(t *testing.T, body map[string]interface{}, w http.ResponseWriter)) *httptest.Server {
	t.Helper()

	serve := func(w http.ResponseWriter, r *http.Request) {
		if path := r.URL.Path; path != expectedPath {
			t.Errorf("expected path=%s, got %s", expectedPath, path)
			return
		}
		if auth := r.Header.Get("Authorization"); auth != "Bearer test-key" {
			t.Errorf("expected Authorization=Bearer test-key, got %q", auth)
			return
		}

		// Only POST requests carry a body that needs decoding.
		if r.Method != http.MethodPost {
			handler(t, nil, w)
			return
		}

		if contentType := r.Header.Get("Content-Type"); !strings.HasPrefix(contentType, "application/json") {
			t.Errorf("expected Content-Type to start with application/json, got %q", contentType)
			return
		}
		payload, readErr := io.ReadAll(r.Body)
		if readErr != nil {
			t.Errorf("read body: %v", readErr)
			return
		}
		var decoded map[string]interface{}
		if decodeErr := json.Unmarshal(payload, &decoded); decodeErr != nil {
			t.Errorf("unmarshal: %v\nraw=%s", decodeErr, string(payload))
			return
		}
		handler(t, decoded, w)
	}

	return httptest.NewServer(http.HandlerFunc(serve))
}
|
|
|
|
// newGPUStackSSEServer starts an httptest server that answers a valid
// streaming request with ssePayload as a text/event-stream body. A request is
// valid when it is a POST to expectedPath carrying "Bearer test-key"
// authorization, a Content-Type starting with application/json, and
// Accept: text/event-stream. The first failed check is reported via t.Errorf
// and no payload is written.
func newGPUStackSSEServer(t *testing.T, expectedPath, ssePayload string) *httptest.Server {
	t.Helper()

	stream := func(w http.ResponseWriter, r *http.Request) {
		headers := r.Header
		auth := headers.Get("Authorization")
		contentType := headers.Get("Content-Type")
		accept := headers.Get("Accept")

		// Checks run in a fixed order; only the first failure is reported.
		switch {
		case r.Method != http.MethodPost:
			t.Errorf("expected POST, got %s", r.Method)
			return
		case r.URL.Path != expectedPath:
			t.Errorf("expected path=%s, got %s", expectedPath, r.URL.Path)
			return
		case auth != "Bearer test-key":
			t.Errorf("expected Authorization=Bearer test-key, got %q", auth)
			return
		case !strings.HasPrefix(contentType, "application/json"):
			t.Errorf("expected Content-Type to start with application/json, got %q", contentType)
			return
		case accept != "text/event-stream":
			t.Errorf("expected Accept=text/event-stream, got %q", accept)
			return
		}

		w.Header().Set("Content-Type", "text/event-stream")
		_, _ = io.WriteString(w, ssePayload)
	}

	return httptest.NewServer(http.HandlerFunc(stream))
}
|
|
|
|
func newGPUStackForTest(baseURL string) *GPUStackModel {
|
|
return NewGPUStackModel(
|
|
map[string]string{"default": baseURL},
|
|
URLSuffix{Chat: "v1/chat/completions", Models: "v1/models", Embedding: "v1-openai/embeddings"},
|
|
)
|
|
}
|
|
|
|
// gpustackEmbeddingsPath is the request path the embedding tests tell the
// test server to expect; it is the Embedding suffix configured in
// newGPUStackForTest with a leading slash.
const gpustackEmbeddingsPath = "/v1-openai/embeddings"
|
|
|
|
func TestGPUStackName(t *testing.T) {
|
|
if got := newGPUStackForTest("http://unused").Name(); got != "gpustack" {
|
|
t.Errorf("Name()=%q, want %q", got, "gpustack")
|
|
}
|
|
}
|
|
|
|
func TestGPUStackFactory(t *testing.T) {
|
|
driver, err := NewModelFactory().CreateModelDriver("GPUStack", map[string]string{"default": "http://unused"}, URLSuffix{})
|
|
if err != nil {
|
|
t.Fatalf("CreateModelDriver: %v", err)
|
|
}
|
|
if _, ok := driver.(*GPUStackModel); !ok {
|
|
t.Fatalf("driver type=%T, want *GPUStackModel", driver)
|
|
}
|
|
}
|
|
|
|
func TestGPUStackChatHappyPath(t *testing.T) {
|
|
srv := newGPUStackServer(t, "/v1/chat/completions", func(t *testing.T, body map[string]interface{}, w http.ResponseWriter) {
|
|
if body["model"] != "qwen3-8b" {
|
|
t.Errorf("model=%v", body["model"])
|
|
}
|
|
if body["stream"] != false {
|
|
t.Errorf("stream=%v want false", body["stream"])
|
|
}
|
|
_ = json.NewEncoder(w).Encode(map[string]interface{}{
|
|
"choices": []map[string]interface{}{{
|
|
"message": map[string]interface{}{"content": "pong"},
|
|
}},
|
|
})
|
|
})
|
|
defer srv.Close()
|
|
|
|
apiKey := "test-key"
|
|
resp, err := newGPUStackForTest(srv.URL).ChatWithMessages(
|
|
"qwen3-8b",
|
|
[]Message{{Role: "user", Content: "ping"}},
|
|
&APIConfig{ApiKey: &apiKey}, nil,
|
|
)
|
|
if err != nil {
|
|
t.Fatalf("Chat: %v", err)
|
|
}
|
|
if resp.Answer == nil || *resp.Answer != "pong" {
|
|
t.Errorf("Answer=%v", resp.Answer)
|
|
}
|
|
if resp.ReasonContent == nil || *resp.ReasonContent != "" {
|
|
t.Errorf("ReasonContent=%v want empty", resp.ReasonContent)
|
|
}
|
|
}
|
|
|
|
func TestGPUStackChatExtractsReasoningContent(t *testing.T) {
|
|
srv := newGPUStackServer(t, "/v1/chat/completions", func(t *testing.T, body map[string]interface{}, w http.ResponseWriter) {
|
|
_ = json.NewEncoder(w).Encode(map[string]interface{}{
|
|
"choices": []map[string]interface{}{{
|
|
"message": map[string]interface{}{
|
|
"role": "assistant",
|
|
"content": "12",
|
|
"reasoning_content": "0.15 * 80 = 12",
|
|
},
|
|
}},
|
|
})
|
|
})
|
|
defer srv.Close()
|
|
|
|
apiKey := "test-key"
|
|
resp, err := newGPUStackForTest(srv.URL).ChatWithMessages(
|
|
"qwen3-32b",
|
|
[]Message{{Role: "user", Content: "15% of 80?"}},
|
|
&APIConfig{ApiKey: &apiKey}, nil,
|
|
)
|
|
if err != nil {
|
|
t.Fatalf("Chat: %v", err)
|
|
}
|
|
if *resp.Answer != "12" {
|
|
t.Errorf("Answer=%q", *resp.Answer)
|
|
}
|
|
if *resp.ReasonContent != "0.15 * 80 = 12" {
|
|
t.Errorf("ReasonContent=%q", *resp.ReasonContent)
|
|
}
|
|
}
|
|
|
|
func TestGPUStackChatForwardsDocumentedFields(t *testing.T) {
|
|
srv := newGPUStackServer(t, "/v1/chat/completions", func(t *testing.T, body map[string]interface{}, w http.ResponseWriter) {
|
|
for _, k := range []string{"model", "messages", "stream", "max_tokens", "temperature", "top_p", "stop"} {
|
|
if _, present := body[k]; !present {
|
|
t.Errorf("documented field %q missing from request body", k)
|
|
}
|
|
}
|
|
_ = json.NewEncoder(w).Encode(map[string]interface{}{
|
|
"choices": []map[string]interface{}{{
|
|
"message": map[string]interface{}{"content": "ok"},
|
|
}},
|
|
})
|
|
})
|
|
defer srv.Close()
|
|
|
|
apiKey := "test-key"
|
|
mt := 64
|
|
temp := 0.5
|
|
topP := 0.95
|
|
stop := []string{"END"}
|
|
_, err := newGPUStackForTest(srv.URL).ChatWithMessages(
|
|
"qwen3-8b",
|
|
[]Message{{Role: "user", Content: "x"}},
|
|
&APIConfig{ApiKey: &apiKey},
|
|
&ChatConfig{MaxTokens: &mt, Temperature: &temp, TopP: &topP, Stop: &stop},
|
|
)
|
|
if err != nil {
|
|
t.Fatalf("Chat: %v", err)
|
|
}
|
|
}
|
|
|
|
func TestGPUStackChatAllowsEmptyAPIKey(t *testing.T) {
|
|
_, err := newGPUStackForTest("http://unused").ChatWithMessages(
|
|
"qwen3-8b",
|
|
[]Message{{Role: "user", Content: "x"}},
|
|
&APIConfig{}, nil,
|
|
)
|
|
if err == nil || strings.Contains(err.Error(), "api key is required") {
|
|
t.Errorf("self-hosted model should not require api key, got %v", err)
|
|
}
|
|
}
|
|
|
|
func TestGPUStackChatRequiresModelName(t *testing.T) {
|
|
apiKey := "test-key"
|
|
_, err := newGPUStackForTest("http://unused").ChatWithMessages(
|
|
"",
|
|
[]Message{{Role: "user", Content: "x"}},
|
|
&APIConfig{ApiKey: &apiKey}, nil,
|
|
)
|
|
if err == nil || !strings.Contains(err.Error(), "model name is required") {
|
|
t.Errorf("expected model-name error, got %v", err)
|
|
}
|
|
}
|
|
|
|
func TestGPUStackChatRequiresMessages(t *testing.T) {
|
|
apiKey := "test-key"
|
|
_, err := newGPUStackForTest("http://unused").ChatWithMessages(
|
|
"qwen3-8b", nil, &APIConfig{ApiKey: &apiKey}, nil,
|
|
)
|
|
if err == nil || !strings.Contains(err.Error(), "messages is empty") {
|
|
t.Errorf("expected messages-empty error, got %v", err)
|
|
}
|
|
}
|
|
|
|
func TestGPUStackChatRejectsHTTPError(t *testing.T) {
|
|
srv := newGPUStackServer(t, "/v1/chat/completions", func(t *testing.T, body map[string]interface{}, w http.ResponseWriter) {
|
|
w.WriteHeader(http.StatusUnauthorized)
|
|
_, _ = w.Write([]byte(`{"error":"unauthorized"}`))
|
|
})
|
|
defer srv.Close()
|
|
|
|
apiKey := "test-key"
|
|
_, err := newGPUStackForTest(srv.URL).ChatWithMessages(
|
|
"qwen3-8b",
|
|
[]Message{{Role: "user", Content: "x"}},
|
|
&APIConfig{ApiKey: &apiKey}, nil,
|
|
)
|
|
if err == nil || !strings.Contains(err.Error(), "401") {
|
|
t.Errorf("expected 401 propagated, got %v", err)
|
|
}
|
|
}
|
|
|
|
func TestGPUStackChatRequiresBaseURL(t *testing.T) {
|
|
model := NewGPUStackModel(map[string]string{}, URLSuffix{Chat: "v1/chat/completions"})
|
|
apiKey := "test-key"
|
|
_, err := model.ChatWithMessages(
|
|
"qwen3-8b",
|
|
[]Message{{Role: "user", Content: "x"}},
|
|
&APIConfig{ApiKey: &apiKey}, nil,
|
|
)
|
|
if err == nil || !strings.Contains(err.Error(), "no base URL configured") {
|
|
t.Errorf("expected base-URL error, got %v", err)
|
|
}
|
|
}
|
|
|
|
func TestGPUStackStreamHappyPath(t *testing.T) {
|
|
srv := newGPUStackSSEServer(t, "/v1/chat/completions",
|
|
`data: {"choices":[{"index":0,"delta":{"role":"assistant"}}]}`+"\n"+
|
|
`data: {"choices":[{"index":0,"delta":{"content":"Hello"}}]}`+"\n"+
|
|
`data: {"choices":[{"index":0,"delta":{"content":" world"},"finish_reason":"stop"}]}`+"\n"+
|
|
`data: [DONE]`+"\n",
|
|
)
|
|
defer srv.Close()
|
|
|
|
apiKey := "test-key"
|
|
var chunks []string
|
|
var sawDone bool
|
|
err := newGPUStackForTest(srv.URL).ChatStreamlyWithSender(
|
|
"qwen3-8b",
|
|
[]Message{{Role: "user", Content: "hi"}},
|
|
&APIConfig{ApiKey: &apiKey}, nil,
|
|
func(c *string, _ *string) error {
|
|
if c == nil {
|
|
return nil
|
|
}
|
|
if *c == "[DONE]" {
|
|
sawDone = true
|
|
return nil
|
|
}
|
|
chunks = append(chunks, *c)
|
|
return nil
|
|
},
|
|
)
|
|
if err != nil {
|
|
t.Fatalf("stream: %v", err)
|
|
}
|
|
if strings.Join(chunks, "") != "Hello world" {
|
|
t.Errorf("content=%v", chunks)
|
|
}
|
|
if !sawDone {
|
|
t.Error("expected [DONE] sentinel")
|
|
}
|
|
}
|
|
|
|
func TestGPUStackStreamExtractsReasoningContent(t *testing.T) {
|
|
srv := newGPUStackSSEServer(t, "/v1/chat/completions",
|
|
`data: {"choices":[{"index":0,"delta":{"role":"assistant"}}]}`+"\n"+
|
|
`data: {"choices":[{"index":0,"delta":{"reasoning_content":"think "}}]}`+"\n"+
|
|
`data: {"choices":[{"index":0,"delta":{"content":"answer"},"finish_reason":"stop"}]}`+"\n"+
|
|
`data: [DONE]`+"\n",
|
|
)
|
|
defer srv.Close()
|
|
|
|
apiKey := "test-key"
|
|
var content, reasoning []string
|
|
err := newGPUStackForTest(srv.URL).ChatStreamlyWithSender(
|
|
"qwen3-32b",
|
|
[]Message{{Role: "user", Content: "x"}},
|
|
&APIConfig{ApiKey: &apiKey}, nil,
|
|
func(c *string, r *string) error {
|
|
if r != nil && *r != "" {
|
|
reasoning = append(reasoning, *r)
|
|
}
|
|
if c != nil && *c != "" && *c != "[DONE]" {
|
|
content = append(content, *c)
|
|
}
|
|
return nil
|
|
},
|
|
)
|
|
if err != nil {
|
|
t.Fatalf("stream: %v", err)
|
|
}
|
|
if strings.Join(reasoning, "") != "think " {
|
|
t.Errorf("reasoning=%q", strings.Join(reasoning, ""))
|
|
}
|
|
if strings.Join(content, "") != "answer" {
|
|
t.Errorf("content=%q", strings.Join(content, ""))
|
|
}
|
|
}
|
|
|
|
func TestGPUStackStreamRejectsExplicitFalse(t *testing.T) {
|
|
apiKey := "test-key"
|
|
stream := false
|
|
err := newGPUStackForTest("http://unused").ChatStreamlyWithSender(
|
|
"qwen3-8b",
|
|
[]Message{{Role: "user", Content: "x"}},
|
|
&APIConfig{ApiKey: &apiKey},
|
|
&ChatConfig{Stream: &stream},
|
|
func(*string, *string) error { return nil },
|
|
)
|
|
if err == nil || !strings.Contains(err.Error(), "stream must be true") {
|
|
t.Errorf("expected stream-true guard, got %v", err)
|
|
}
|
|
}
|
|
|
|
func TestGPUStackStreamRequiresSender(t *testing.T) {
|
|
apiKey := "test-key"
|
|
err := newGPUStackForTest("http://unused").ChatStreamlyWithSender(
|
|
"qwen3-8b",
|
|
[]Message{{Role: "user", Content: "x"}},
|
|
&APIConfig{ApiKey: &apiKey}, nil, nil,
|
|
)
|
|
if err == nil || !strings.Contains(err.Error(), "sender is required") {
|
|
t.Errorf("expected sender-required error, got %v", err)
|
|
}
|
|
}
|
|
|
|
func TestGPUStackStreamFailsWithoutTerminal(t *testing.T) {
|
|
srv := newGPUStackSSEServer(t, "/v1/chat/completions",
|
|
`data: {"choices":[{"delta":{"content":"half"}}]}`+"\n",
|
|
)
|
|
defer srv.Close()
|
|
|
|
apiKey := "test-key"
|
|
err := newGPUStackForTest(srv.URL).ChatStreamlyWithSender(
|
|
"qwen3-8b",
|
|
[]Message{{Role: "user", Content: "x"}},
|
|
&APIConfig{ApiKey: &apiKey}, nil,
|
|
func(*string, *string) error { return nil },
|
|
)
|
|
if err == nil || !strings.Contains(err.Error(), "stream ended before") {
|
|
t.Errorf("expected truncation error, got %v", err)
|
|
}
|
|
}
|
|
|
|
func TestGPUStackStreamRejectsMalformedFrame(t *testing.T) {
|
|
srv := newGPUStackSSEServer(t, "/v1/chat/completions",
|
|
`data: {"choices":[{"delta":{"content":"ok"}}]}`+"\n"+
|
|
`data: {this is not valid json}`+"\n",
|
|
)
|
|
defer srv.Close()
|
|
|
|
apiKey := "test-key"
|
|
err := newGPUStackForTest(srv.URL).ChatStreamlyWithSender(
|
|
"qwen3-8b",
|
|
[]Message{{Role: "user", Content: "x"}},
|
|
&APIConfig{ApiKey: &apiKey}, nil,
|
|
func(*string, *string) error { return nil },
|
|
)
|
|
if err == nil || !strings.Contains(err.Error(), "invalid SSE event") {
|
|
t.Errorf("expected invalid-SSE error, got %v", err)
|
|
}
|
|
}
|
|
|
|
func TestGPUStackStreamSurfacesUpstreamError(t *testing.T) {
|
|
srv := newGPUStackSSEServer(t, "/v1/chat/completions",
|
|
`data: {"choices":[{"delta":{"content":"partial "}}]}`+"\n"+
|
|
`data: {"error":{"message":"oom","type":"runtime_error"}}`+"\n",
|
|
)
|
|
defer srv.Close()
|
|
|
|
apiKey := "test-key"
|
|
err := newGPUStackForTest(srv.URL).ChatStreamlyWithSender(
|
|
"qwen3-8b",
|
|
[]Message{{Role: "user", Content: "x"}},
|
|
&APIConfig{ApiKey: &apiKey}, nil,
|
|
func(*string, *string) error { return nil },
|
|
)
|
|
if err == nil || !strings.Contains(err.Error(), "upstream stream error") {
|
|
t.Errorf("expected upstream-error surfacing, got %v", err)
|
|
}
|
|
}
|
|
|
|
func TestGPUStackListModelsHappyPath(t *testing.T) {
|
|
srv := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
|
|
if r.Method != http.MethodGet {
|
|
t.Errorf("method=%s want GET", r.Method)
|
|
}
|
|
if r.URL.Path != "/v1/models" {
|
|
t.Errorf("path=%s", r.URL.Path)
|
|
}
|
|
if got := r.Header.Get("Authorization"); got != "Bearer test-key" {
|
|
t.Errorf("Authorization=%q", got)
|
|
}
|
|
_ = json.NewEncoder(w).Encode(map[string]interface{}{
|
|
"data": []map[string]interface{}{
|
|
{"id": "qwen3-8b"},
|
|
{"id": "qwen3-32b"},
|
|
},
|
|
})
|
|
}))
|
|
defer srv.Close()
|
|
|
|
apiKey := "test-key"
|
|
model := newGPUStackForTest(srv.URL)
|
|
models, err := model.ListModels(&APIConfig{ApiKey: &apiKey})
|
|
if err != nil {
|
|
t.Fatalf("ListModels: %v", err)
|
|
}
|
|
if joinModelNames(models, ",") != "qwen3-8b,qwen3-32b" {
|
|
t.Errorf("models=%v", models)
|
|
}
|
|
if err := model.CheckConnection(&APIConfig{ApiKey: &apiKey}); err != nil {
|
|
t.Fatalf("CheckConnection: %v", err)
|
|
}
|
|
}
|
|
|
|
func TestGPUStackListModelsAllowsEmptyAPIKey(t *testing.T) {
|
|
_, err := newGPUStackForTest("http://unused").ListModels(&APIConfig{})
|
|
if err == nil || strings.Contains(err.Error(), "api key is required") {
|
|
t.Errorf("self-hosted model should not require api key, got %v", err)
|
|
}
|
|
}
|
|
|
|
// TestGPUStackEmbedHappyPath verifies request shape and dimensions on v1-openai/embeddings.
|
|
func TestGPUStackEmbedHappyPath(t *testing.T) {
|
|
srv := newGPUStackServer(t, gpustackEmbeddingsPath, func(t *testing.T, body map[string]interface{}, w http.ResponseWriter) {
|
|
if body["model"] != "bge-m3" {
|
|
t.Errorf("model=%v", body["model"])
|
|
}
|
|
if body["dimensions"] != float64(512) {
|
|
t.Errorf("dimensions=%v, want 512", body["dimensions"])
|
|
}
|
|
inputs, ok := body["input"].([]interface{})
|
|
if !ok || len(inputs) != 2 {
|
|
t.Errorf("input=%v, want 2-element array", body["input"])
|
|
}
|
|
_ = json.NewEncoder(w).Encode(map[string]interface{}{
|
|
"data": []map[string]interface{}{
|
|
{"embedding": []float64{0.2, 0.2}, "index": 1},
|
|
{"embedding": []float64{0.1, 0.2}, "index": 0},
|
|
},
|
|
})
|
|
})
|
|
defer srv.Close()
|
|
|
|
apiKey := "test-key"
|
|
model := "bge-m3"
|
|
vecs, err := newGPUStackForTest(srv.URL).Embed(
|
|
&model, []string{"a", "b"}, &APIConfig{ApiKey: &apiKey}, &EmbeddingConfig{Dimension: 512})
|
|
if err != nil {
|
|
t.Fatalf("Embed: %v", err)
|
|
}
|
|
if len(vecs) != 2 {
|
|
t.Fatalf("len(vecs)=%d, want 2", len(vecs))
|
|
}
|
|
if vecs[0].Index != 0 || vecs[0].Embedding[0] != 0.1 || vecs[1].Index != 1 || vecs[1].Embedding[0] != 0.2 {
|
|
t.Errorf("vecs=%+v", vecs)
|
|
}
|
|
}
|
|
|
|
// TestGPUStackEmbedReordersByIndex verifies out-of-order response indices are mapped correctly.
|
|
func TestGPUStackEmbedReordersByIndex(t *testing.T) {
|
|
srv := newGPUStackServer(t, gpustackEmbeddingsPath, func(t *testing.T, _ map[string]interface{}, w http.ResponseWriter) {
|
|
_ = json.NewEncoder(w).Encode(map[string]interface{}{
|
|
"data": []map[string]interface{}{
|
|
{"embedding": []float64{2}, "index": 2},
|
|
{"embedding": []float64{0}, "index": 0},
|
|
{"embedding": []float64{1}, "index": 1},
|
|
},
|
|
})
|
|
})
|
|
defer srv.Close()
|
|
|
|
apiKey := "test-key"
|
|
model := "bge-m3"
|
|
vecs, err := newGPUStackForTest(srv.URL).Embed(
|
|
&model, []string{"a", "b", "c"}, &APIConfig{ApiKey: &apiKey}, nil)
|
|
if err != nil {
|
|
t.Fatalf("Embed: %v", err)
|
|
}
|
|
for i, v := range vecs {
|
|
if v.Index != i || v.Embedding[0] != float64(i) {
|
|
t.Errorf("slot %d = %+v, want Embedding=[%d] Index=%d", i, v, i, i)
|
|
}
|
|
}
|
|
}
|
|
|
|
// TestGPUStackEmbedEmptyInputShortCircuits avoids HTTP when texts is empty.
|
|
func TestGPUStackEmbedEmptyInputShortCircuits(t *testing.T) {
|
|
srv := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, _ *http.Request) {
|
|
t.Error("Embed([]) made an unexpected HTTP call")
|
|
w.WriteHeader(http.StatusInternalServerError)
|
|
}))
|
|
defer srv.Close()
|
|
|
|
apiKey := "test-key"
|
|
model := "bge-m3"
|
|
vecs, err := newGPUStackForTest(srv.URL).Embed(&model, []string{}, &APIConfig{ApiKey: &apiKey}, nil)
|
|
if err != nil {
|
|
t.Fatalf("Embed([]): %v", err)
|
|
}
|
|
if len(vecs) != 0 {
|
|
t.Errorf("len(vecs)=%d, want 0", len(vecs))
|
|
}
|
|
}
|
|
|
|
// TestGPUStackEmbedAllowsEmptyAPIKey verifies that Embed does not fail with "api key is required" when the API key is empty.
|
|
func TestGPUStackEmbedAllowsEmptyAPIKey(t *testing.T) {
|
|
model := "bge-m3"
|
|
_, err := newGPUStackForTest("http://unused").Embed(&model, []string{"a"}, &APIConfig{}, nil)
|
|
if err == nil || strings.Contains(err.Error(), "api key is required") {
|
|
t.Errorf("self-hosted model should not require api key, got %v", err)
|
|
}
|
|
}
|
|
|
|
// TestGPUStackEmbedRejectsDuplicateIndex errors on duplicate response indices.
|
|
func TestGPUStackEmbedRejectsDuplicateIndex(t *testing.T) {
|
|
srv := newGPUStackServer(t, gpustackEmbeddingsPath, func(t *testing.T, _ map[string]interface{}, w http.ResponseWriter) {
|
|
_ = json.NewEncoder(w).Encode(map[string]interface{}{
|
|
"data": []map[string]interface{}{
|
|
{"embedding": []float64{0.1}, "index": 0},
|
|
{"embedding": []float64{0.2}, "index": 0},
|
|
},
|
|
})
|
|
})
|
|
defer srv.Close()
|
|
|
|
apiKey := "test-key"
|
|
model := "bge-m3"
|
|
_, err := newGPUStackForTest(srv.URL).Embed(&model, []string{"a", "b"}, &APIConfig{ApiKey: &apiKey}, nil)
|
|
if err == nil || !strings.Contains(err.Error(), "duplicate") {
|
|
t.Errorf("expected duplicate-index error, got %v", err)
|
|
}
|
|
}
|
|
|
|
// TestGPUStackEmbedRejectsOutOfRangeIndex errors when index exceeds input length.
|
|
func TestGPUStackEmbedRejectsOutOfRangeIndex(t *testing.T) {
|
|
srv := newGPUStackServer(t, gpustackEmbeddingsPath, func(t *testing.T, _ map[string]interface{}, w http.ResponseWriter) {
|
|
_ = json.NewEncoder(w).Encode(map[string]interface{}{
|
|
"data": []map[string]interface{}{
|
|
{"embedding": []float64{0.1}, "index": 2},
|
|
},
|
|
})
|
|
})
|
|
defer srv.Close()
|
|
|
|
apiKey := "test-key"
|
|
model := "bge-m3"
|
|
_, err := newGPUStackForTest(srv.URL).Embed(&model, []string{"a", "b"}, &APIConfig{ApiKey: &apiKey}, nil)
|
|
if err == nil || !strings.Contains(err.Error(), "out of range") {
|
|
t.Errorf("expected out-of-range error, got %v", err)
|
|
}
|
|
}
|
|
|
|
// TestGPUStackEmbedRejectsMissingIndex errors when index is omitted from response.
|
|
func TestGPUStackEmbedRejectsMissingIndex(t *testing.T) {
|
|
srv := newGPUStackServer(t, gpustackEmbeddingsPath, func(t *testing.T, _ map[string]interface{}, w http.ResponseWriter) {
|
|
_ = json.NewEncoder(w).Encode(map[string]interface{}{
|
|
"data": []map[string]interface{}{
|
|
{"embedding": []float64{0.1}},
|
|
},
|
|
})
|
|
})
|
|
defer srv.Close()
|
|
|
|
apiKey := "test-key"
|
|
model := "bge-m3"
|
|
_, err := newGPUStackForTest(srv.URL).Embed(&model, []string{"a"}, &APIConfig{ApiKey: &apiKey}, nil)
|
|
if err == nil || !strings.Contains(err.Error(), "missing embedding index") {
|
|
t.Errorf("expected missing-index error, got %v", err)
|
|
}
|
|
}
|
|
|
|
// TestGPUStackEmbedRejectsEmptyVector errors when the API returns a zero-length vector.
|
|
func TestGPUStackEmbedRejectsEmptyVector(t *testing.T) {
|
|
srv := newGPUStackServer(t, gpustackEmbeddingsPath, func(t *testing.T, _ map[string]interface{}, w http.ResponseWriter) {
|
|
_ = json.NewEncoder(w).Encode(map[string]interface{}{
|
|
"data": []map[string]interface{}{
|
|
{"embedding": []float64{}, "index": 0},
|
|
},
|
|
})
|
|
})
|
|
defer srv.Close()
|
|
|
|
apiKey := "test-key"
|
|
model := "bge-m3"
|
|
_, err := newGPUStackForTest(srv.URL).Embed(&model, []string{"a"}, &APIConfig{ApiKey: &apiKey}, nil)
|
|
if err == nil || !strings.Contains(err.Error(), "empty embedding vector") {
|
|
t.Errorf("expected empty-vector error, got %v", err)
|
|
}
|
|
}
|
|
|
|
// TestGPUStackEmbedRejectsMissingSlot errors when a response index is never returned.
|
|
func TestGPUStackEmbedRejectsMissingSlot(t *testing.T) {
|
|
srv := newGPUStackServer(t, gpustackEmbeddingsPath, func(t *testing.T, _ map[string]interface{}, w http.ResponseWriter) {
|
|
_ = json.NewEncoder(w).Encode(map[string]interface{}{
|
|
"data": []map[string]interface{}{
|
|
{"embedding": []float64{0.1}, "index": 0},
|
|
},
|
|
})
|
|
})
|
|
defer srv.Close()
|
|
|
|
apiKey := "test-key"
|
|
model := "bge-m3"
|
|
_, err := newGPUStackForTest(srv.URL).Embed(&model, []string{"a", "b"}, &APIConfig{ApiKey: &apiKey}, nil)
|
|
if err == nil || !strings.Contains(err.Error(), "missing embedding for input index") {
|
|
t.Errorf("expected missing-slot error, got %v", err)
|
|
}
|
|
}
|
|
|
|
func TestGPUStackUnsupportedMethods(t *testing.T) {
|
|
m := newGPUStackForTest("http://unused")
|
|
model := "x"
|
|
if _, err := m.Rerank(&model, "q", []string{"a"}, &APIConfig{}, &RerankConfig{TopN: 1}); err == nil || !strings.Contains(err.Error(), "no such method") {
|
|
t.Errorf("Rerank: %v", err)
|
|
}
|
|
if _, err := m.Balance(&APIConfig{}); err == nil || !strings.Contains(err.Error(), "no such method") {
|
|
t.Errorf("Balance: %v", err)
|
|
}
|
|
if _, err := m.TranscribeAudio(&model, &model, &APIConfig{}, nil); err == nil || !strings.Contains(err.Error(), "no such method") {
|
|
t.Errorf("TranscribeAudio: %v", err)
|
|
}
|
|
if _, err := m.AudioSpeech(&model, &model, &APIConfig{}, nil); err == nil || !strings.Contains(err.Error(), "no such method") {
|
|
t.Errorf("AudioSpeech: %v", err)
|
|
}
|
|
if _, err := m.OCRFile(&model, nil, &model, &APIConfig{}, nil); err == nil || !strings.Contains(err.Error(), "no such method") {
|
|
t.Errorf("OCRFile: %v", err)
|
|
}
|
|
}
|