Files
ragflow/internal/entity/models/novita_test.go
Jack 338fdb65fb feat(ci): enable go test in CI pipeline (#15750)
## What problem does this PR solve?

Go test files are never compiled in CI — only production binaries via
`go build`. This allowed a missing `"sort"` import in
`metadata_filter_test.go` to be merged without detection.

## Type of change

- [x] Bug Fix (non-breaking change which fixes an issue)
- [x] New Feature (non-breaking change which adds functionality)

## Changes

- Add `go test -count=1 ./internal/...` step after Go build in CI
workflow
- Fix missing `"sort"` import in `metadata_filter_test.go` (pre-existing
compile error)

🤖 Generated with [Claude Code](https://claude.com/claude-code)

---------

Co-authored-by: Claude Opus 4.8 <noreply@anthropic.com>
2026-06-08 20:06:57 +08:00

921 lines
30 KiB
Go

package models
import (
"encoding/json"
"io"
"net/http"
"net/http/httptest"
"strings"
"testing"
)
func newNovitaServer(t *testing.T, expectedPath string, handler func(t *testing.T, body map[string]interface{}, w http.ResponseWriter)) *httptest.Server {
t.Helper()
return httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
if r.URL.Path != expectedPath {
t.Errorf("expected path=%s, got %s", expectedPath, r.URL.Path)
return
}
if got := r.Header.Get("Authorization"); got != "Bearer test-key" {
t.Errorf("expected Authorization=Bearer test-key, got %q", got)
return
}
// Content-Type must declare JSON on BOTH POST chat (body is
// JSON) and GET ListModels (Novita platform expects callers to
// negotiate JSON content even though the body is empty —
// maintainer review explicitly flagged the missing header).
if got := r.Header.Get("Content-Type"); !strings.HasPrefix(got, "application/json") {
t.Errorf("expected Content-Type to start with application/json, got %q", got)
return
}
if r.Method == http.MethodPost {
raw, err := io.ReadAll(r.Body)
if err != nil {
t.Errorf("read body: %v", err)
return
}
var body map[string]interface{}
if err := json.Unmarshal(raw, &body); err != nil {
t.Errorf("unmarshal: %v\nraw=%s", err, string(raw))
return
}
handler(t, body, w)
return
}
handler(t, nil, w)
}))
}
func newNovitaForTest(baseURL string) *NovitaModel {
return NewNovitaModel(
map[string]string{"default": baseURL},
URLSuffix{
Chat: "openai/v1/chat/completions",
Models: "openai/v1/models",
Embedding: "openai/v1/embeddings",
Rerank: "openai/v1/rerank",
},
)
}
func TestNovitaNewModelWithCustomDefaultTransport(t *testing.T) {
original := http.DefaultTransport
http.DefaultTransport = roundTripperFunc(func(*http.Request) (*http.Response, error) {
return nil, nil
})
t.Cleanup(func() {
http.DefaultTransport = original
})
if model := NewNovitaModel(map[string]string{"default": "http://unused"}, URLSuffix{}); model == nil {
t.Fatal("NewNovitaModel returned nil")
}
}
// newNovitaSSEServer asserts the SSE-chat wire contract (POST, path,
// Authorization, Content-Type) the same way newNovitaServer does for
// the JSON-chat path, then writes the supplied SSE payload. Closes
// the gap CodeRabbit flagged where streaming tests used
// httptest.NewServer directly and skipped the request-shape checks.
func newNovitaSSEServer(t *testing.T, expectedPath, ssePayload string) *httptest.Server {
t.Helper()
return httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
if r.Method != http.MethodPost {
t.Errorf("expected POST, got %s", r.Method)
return
}
if r.URL.Path != expectedPath {
t.Errorf("expected path=%s, got %s", expectedPath, r.URL.Path)
return
}
if got := r.Header.Get("Authorization"); got != "Bearer test-key" {
t.Errorf("expected Authorization=Bearer test-key, got %q", got)
return
}
if got := r.Header.Get("Content-Type"); !strings.HasPrefix(got, "application/json") {
t.Errorf("expected Content-Type to start with application/json, got %q", got)
return
}
w.Header().Set("Content-Type", "text/event-stream")
_, _ = io.WriteString(w, ssePayload)
}))
}
// ---- think-tag split helpers ----
func TestSplitNovitaThinkPureText(t *testing.T) {
v, r := splitNovitaThink("hello world")
if v != "hello world" || r != "" {
t.Errorf("got (%q,%q)", v, r)
}
}
func TestSplitNovitaThinkSingleBlock(t *testing.T) {
v, r := splitNovitaThink("<think>15% = 0.15. 0.15*80 = 12.</think>The answer is 12.")
if v != "The answer is 12." {
t.Errorf("visible=%q", v)
}
if r != "15% = 0.15. 0.15*80 = 12." {
t.Errorf("reasoning=%q", r)
}
}
func TestSplitNovitaThinkLeadingText(t *testing.T) {
v, r := splitNovitaThink("intro <think>thought</think>tail")
if v != "intro tail" {
t.Errorf("visible=%q", v)
}
if r != "thought" {
t.Errorf("reasoning=%q", r)
}
}
func TestSplitNovitaThinkMultipleBlocks(t *testing.T) {
v, r := splitNovitaThink("<think>A</think>part1<think>B</think>part2")
if v != "part1part2" {
t.Errorf("visible=%q", v)
}
if r != "AB" {
t.Errorf("reasoning=%q", r)
}
}
func TestSplitNovitaThinkUnclosedTag(t *testing.T) {
// Unclosed <think> -> everything after the open tag is reasoning;
// content stops at the open tag. This matches a real upstream that
// got cut off mid-reasoning by max_tokens.
v, r := splitNovitaThink("visible <think>still thinking when tokens ran out")
if v != "visible " {
t.Errorf("visible=%q", v)
}
if r != "still thinking when tokens ran out" {
t.Errorf("reasoning=%q", r)
}
}
// ---- streaming extractor ----
// Helper to push multiple chunks through and concatenate all output by
// kind. Each chunk goes into Feed; the output is what's safe to emit.
func feedAll(e *novitaThinkExtractor, chunks []string) (content, reasoning string) {
var cb, rb strings.Builder
for _, c := range chunks {
for _, seg := range e.Feed(c) {
cb.WriteString(seg.content)
rb.WriteString(seg.reasoning)
}
}
if seg := e.Flush(); seg != nil {
cb.WriteString(seg.content)
rb.WriteString(seg.reasoning)
}
return cb.String(), rb.String()
}
func TestNovitaThinkExtractorSingleChunk(t *testing.T) {
e := &novitaThinkExtractor{}
c, r := feedAll(e, []string{"hello <think>thought</think> world"})
if c != "hello world" {
t.Errorf("content=%q", c)
}
if r != "thought" {
t.Errorf("reasoning=%q", r)
}
}
func TestNovitaThinkExtractorTagSpansChunks(t *testing.T) {
// "<think>" split across two SSE deltas: "<thi" + "nk>"
e := &novitaThinkExtractor{}
c, r := feedAll(e, []string{"hello <thi", "nk>thought</think>tail"})
if c != "hello tail" {
t.Errorf("content=%q", c)
}
if r != "thought" {
t.Errorf("reasoning=%q", r)
}
}
func TestNovitaThinkExtractorClosingTagSpansChunks(t *testing.T) {
// "</think>" split across two deltas
e := &novitaThinkExtractor{}
c, r := feedAll(e, []string{"<think>reasoning</thi", "nk>visible"})
if c != "visible" {
t.Errorf("content=%q", c)
}
if r != "reasoning" {
t.Errorf("reasoning=%q", r)
}
}
func TestNovitaThinkExtractorTokenBoundaries(t *testing.T) {
// Simulate the kind of chunking we saw on the wire for qwen3 — many
// small chunks, sometimes splitting tag bytes.
e := &novitaThinkExtractor{}
c, r := feedAll(e, []string{
"<", "think>", "Ok", "ay, ", "compute. </", "think>", "12", "."})
if c != "12." {
t.Errorf("content=%q", c)
}
if r != "Okay, compute. " {
t.Errorf("reasoning=%q", r)
}
}
func TestNovitaThinkExtractorNoTags(t *testing.T) {
e := &novitaThinkExtractor{}
c, r := feedAll(e, []string{"plain ", "content ", "all ", "the way"})
if c != "plain content all the way" {
t.Errorf("content=%q", c)
}
if r != "" {
t.Errorf("reasoning=%q", r)
}
}
func TestNovitaThinkExtractorLessThanIsNotTagStart(t *testing.T) {
// "<10" or "<a" in legitimate content must not be held back as
// possible tag start. The extractor reserves trailing bytes only
// when a "<" is present in the suffix.
e := &novitaThinkExtractor{}
c, r := feedAll(e, []string{"a < b and c < d"})
if c != "a < b and c < d" {
t.Errorf("content=%q", c)
}
if r != "" {
t.Errorf("reasoning=%q", r)
}
}
// ---- driver methods ----
func TestNovitaName(t *testing.T) {
if got := newNovitaForTest("http://unused").Name(); got != "novita" {
t.Errorf("Name()=%q", got)
}
}
func TestNovitaChatPureText(t *testing.T) {
srv := newNovitaServer(t, "/openai/v1/chat/completions", func(t *testing.T, body map[string]interface{}, w http.ResponseWriter) {
_ = json.NewEncoder(w).Encode(map[string]interface{}{
"choices": []map[string]interface{}{{
"message": map[string]interface{}{"content": "pong"},
}},
})
})
defer srv.Close()
apiKey := "test-key"
resp, err := newNovitaForTest(srv.URL).ChatWithMessages(
"meta-llama/llama-3.3-70b-instruct",
[]Message{{Role: "user", Content: "ping"}},
&APIConfig{ApiKey: &apiKey}, nil)
if err != nil {
t.Fatalf("Chat: %v", err)
}
if *resp.Answer != "pong" || *resp.ReasonContent != "" {
t.Errorf("(%q,%q)", *resp.Answer, *resp.ReasonContent)
}
}
func TestNovitaChatExtractsThinkTags(t *testing.T) {
// qwen3-style response: <think>...</think> embedded in content.
// Driver must split it into Answer + ReasonContent.
srv := newNovitaServer(t, "/openai/v1/chat/completions", func(t *testing.T, body map[string]interface{}, w http.ResponseWriter) {
_ = json.NewEncoder(w).Encode(map[string]interface{}{
"choices": []map[string]interface{}{{
"message": map[string]interface{}{
"role": "assistant",
"content": "<think>15% = 0.15; 0.15 * 80 = 12.</think>The answer is 12.",
},
}},
})
})
defer srv.Close()
apiKey := "test-key"
resp, err := newNovitaForTest(srv.URL).ChatWithMessages(
"qwen/qwen3-30b-a3b-fp8",
[]Message{{Role: "user", Content: "15% of 80?"}},
&APIConfig{ApiKey: &apiKey}, nil)
if err != nil {
t.Fatalf("Chat: %v", err)
}
if *resp.Answer != "The answer is 12." {
t.Errorf("Answer=%q", *resp.Answer)
}
if *resp.ReasonContent != "15% = 0.15; 0.15 * 80 = 12." {
t.Errorf("ReasonContent=%q", *resp.ReasonContent)
}
}
// deepseek-v3.1 / glm-4.5 with enable_thinking=true return reasoning
// in a separate `reasoning_content` field on the message rather than
// inline as <think>...</think>. The driver must surface this field
// to ChatResponse.ReasonContent. Live-confirmed against
// api.novita.ai/openai/v1/chat/completions with deepseek/deepseek-v3.1.
func TestNovitaChatExtractsReasoningContentField(t *testing.T) {
srv := newNovitaServer(t, "/openai/v1/chat/completions", func(t *testing.T, body map[string]interface{}, w http.ResponseWriter) {
_ = json.NewEncoder(w).Encode(map[string]interface{}{
"choices": []map[string]interface{}{{
"message": map[string]interface{}{
"role": "assistant",
"content": "4",
"reasoning_content": "2+2 is straightforward arithmetic: the answer is 4.",
},
}},
})
})
defer srv.Close()
apiKey := "test-key"
resp, err := newNovitaForTest(srv.URL).ChatWithMessages(
"deepseek/deepseek-v3.1",
[]Message{{Role: "user", Content: "2+2?"}},
&APIConfig{ApiKey: &apiKey}, nil)
if err != nil {
t.Fatalf("Chat: %v", err)
}
if resp.Answer == nil || resp.ReasonContent == nil {
t.Fatalf("Answer/ReasonContent must be non-nil pointers")
}
if *resp.Answer != "4" {
t.Errorf("Answer=%q", *resp.Answer)
}
if *resp.ReasonContent != "2+2 is straightforward arithmetic: the answer is 4." {
t.Errorf("ReasonContent=%q", *resp.ReasonContent)
}
}
// Streaming deepseek-v3.1 with thinking on emits delta.reasoning_content
// (not delta.content with <think> tags). The driver must forward
// those chunks via the sender's second arg.
func TestNovitaStreamExtractsDeltaReasoningContent(t *testing.T) {
srv := newNovitaSSEServer(t, "/openai/v1/chat/completions",
`data: {"choices":[{"index":0,"delta":{"role":"assistant","reasoning_content":"step 1. "}}]}`+"\n"+
`data: {"choices":[{"index":0,"delta":{"reasoning_content":"step 2."}}]}`+"\n"+
`data: {"choices":[{"index":0,"delta":{"content":"final answer"},"finish_reason":"stop"}]}`+"\n"+
`data: [DONE]`+"\n",
)
defer srv.Close()
apiKey := "test-key"
var content, reasoning []string
err := newNovitaForTest(srv.URL).ChatStreamlyWithSender(
"deepseek/deepseek-v3.1",
[]Message{{Role: "user", Content: "x"}},
&APIConfig{ApiKey: &apiKey}, nil,
func(c *string, r *string) error {
if c != nil && r != nil {
t.Errorf("sender called with both args non-nil")
}
if r != nil && *r != "" {
reasoning = append(reasoning, *r)
}
if c != nil && *c != "" && *c != "[DONE]" {
content = append(content, *c)
}
return nil
})
if err != nil {
t.Fatalf("stream: %v", err)
}
if got := strings.Join(reasoning, ""); got != "step 1. step 2." {
t.Errorf("reasoning=%q", got)
}
if got := strings.Join(content, ""); got != "final answer" {
t.Errorf("content=%q", got)
}
}
// TestNovitaChatPropagatesEnableThinking pins the maintainer's
// requested behaviour: when ChatConfig.Thinking is set, the driver
// MUST forward it as Novita's documented `enable_thinking` body field
// so a tenant can switch a deepseek-v3.1 / glm-4.5 / qwen3 deployment
// out of its default thinking mode without prompt-level hacks.
func TestNovitaChatPropagatesEnableThinking(t *testing.T) {
cases := []struct {
name string
value bool
}{
{"enabled", true},
{"disabled", false},
}
for _, tc := range cases {
t.Run(tc.name, func(t *testing.T) {
srv := newNovitaServer(t, "/openai/v1/chat/completions", func(t *testing.T, body map[string]interface{}, w http.ResponseWriter) {
got, present := body["enable_thinking"]
if !present {
t.Errorf("enable_thinking missing from body, want %v", tc.value)
}
if got != tc.value {
t.Errorf("enable_thinking=%v want %v", got, tc.value)
}
_ = json.NewEncoder(w).Encode(map[string]interface{}{
"choices": []map[string]interface{}{{
"message": map[string]interface{}{"content": "ok"},
}},
})
})
defer srv.Close()
apiKey := "test-key"
thinking := tc.value
_, err := newNovitaForTest(srv.URL).ChatWithMessages(
"qwen/qwen3-30b-a3b-fp8",
[]Message{{Role: "user", Content: "x"}},
&APIConfig{ApiKey: &apiKey},
&ChatConfig{Thinking: &thinking})
if err != nil {
t.Fatalf("Chat: %v", err)
}
})
}
}
// Sending enable_thinking when the caller didn't ask for it would
// silently flip behavior for downstream proxies that distinguish
// "field absent" from "field present with default". Leave it out.
func TestNovitaChatOmitsEnableThinkingWhenUnset(t *testing.T) {
srv := newNovitaServer(t, "/openai/v1/chat/completions", func(t *testing.T, body map[string]interface{}, w http.ResponseWriter) {
if _, present := body["enable_thinking"]; present {
t.Errorf("enable_thinking must be absent when Thinking unset, got %v", body["enable_thinking"])
}
_ = json.NewEncoder(w).Encode(map[string]interface{}{
"choices": []map[string]interface{}{{
"message": map[string]interface{}{"content": "ok"},
}},
})
})
defer srv.Close()
apiKey := "test-key"
_, err := newNovitaForTest(srv.URL).ChatWithMessages("m",
[]Message{{Role: "user", Content: "x"}},
&APIConfig{ApiKey: &apiKey},
&ChatConfig{}) // no Thinking
if err != nil {
t.Fatalf("Chat: %v", err)
}
}
// TestNovitaStreamPropagatesEnableThinking mirrors the non-stream
// case for ChatStreamlyWithSender so callers get the same toggle
// regardless of streaming mode.
func TestNovitaStreamPropagatesEnableThinking(t *testing.T) {
var seen map[string]interface{}
srv := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
raw, _ := io.ReadAll(r.Body)
_ = json.Unmarshal(raw, &seen)
w.Header().Set("Content-Type", "text/event-stream")
_, _ = io.WriteString(w,
`data: {"choices":[{"delta":{"content":"ok"},"finish_reason":"stop"}]}`+"\n"+
`data: [DONE]`+"\n",
)
}))
defer srv.Close()
apiKey := "test-key"
thinking := false
err := newNovitaForTest(srv.URL).ChatStreamlyWithSender(
"deepseek/deepseek-v3.1",
[]Message{{Role: "user", Content: "x"}},
&APIConfig{ApiKey: &apiKey},
&ChatConfig{Thinking: &thinking},
func(*string, *string) error { return nil })
if err != nil {
t.Fatalf("Stream: %v", err)
}
if got, ok := seen["enable_thinking"].(bool); !ok || got != false {
t.Errorf("stream enable_thinking=%v want false", seen["enable_thinking"])
}
}
func TestNovitaChatRequiresAPIKey(t *testing.T) {
_, err := newNovitaForTest("http://unused").ChatWithMessages("m",
[]Message{{Role: "user", Content: "x"}}, &APIConfig{}, nil)
if err == nil || !strings.Contains(err.Error(), "api key is required") {
t.Errorf("got %v", err)
}
}
func TestNovitaChatRequiresMessages(t *testing.T) {
apiKey := "test-key"
_, err := newNovitaForTest("http://unused").ChatWithMessages("m", nil,
&APIConfig{ApiKey: &apiKey}, nil)
if err == nil || !strings.Contains(err.Error(), "messages is empty") {
t.Errorf("got %v", err)
}
}
func TestNovitaChatRejectsHTTPError(t *testing.T) {
srv := newNovitaServer(t, "/openai/v1/chat/completions", func(t *testing.T, body map[string]interface{}, w http.ResponseWriter) {
w.WriteHeader(http.StatusUnauthorized)
_, _ = w.Write([]byte(`{"detail":"unauthorized"}`))
})
defer srv.Close()
apiKey := "test-key"
_, err := newNovitaForTest(srv.URL).ChatWithMessages("m",
[]Message{{Role: "user", Content: "x"}},
&APIConfig{ApiKey: &apiKey}, nil)
if err == nil || !strings.Contains(err.Error(), "401") {
t.Errorf("got %v", err)
}
}
// Streaming: an SSE stream that emits <think>...</think> inline in
// delta.content must surface reasoning chunks through the sender's
// second arg, and visible content through the first.
func TestNovitaStreamSplitsThinkTags(t *testing.T) {
// Simulate the realistic case where tags span deltas — split
// "<think>" across two chunks, and split "</think>" too.
srv := newNovitaSSEServer(t, "/openai/v1/chat/completions",
`data: {"choices":[{"index":0,"delta":{"role":"assistant"}}]}`+"\n"+
`data: {"choices":[{"index":0,"delta":{"content":"<"}}]}`+"\n"+
`data: {"choices":[{"index":0,"delta":{"content":"think>"}}]}`+"\n"+
`data: {"choices":[{"index":0,"delta":{"content":"Okay, "}}]}`+"\n"+
`data: {"choices":[{"index":0,"delta":{"content":"compute. </"}}]}`+"\n"+
`data: {"choices":[{"index":0,"delta":{"content":"think>"}}]}`+"\n"+
`data: {"choices":[{"index":0,"delta":{"content":"12"}}]}`+"\n"+
`data: {"choices":[{"index":0,"delta":{"content":"."},"finish_reason":"stop"}]}`+"\n"+
`data: [DONE]`+"\n",
)
defer srv.Close()
apiKey := "test-key"
var content, reasoning []string
err := newNovitaForTest(srv.URL).ChatStreamlyWithSender(
"qwen/qwen3-30b-a3b-fp8",
[]Message{{Role: "user", Content: "x"}},
&APIConfig{ApiKey: &apiKey}, nil,
func(c *string, r *string) error {
if c != nil && r != nil {
t.Errorf("sender called with both args non-nil")
}
if r != nil && *r != "" {
reasoning = append(reasoning, *r)
}
if c != nil && *c != "" && *c != "[DONE]" {
content = append(content, *c)
}
return nil
})
if err != nil {
t.Fatalf("stream: %v", err)
}
gotContent := strings.Join(content, "")
gotReason := strings.Join(reasoning, "")
if gotContent != "12." {
t.Errorf("content=%q want %q", gotContent, "12.")
}
if gotReason != "Okay, compute. " {
t.Errorf("reasoning=%q", gotReason)
}
}
// Streaming for a non-reasoning model that emits only content chunks
// must continue to work unchanged.
func TestNovitaStreamPureContent(t *testing.T) {
srv := newNovitaSSEServer(t, "/openai/v1/chat/completions",
`data: {"choices":[{"index":0,"delta":{"role":"assistant"}}]}`+"\n"+
`data: {"choices":[{"index":0,"delta":{"content":"Hello "}}]}`+"\n"+
`data: {"choices":[{"index":0,"delta":{"content":"world"},"finish_reason":"stop"}]}`+"\n"+
`data: [DONE]`+"\n",
)
defer srv.Close()
apiKey := "test-key"
var chunks []string
var sawDone bool
err := newNovitaForTest(srv.URL).ChatStreamlyWithSender("meta-llama/llama-3.3-70b-instruct",
[]Message{{Role: "user", Content: "x"}},
&APIConfig{ApiKey: &apiKey}, nil,
func(c *string, _ *string) error {
if c == nil {
return nil
}
if *c == "[DONE]" {
sawDone = true
return nil
}
chunks = append(chunks, *c)
return nil
})
if err != nil {
t.Fatalf("stream: %v", err)
}
if strings.Join(chunks, "") != "Hello world" {
t.Errorf("content=%v", chunks)
}
if !sawDone {
t.Error("expected [DONE] sentinel")
}
}
func TestNovitaStreamRequiresSender(t *testing.T) {
apiKey := "test-key"
err := newNovitaForTest("http://unused").ChatStreamlyWithSender("m",
[]Message{{Role: "user", Content: "x"}},
&APIConfig{ApiKey: &apiKey}, nil, nil)
if err == nil || !strings.Contains(err.Error(), "sender is required") {
t.Errorf("got %v", err)
}
}
func TestNovitaStreamRejectsExplicitFalse(t *testing.T) {
apiKey := "test-key"
stream := false
err := newNovitaForTest("http://unused").ChatStreamlyWithSender("m",
[]Message{{Role: "user", Content: "x"}},
&APIConfig{ApiKey: &apiKey},
&ChatConfig{Stream: &stream},
func(*string, *string) error { return nil })
if err == nil || !strings.Contains(err.Error(), "stream must be true") {
t.Errorf("got %v", err)
}
}
func TestNovitaListModelsHappyPath(t *testing.T) {
srv := newNovitaServer(t, "/openai/v1/models", func(t *testing.T, _ map[string]interface{}, w http.ResponseWriter) {
_ = json.NewEncoder(w).Encode(map[string]interface{}{
"data": []map[string]interface{}{
{"id": "meta-llama/llama-3.3-70b-instruct"},
{"id": "qwen/qwen3-30b-a3b-fp8"},
{"id": "deepseek/deepseek-v4-pro"},
},
})
})
defer srv.Close()
apiKey := "test-key"
ids, err := newNovitaForTest(srv.URL).ListModels(&APIConfig{ApiKey: &apiKey})
if err != nil {
t.Fatalf("ListModels: %v", err)
}
if len(ids) != 3 {
t.Errorf("ids=%v", ids)
}
}
func TestNovitaCheckConnection(t *testing.T) {
srv := newNovitaServer(t, "/openai/v1/models", func(t *testing.T, _ map[string]interface{}, w http.ResponseWriter) {
_ = json.NewEncoder(w).Encode(map[string]interface{}{"data": []map[string]interface{}{{"id": "x"}}})
})
defer srv.Close()
apiKey := "test-key"
if err := newNovitaForTest(srv.URL).CheckConnection(&APIConfig{ApiKey: &apiKey}); err != nil {
t.Errorf("CheckConnection: %v", err)
}
}
func TestNovitaRerankHappyPathReordersByIndex(t *testing.T) {
srv := newNovitaServer(t, "/openai/v1/rerank", func(t *testing.T, body map[string]interface{}, w http.ResponseWriter) {
if body["model"] != "baai/bge-reranker-v2-m3" {
t.Errorf("model=%v", body["model"])
}
if body["query"] != "what is rag" {
t.Errorf("query=%v", body["query"])
}
docs, ok := body["documents"].([]interface{})
if !ok || len(docs) != 3 || docs[0] != "a" || docs[1] != "b" || docs[2] != "c" {
t.Errorf("documents=%v", body["documents"])
}
if body["top_n"] != float64(3) {
t.Errorf("top_n=%v, want 3", body["top_n"])
}
_, _ = io.WriteString(w, `{"results":[{"document":{"text":"c"},"index":2,"relevance_score":0.91},{"document":{"text":"a"},"index":0,"relevance_score":0.42},{"document":{"text":"b"},"index":1,"relevance_score":0.08}]}`)
})
defer srv.Close()
apiKey := "test-key"
model := "baai/bge-reranker-v2-m3"
resp, err := newNovitaForTest(srv.URL).Rerank(&model, "what is rag", []string{"a", "b", "c"}, &APIConfig{ApiKey: &apiKey}, nil)
if err != nil {
t.Fatalf("Rerank: %v", err)
}
if len(resp.Data) != 3 {
t.Fatalf("len(Data)=%d, want 3", len(resp.Data))
}
want := map[int]float64{2: 0.91, 0: 0.42, 1: 0.08}
for i, item := range resp.Data {
if want[item.Index] != item.RelevanceScore {
t.Errorf("Data[%d]={Index:%d, Score:%v}", i, item.Index, item.RelevanceScore)
}
}
}
func TestNovitaRerankRespectsTopNConfig(t *testing.T) {
srv := newNovitaServer(t, "/openai/v1/rerank", func(t *testing.T, body map[string]interface{}, w http.ResponseWriter) {
if body["top_n"] != float64(2) {
t.Errorf("top_n=%v, want 2", body["top_n"])
}
_, _ = io.WriteString(w, `{"results":[{"index":0,"relevance_score":0.9},{"index":1,"relevance_score":0.5}]}`)
})
defer srv.Close()
apiKey := "test-key"
model := "baai/bge-reranker-v2-m3"
if _, err := newNovitaForTest(srv.URL).Rerank(&model, "q", []string{"a", "b", "c"}, &APIConfig{ApiKey: &apiKey}, &RerankConfig{TopN: 2}); err != nil {
t.Fatalf("Rerank: %v", err)
}
}
func TestNovitaRerankEmptyDocumentsShortCircuits(t *testing.T) {
apiKey := "test-key"
model := "x"
resp, err := newNovitaForTest("http://unused").Rerank(&model, "q", nil, &APIConfig{ApiKey: &apiKey}, nil)
if err != nil {
t.Fatalf("expected nil error for empty docs, got %v", err)
}
if len(resp.Data) != 0 {
t.Errorf("len(Data)=%d, want 0", len(resp.Data))
}
}
func TestNovitaRerankRequiresApiKey(t *testing.T) {
model := "x"
_, err := newNovitaForTest("http://unused").Rerank(&model, "q", []string{"a"}, &APIConfig{}, nil)
if err == nil || !strings.Contains(err.Error(), "api key is required") {
t.Errorf("got %v", err)
}
}
func TestNovitaRerankRequiresModelName(t *testing.T) {
apiKey := "test-key"
_, err := newNovitaForTest("http://unused").Rerank(nil, "q", []string{"a"}, &APIConfig{ApiKey: &apiKey}, nil)
if err == nil || !strings.Contains(err.Error(), "model name is required") {
t.Errorf("got %v", err)
}
}
func TestNovitaRerankRejectsOutOfRangeIndex(t *testing.T) {
srv := newNovitaServer(t, "/openai/v1/rerank", func(t *testing.T, body map[string]interface{}, w http.ResponseWriter) {
_, _ = io.WriteString(w, `{"results":[{"index":5,"relevance_score":0.5}]}`)
})
defer srv.Close()
apiKey := "test-key"
model := "x"
_, err := newNovitaForTest(srv.URL).Rerank(&model, "q", []string{"a", "b"}, &APIConfig{ApiKey: &apiKey}, nil)
if err == nil || !strings.Contains(err.Error(), "out of range") {
t.Errorf("got %v", err)
}
}
func TestNovitaRerankRejectsDuplicateIndex(t *testing.T) {
srv := newNovitaServer(t, "/openai/v1/rerank", func(t *testing.T, body map[string]interface{}, w http.ResponseWriter) {
_, _ = io.WriteString(w, `{"results":[{"index":0,"relevance_score":0.9},{"index":0,"relevance_score":0.5}]}`)
})
defer srv.Close()
apiKey := "test-key"
model := "x"
_, err := newNovitaForTest(srv.URL).Rerank(&model, "q", []string{"a", "b"}, &APIConfig{ApiKey: &apiKey}, nil)
if err == nil || !strings.Contains(err.Error(), "duplicate") {
t.Errorf("got %v", err)
}
}
func TestNovitaRerankSurfacesHTTPError(t *testing.T) {
srv := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
w.WriteHeader(http.StatusUnauthorized)
_, _ = io.WriteString(w, `{"error":"bad key"}`)
}))
defer srv.Close()
apiKey := "test-key"
model := "x"
_, err := newNovitaForTest(srv.URL).Rerank(&model, "q", []string{"a"}, &APIConfig{ApiKey: &apiKey}, nil)
if err == nil || !strings.Contains(err.Error(), "Novita rerank API error") {
t.Errorf("got %v", err)
}
}
func TestNovitaRerankRejectsMissingRerankSuffix(t *testing.T) {
apiKey := "test-key"
model := "x"
driver := NewNovitaModel(
map[string]string{"default": "http://unused"},
URLSuffix{Chat: "openai/v1/chat/completions"},
)
_, err := driver.Rerank(&model, "q", []string{"a"}, &APIConfig{ApiKey: &apiKey}, nil)
if err == nil || !strings.Contains(err.Error(), "no rerank URL suffix configured") {
t.Errorf("got %v", err)
}
}
func TestNovitaBalanceReturnsNoSuchMethod(t *testing.T) {
// Balance IS implemented (makes HTTP call), not a "no such method" stub.
// With dummy key it should reach the HTTP call stage, not fail at APIConfigCheck.
apiKey := "test-key"
_, err := newNovitaForTest("http://unused").Balance(&APIConfig{ApiKey: &apiKey})
if err == nil || strings.Contains(err.Error(), "api key is required") {
t.Errorf("expected non-api-key error (e.g. connection refused), got %v", err)
}
}
func TestNovitaAudioOCRReturnNoSuchMethod(t *testing.T) {
m := "x"
apiKey := "test-key"
v := newNovitaForTest("http://unused")
if _, err := v.TranscribeAudio(&m, &m, &APIConfig{ApiKey: &apiKey}, nil); err == nil || !strings.Contains(err.Error(), "no such method") {
t.Errorf("TranscribeAudio: %v", err)
}
if _, err := v.AudioSpeech(&m, &m, &APIConfig{ApiKey: &apiKey}, nil); err == nil || !strings.Contains(err.Error(), "no such method") {
t.Errorf("AudioSpeech: %v", err)
}
if _, err := v.OCRFile(&m, nil, &m, &APIConfig{ApiKey: &apiKey}, nil); err == nil || !strings.Contains(err.Error(), "no such method") {
t.Errorf("OCRFile: %v", err)
}
}
// TestNovitaBaseURLTrimsTrailingSlash pins the fix for a `//`-in-path
// bug a tenant could hit by configuring a baseURL like
// "https://api.novita.ai/v3/openai/". Every URL the driver builds via
// fmt.Sprintf("%s/%s", base, suffix) would then produce a double
// slash. baseURLForRegion now trims the trailing "/" so all three
// endpoint builders (Chat, Stream, ListModels) emit clean paths.
func TestNovitaBaseURLTrimsTrailingSlash(t *testing.T) {
cases := []struct {
name string
path string
method string
invoke func(n *NovitaModel, apiKey string) error
urlSuffix URLSuffix
respBody string
respHeaders map[string]string
}{
{
name: "Chat",
path: "/openai/v1/chat/completions",
method: http.MethodPost,
urlSuffix: URLSuffix{Chat: "openai/v1/chat/completions"},
invoke: func(n *NovitaModel, apiKey string) error {
_, err := n.ChatWithMessages("m",
[]Message{{Role: "user", Content: "x"}},
&APIConfig{ApiKey: &apiKey}, nil)
return err
},
respBody: `{"choices":[{"message":{"content":"ok"}}]}`,
},
{
name: "ListModels",
path: "/openai/v1/models",
method: http.MethodGet,
urlSuffix: URLSuffix{Models: "openai/v1/models"},
invoke: func(n *NovitaModel, apiKey string) error {
_, err := n.ListModels(&APIConfig{ApiKey: &apiKey})
return err
},
respBody: `{"data":[]}`,
},
{
name: "Stream",
path: "/openai/v1/chat/completions",
method: http.MethodPost,
urlSuffix: URLSuffix{Chat: "openai/v1/chat/completions"},
invoke: func(n *NovitaModel, apiKey string) error {
return n.ChatStreamlyWithSender("m",
[]Message{{Role: "user", Content: "x"}},
&APIConfig{ApiKey: &apiKey}, nil,
func(*string, *string) error { return nil })
},
respBody: `data: {"choices":[{"index":0,"delta":{"content":"hi"},"finish_reason":"stop"}]}` + "\n" +
`data: [DONE]` + "\n",
respHeaders: map[string]string{"Content-Type": "text/event-stream"},
},
}
for _, tc := range cases {
t.Run(tc.name, func(t *testing.T) {
srv := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
// The load-bearing assertion: path is the clean
// "/openai/v1/chat/completions" or "/openai/v1/models", never "//chat/...".
if r.URL.Path != tc.path {
t.Errorf("path=%q want %q (double-slash bug?)", r.URL.Path, tc.path)
return
}
if r.Method != tc.method {
t.Errorf("method=%s want %s", r.Method, tc.method)
return
}
for k, v := range tc.respHeaders {
w.Header().Set(k, v)
}
_, _ = io.WriteString(w, tc.respBody)
}))
defer srv.Close()
// Configure baseURL WITH a trailing slash on purpose.
n := NewNovitaModel(
map[string]string{"default": srv.URL + "/"},
tc.urlSuffix,
)
apiKey := "test-key"
if err := tc.invoke(n, apiKey); err != nil {
t.Fatalf("%s: %v", tc.name, err)
}
})
}
}