package openai import ( "encoding/json" "testing" "time" "github.com/ollama/ollama/api" ) func TestResponsesInputMessage_UnmarshalJSON(t *testing.T) { tests := []struct { name string json string want ResponsesInputMessage wantErr bool }{ { name: "text content", json: `{"type": "message", "role": "user", "content": [{"type": "input_text", "text": "hello"}]}`, want: ResponsesInputMessage{ Type: "message", Role: "user", Content: []ResponsesContent{ResponsesTextContent{Type: "input_text", Text: "hello"}}, }, }, { name: "image content", json: `{"type": "message", "role": "user", "content": [{"type": "input_image", "detail": "auto", "image_url": "https://example.com/img.png"}]}`, want: ResponsesInputMessage{ Type: "message", Role: "user", Content: []ResponsesContent{ResponsesImageContent{ Type: "input_image", Detail: "auto", ImageURL: "https://example.com/img.png", }}, }, }, { name: "multiple content items", json: `{"type": "message", "role": "user", "content": [{"type": "input_text", "text": "hello"}, {"type": "input_text", "text": "world"}]}`, want: ResponsesInputMessage{ Type: "message", Role: "user", Content: []ResponsesContent{ ResponsesTextContent{Type: "input_text", Text: "hello"}, ResponsesTextContent{Type: "input_text", Text: "world"}, }, }, }, { name: "unknown content type", json: `{"type": "message", "role": "user", "content": [{"type": "unknown"}]}`, wantErr: true, }, } for _, tt := range tests { t.Run(tt.name, func(t *testing.T) { var got ResponsesInputMessage err := json.Unmarshal([]byte(tt.json), &got) if tt.wantErr { if err == nil { t.Error("expected error, got nil") } return } if err != nil { t.Fatalf("unexpected error: %v", err) } if got.Type != tt.want.Type { t.Errorf("Type = %q, want %q", got.Type, tt.want.Type) } if got.Role != tt.want.Role { t.Errorf("Role = %q, want %q", got.Role, tt.want.Role) } if len(got.Content) != len(tt.want.Content) { t.Fatalf("len(Content) = %d, want %d", len(got.Content), len(tt.want.Content)) } for i := range tt.want.Content { switch wantContent := tt.want.Content[i].(type) { case ResponsesTextContent: gotContent, ok := got.Content[i].(ResponsesTextContent) if !ok { t.Fatalf("Content[%d] type = %T, want ResponsesTextContent", i, got.Content[i]) } if gotContent != wantContent { t.Errorf("Content[%d] = %+v, want %+v", i, gotContent, wantContent) } case ResponsesImageContent: gotContent, ok := got.Content[i].(ResponsesImageContent) if !ok { t.Fatalf("Content[%d] type = %T, want ResponsesImageContent", i, got.Content[i]) } if gotContent != wantContent { t.Errorf("Content[%d] = %+v, want %+v", i, gotContent, wantContent) } } } }) } } func TestResponsesInput_UnmarshalJSON(t *testing.T) { tests := []struct { name string json string wantText string wantItems int wantErr bool }{ { name: "plain string", json: `"hello world"`, wantText: "hello world", }, { name: "array with one message", json: `[{"type": "message", "role": "user", "content": [{"type": "input_text", "text": "hello"}]}]`, wantItems: 1, }, { name: "array with multiple messages", json: `[{"type": "message", "role": "system", "content": [{"type": "input_text", "text": "you are helpful"}]}, {"type": "message", "role": "user", "content": [{"type": "input_text", "text": "hello"}]}]`, wantItems: 2, }, { name: "invalid input", json: `123`, wantErr: true, }, } for _, tt := range tests { t.Run(tt.name, func(t *testing.T) { var got ResponsesInput err := json.Unmarshal([]byte(tt.json), &got) if tt.wantErr { if err == nil { t.Error("expected error, got nil") } return } if err != nil { t.Fatalf("unexpected error: %v", err) } if got.Text != tt.wantText { t.Errorf("Text = %q, want %q", got.Text, tt.wantText) } if len(got.Items) != tt.wantItems { t.Errorf("len(Items) = %d, want %d", len(got.Items), tt.wantItems) } }) } } func TestUnmarshalResponsesInputItem(t *testing.T) { t.Run("message item", func(t *testing.T) { got, err := unmarshalResponsesInputItem([]byte(`{"type": "message", "role": "user", "content": [{"type": "input_text", "text": "hello"}]}`)) if err != nil { t.Fatalf("unexpected error: %v", err) } msg, ok := got.(ResponsesInputMessage) if !ok { t.Fatalf("got type %T, want ResponsesInputMessage", got) } if msg.Role != "user" { t.Errorf("Role = %q, want %q", msg.Role, "user") } }) t.Run("function_call item", func(t *testing.T) { got, err := unmarshalResponsesInputItem([]byte(`{"type": "function_call", "call_id": "call_abc123", "name": "get_weather", "arguments": "{\"city\":\"Paris\"}"}`)) if err != nil { t.Fatalf("unexpected error: %v", err) } fc, ok := got.(ResponsesFunctionCall) if !ok { t.Fatalf("got type %T, want ResponsesFunctionCall", got) } if fc.Type != "function_call" { t.Errorf("Type = %q, want %q", fc.Type, "function_call") } if fc.CallID != "call_abc123" { t.Errorf("CallID = %q, want %q", fc.CallID, "call_abc123") } if fc.Name != "get_weather" { t.Errorf("Name = %q, want %q", fc.Name, "get_weather") } }) t.Run("function_call_output item", func(t *testing.T) { got, err := unmarshalResponsesInputItem([]byte(`{"type": "function_call_output", "call_id": "call_abc123", "output": "the result"}`)) if err != nil { t.Fatalf("unexpected error: %v", err) } output, ok := got.(ResponsesFunctionCallOutput) if !ok { t.Fatalf("got type %T, want ResponsesFunctionCallOutput", got) } if output.Type != "function_call_output" { t.Errorf("Type = %q, want %q", output.Type, "function_call_output") } if output.CallID != "call_abc123" { t.Errorf("CallID = %q, want %q", output.CallID, "call_abc123") } if output.Output != "the result" { t.Errorf("Output = %q, want %q", output.Output, "the result") } }) t.Run("unknown item type", func(t *testing.T) { _, err := unmarshalResponsesInputItem([]byte(`{"type": "unknown_type"}`)) if err == nil { t.Error("expected error, got nil") } }) } func TestResponsesRequest_UnmarshalJSON(t *testing.T) { tests := []struct { name string json string check func(t *testing.T, req ResponsesRequest) wantErr bool }{ { name: "simple string input", json: `{"model": "gpt-oss:20b", "input": "hello"}`, check: func(t *testing.T, req ResponsesRequest) { if req.Model != "gpt-oss:20b" { t.Errorf("Model = %q, want %q", req.Model, "gpt-oss:20b") } if req.Input.Text != "hello" { t.Errorf("Input.Text = %q, want %q", req.Input.Text, "hello") } }, }, { name: "array input with messages", json: `{"model": "gpt-oss:20b", "input": [{"type": "message", "role": "user", "content": [{"type": "input_text", "text": "hello"}]}]}`, check: func(t *testing.T, req ResponsesRequest) { if len(req.Input.Items) != 1 { t.Fatalf("len(Input.Items) = %d, want 1", len(req.Input.Items)) } msg, ok := req.Input.Items[0].(ResponsesInputMessage) if !ok { t.Fatalf("Input.Items[0] type = %T, want ResponsesInputMessage", req.Input.Items[0]) } if msg.Role != "user" { t.Errorf("Role = %q, want %q", msg.Role, "user") } }, }, { name: "with temperature", json: `{"model": "gpt-oss:20b", "input": "hello", "temperature": 0.5}`, check: func(t *testing.T, req ResponsesRequest) { if req.Temperature == nil || *req.Temperature != 0.5 { t.Errorf("Temperature = %v, want 0.5", req.Temperature) } }, }, } for _, tt := range tests { t.Run(tt.name, func(t *testing.T) { var got ResponsesRequest err := json.Unmarshal([]byte(tt.json), &got) if tt.wantErr { if err == nil { t.Error("expected error, got nil") } return } if err != nil { t.Fatalf("unexpected error: %v", err) } if tt.check != nil { tt.check(t, got) } }) } } func TestFromResponsesRequest_Tools(t *testing.T) { reqJSON := `{ "model": "gpt-oss:20b", "input": "hello", "tools": [ { "type": "function", "name": "shell", "description": "Runs a shell command", "strict": false, "parameters": { "type": "object", "properties": { "command": { "type": "array", "items": {"type": "string"}, "description": "The command to execute" } }, "required": ["command"] } } ] }` var req ResponsesRequest if err := json.Unmarshal([]byte(reqJSON), &req); err != nil { t.Fatalf("failed to unmarshal request: %v", err) } // Check that tools were parsed if len(req.Tools) != 1 { t.Fatalf("expected 1 tool, got %d", len(req.Tools)) } if req.Tools[0].Name != "shell" { t.Errorf("expected tool name 'shell', got %q", req.Tools[0].Name) } // Convert and check chatReq, err := FromResponsesRequest(req) if err != nil { t.Fatalf("failed to convert request: %v", err) } if len(chatReq.Tools) != 1 { t.Fatalf("expected 1 converted tool, got %d", len(chatReq.Tools)) } tool := chatReq.Tools[0] if tool.Type != "function" { t.Errorf("expected tool type 'function', got %q", tool.Type) } if tool.Function.Name != "shell" { t.Errorf("expected function name 'shell', got %q", tool.Function.Name) } if tool.Function.Description != "Runs a shell command" { t.Errorf("expected function description 'Runs a shell command', got %q", tool.Function.Description) } if tool.Function.Parameters.Type != "object" { t.Errorf("expected parameters type 'object', got %q", tool.Function.Parameters.Type) } if len(tool.Function.Parameters.Required) != 1 || tool.Function.Parameters.Required[0] != "command" { t.Errorf("expected required ['command'], got %v", tool.Function.Parameters.Required) } } func TestFromResponsesRequest_FunctionCallOutput(t *testing.T) { // Test a complete tool call round-trip: // 1. User message asking about weather // 2. Assistant's function call (from previous response) // 3. Function call output (the tool result) reqJSON := `{ "model": "gpt-oss:20b", "input": [ {"type": "message", "role": "user", "content": [{"type": "input_text", "text": "what is the weather?"}]}, {"type": "function_call", "call_id": "call_abc123", "name": "get_weather", "arguments": "{\"city\":\"Paris\"}"}, {"type": "function_call_output", "call_id": "call_abc123", "output": "sunny, 72F"} ] }` var req ResponsesRequest if err := json.Unmarshal([]byte(reqJSON), &req); err != nil { t.Fatalf("failed to unmarshal request: %v", err) } // Check that input items were parsed if len(req.Input.Items) != 3 { t.Fatalf("expected 3 input items, got %d", len(req.Input.Items)) } // Verify the function_call item fc, ok := req.Input.Items[1].(ResponsesFunctionCall) if !ok { t.Fatalf("Input.Items[1] type = %T, want ResponsesFunctionCall", req.Input.Items[1]) } if fc.Name != "get_weather" { t.Errorf("Name = %q, want %q", fc.Name, "get_weather") } // Verify the function_call_output item fcOutput, ok := req.Input.Items[2].(ResponsesFunctionCallOutput) if !ok { t.Fatalf("Input.Items[2] type = %T, want ResponsesFunctionCallOutput", req.Input.Items[2]) } if fcOutput.CallID != "call_abc123" { t.Errorf("CallID = %q, want %q", fcOutput.CallID, "call_abc123") } // Convert and check chatReq, err := FromResponsesRequest(req) if err != nil { t.Fatalf("failed to convert request: %v", err) } if len(chatReq.Messages) != 3 { t.Fatalf("expected 3 messages, got %d", len(chatReq.Messages)) } // Check the user message userMsg := chatReq.Messages[0] if userMsg.Role != "user" { t.Errorf("expected role 'user', got %q", userMsg.Role) } // Check the assistant message with tool call assistantMsg := chatReq.Messages[1] if assistantMsg.Role != "assistant" { t.Errorf("expected role 'assistant', got %q", assistantMsg.Role) } if len(assistantMsg.ToolCalls) != 1 { t.Fatalf("expected 1 tool call, got %d", len(assistantMsg.ToolCalls)) } if assistantMsg.ToolCalls[0].ID != "call_abc123" { t.Errorf("expected tool call ID 'call_abc123', got %q", assistantMsg.ToolCalls[0].ID) } if assistantMsg.ToolCalls[0].Function.Name != "get_weather" { t.Errorf("expected function name 'get_weather', got %q", assistantMsg.ToolCalls[0].Function.Name) } // Check the tool response message toolMsg := chatReq.Messages[2] if toolMsg.Role != "tool" { t.Errorf("expected role 'tool', got %q", toolMsg.Role) } if toolMsg.Content != "sunny, 72F" { t.Errorf("expected content 'sunny, 72F', got %q", toolMsg.Content) } if toolMsg.ToolCallID != "call_abc123" { t.Errorf("expected ToolCallID 'call_abc123', got %q", toolMsg.ToolCallID) } } func TestFromResponsesRequest_FunctionCallMerge(t *testing.T) { t.Run("function call merges with preceding assistant message", func(t *testing.T) { // When assistant message has content followed by function_call, // they should be merged into a single message reqJSON := `{ "model": "gpt-oss:20b", "input": [ {"type": "message", "role": "user", "content": [{"type": "input_text", "text": "what is the weather?"}]}, {"type": "message", "role": "assistant", "content": [{"type": "output_text", "text": "I'll check the weather for you."}]}, {"type": "function_call", "call_id": "call_abc123", "name": "get_weather", "arguments": "{\"city\":\"Paris\"}"} ] }` var req ResponsesRequest if err := json.Unmarshal([]byte(reqJSON), &req); err != nil { t.Fatalf("failed to unmarshal request: %v", err) } chatReq, err := FromResponsesRequest(req) if err != nil { t.Fatalf("failed to convert request: %v", err) } // Should have 2 messages: user and assistant (with content + tool call merged) if len(chatReq.Messages) != 2 { t.Fatalf("expected 2 messages, got %d", len(chatReq.Messages)) } // Check user message if chatReq.Messages[0].Role != "user" { t.Errorf("Messages[0].Role = %q, want %q", chatReq.Messages[0].Role, "user") } // Check assistant message has both content and tool call assistantMsg := chatReq.Messages[1] if assistantMsg.Role != "assistant" { t.Errorf("Messages[1].Role = %q, want %q", assistantMsg.Role, "assistant") } if assistantMsg.Content != "I'll check the weather for you." { t.Errorf("Messages[1].Content = %q, want %q", assistantMsg.Content, "I'll check the weather for you.") } if len(assistantMsg.ToolCalls) != 1 { t.Fatalf("expected 1 tool call, got %d", len(assistantMsg.ToolCalls)) } if assistantMsg.ToolCalls[0].Function.Name != "get_weather" { t.Errorf("ToolCalls[0].Function.Name = %q, want %q", assistantMsg.ToolCalls[0].Function.Name, "get_weather") } }) t.Run("function call without preceding assistant creates new message", func(t *testing.T) { // When there's no preceding assistant message, function_call creates its own message reqJSON := `{ "model": "gpt-oss:20b", "input": [ {"type": "message", "role": "user", "content": [{"type": "input_text", "text": "what is the weather?"}]}, {"type": "function_call", "call_id": "call_abc123", "name": "get_weather", "arguments": "{\"city\":\"Paris\"}"} ] }` var req ResponsesRequest if err := json.Unmarshal([]byte(reqJSON), &req); err != nil { t.Fatalf("failed to unmarshal request: %v", err) } chatReq, err := FromResponsesRequest(req) if err != nil { t.Fatalf("failed to convert request: %v", err) } // Should have 2 messages: user and assistant (tool call only) if len(chatReq.Messages) != 2 { t.Fatalf("expected 2 messages, got %d", len(chatReq.Messages)) } // Check assistant message has tool call but no content assistantMsg := chatReq.Messages[1] if assistantMsg.Role != "assistant" { t.Errorf("Messages[1].Role = %q, want %q", assistantMsg.Role, "assistant") } if assistantMsg.Content != "" { t.Errorf("Messages[1].Content = %q, want empty", assistantMsg.Content) } if len(assistantMsg.ToolCalls) != 1 { t.Fatalf("expected 1 tool call, got %d", len(assistantMsg.ToolCalls)) } }) t.Run("multiple function calls merge into same assistant message", func(t *testing.T) { // Multiple consecutive function_calls should all merge into the same assistant message reqJSON := `{ "model": "gpt-oss:20b", "input": [ {"type": "message", "role": "user", "content": [{"type": "input_text", "text": "check weather and time"}]}, {"type": "message", "role": "assistant", "content": [{"type": "output_text", "text": "I'll check both."}]}, {"type": "function_call", "call_id": "call_1", "name": "get_weather", "arguments": "{\"city\":\"Paris\"}"}, {"type": "function_call", "call_id": "call_2", "name": "get_time", "arguments": "{\"city\":\"Paris\"}"} ] }` var req ResponsesRequest if err := json.Unmarshal([]byte(reqJSON), &req); err != nil { t.Fatalf("failed to unmarshal request: %v", err) } chatReq, err := FromResponsesRequest(req) if err != nil { t.Fatalf("failed to convert request: %v", err) } // Should have 2 messages: user and assistant (content + both tool calls) if len(chatReq.Messages) != 2 { t.Fatalf("expected 2 messages, got %d", len(chatReq.Messages)) } // Assistant has content + both tool calls assistantMsg := chatReq.Messages[1] if assistantMsg.Content != "I'll check both." { t.Errorf("Messages[1].Content = %q, want %q", assistantMsg.Content, "I'll check both.") } if len(assistantMsg.ToolCalls) != 2 { t.Fatalf("expected 2 tool calls, got %d", len(assistantMsg.ToolCalls)) } if assistantMsg.ToolCalls[0].Function.Name != "get_weather" { t.Errorf("ToolCalls[0].Function.Name = %q, want %q", assistantMsg.ToolCalls[0].Function.Name, "get_weather") } if assistantMsg.ToolCalls[1].Function.Name != "get_time" { t.Errorf("ToolCalls[1].Function.Name = %q, want %q", assistantMsg.ToolCalls[1].Function.Name, "get_time") } }) t.Run("new assistant message starts fresh tool call group", func(t *testing.T) { // assistant → tool_call → tool_call → assistant → tool_call // Should result in 2 assistant messages with their respective tool calls reqJSON := `{ "model": "gpt-oss:20b", "input": [ {"type": "message", "role": "user", "content": [{"type": "input_text", "text": "do multiple things"}]}, {"type": "message", "role": "assistant", "content": [{"type": "output_text", "text": "First batch."}]}, {"type": "function_call", "call_id": "call_1", "name": "func_a", "arguments": "{}"}, {"type": "function_call", "call_id": "call_2", "name": "func_b", "arguments": "{}"}, {"type": "message", "role": "assistant", "content": [{"type": "output_text", "text": "Second batch."}]}, {"type": "function_call", "call_id": "call_3", "name": "func_c", "arguments": "{}"} ] }` var req ResponsesRequest if err := json.Unmarshal([]byte(reqJSON), &req); err != nil { t.Fatalf("failed to unmarshal request: %v", err) } chatReq, err := FromResponsesRequest(req) if err != nil { t.Fatalf("failed to convert request: %v", err) } // Should have 3 messages: // 1. user // 2. assistant "First batch." + tool calls [func_a, func_b] // 3. assistant "Second batch." + tool calls [func_c] if len(chatReq.Messages) != 3 { t.Fatalf("expected 3 messages, got %d", len(chatReq.Messages)) } asst1 := chatReq.Messages[1] if asst1.Content != "First batch." { t.Errorf("Messages[1].Content = %q, want %q", asst1.Content, "First batch.") } if len(asst1.ToolCalls) != 2 { t.Fatalf("expected 2 tool calls in Messages[1], got %d", len(asst1.ToolCalls)) } if asst1.ToolCalls[0].Function.Name != "func_a" { t.Errorf("Messages[1].ToolCalls[0] = %q, want %q", asst1.ToolCalls[0].Function.Name, "func_a") } if asst1.ToolCalls[1].Function.Name != "func_b" { t.Errorf("Messages[1].ToolCalls[1] = %q, want %q", asst1.ToolCalls[1].Function.Name, "func_b") } asst2 := chatReq.Messages[2] if asst2.Content != "Second batch." { t.Errorf("Messages[2].Content = %q, want %q", asst2.Content, "Second batch.") } if len(asst2.ToolCalls) != 1 { t.Fatalf("expected 1 tool call in Messages[2], got %d", len(asst2.ToolCalls)) } if asst2.ToolCalls[0].Function.Name != "func_c" { t.Errorf("Messages[2].ToolCalls[0] = %q, want %q", asst2.ToolCalls[0].Function.Name, "func_c") } }) t.Run("function call merges with assistant that has thinking", func(t *testing.T) { // reasoning → assistant (gets thinking) → function_call → should merge reqJSON := `{ "model": "gpt-oss:20b", "input": [ {"type": "message", "role": "user", "content": [{"type": "input_text", "text": "think and act"}]}, {"type": "reasoning", "id": "rs_1", "encrypted_content": "Let me think...", "summary": []}, {"type": "message", "role": "assistant", "content": [{"type": "output_text", "text": "I thought about it."}]}, {"type": "function_call", "call_id": "call_1", "name": "do_thing", "arguments": "{}"} ] }` var req ResponsesRequest if err := json.Unmarshal([]byte(reqJSON), &req); err != nil { t.Fatalf("failed to unmarshal request: %v", err) } chatReq, err := FromResponsesRequest(req) if err != nil { t.Fatalf("failed to convert request: %v", err) } // Should have 2 messages: user and assistant (thinking + content + tool call) if len(chatReq.Messages) != 2 { t.Fatalf("expected 2 messages, got %d", len(chatReq.Messages)) } asst := chatReq.Messages[1] if asst.Thinking != "Let me think..." { t.Errorf("Messages[1].Thinking = %q, want %q", asst.Thinking, "Let me think...") } if asst.Content != "I thought about it." { t.Errorf("Messages[1].Content = %q, want %q", asst.Content, "I thought about it.") } if len(asst.ToolCalls) != 1 { t.Fatalf("expected 1 tool call, got %d", len(asst.ToolCalls)) } if asst.ToolCalls[0].Function.Name != "do_thing" { t.Errorf("ToolCalls[0].Function.Name = %q, want %q", asst.ToolCalls[0].Function.Name, "do_thing") } }) t.Run("mixed thinking and content with multiple tool calls", func(t *testing.T) { // Test: // 1. reasoning → assistant (empty content, gets thinking) → tc (merges) // 2. assistant with content → tc → tc (both merge) // Result: 2 assistant messages reqJSON := `{ "model": "gpt-oss:20b", "input": [ {"type": "message", "role": "user", "content": [{"type": "input_text", "text": "complex task"}]}, {"type": "reasoning", "id": "rs_1", "encrypted_content": "Thinking first...", "summary": []}, {"type": "message", "role": "assistant", "content": ""}, {"type": "function_call", "call_id": "call_1", "name": "think_action", "arguments": "{}"}, {"type": "message", "role": "assistant", "content": [{"type": "output_text", "text": "Now doing more."}]}, {"type": "function_call", "call_id": "call_2", "name": "action_a", "arguments": "{}"}, {"type": "function_call", "call_id": "call_3", "name": "action_b", "arguments": "{}"} ] }` var req ResponsesRequest if err := json.Unmarshal([]byte(reqJSON), &req); err != nil { t.Fatalf("failed to unmarshal request: %v", err) } chatReq, err := FromResponsesRequest(req) if err != nil { t.Fatalf("failed to convert request: %v", err) } // Should have 3 messages: // 1. user // 2. assistant with thinking + tool call [think_action] // 3. assistant with content "Now doing more." + tool calls [action_a, action_b] if len(chatReq.Messages) != 3 { t.Fatalf("expected 3 messages, got %d", len(chatReq.Messages)) } // First assistant: thinking + tool call asst1 := chatReq.Messages[1] if asst1.Thinking != "Thinking first..." { t.Errorf("Messages[1].Thinking = %q, want %q", asst1.Thinking, "Thinking first...") } if asst1.Content != "" { t.Errorf("Messages[1].Content = %q, want empty", asst1.Content) } if len(asst1.ToolCalls) != 1 { t.Fatalf("expected 1 tool call in Messages[1], got %d", len(asst1.ToolCalls)) } if asst1.ToolCalls[0].Function.Name != "think_action" { t.Errorf("Messages[1].ToolCalls[0] = %q, want %q", asst1.ToolCalls[0].Function.Name, "think_action") } // Second assistant: content + 2 tool calls asst2 := chatReq.Messages[2] if asst2.Content != "Now doing more." { t.Errorf("Messages[2].Content = %q, want %q", asst2.Content, "Now doing more.") } if len(asst2.ToolCalls) != 2 { t.Fatalf("expected 2 tool calls in Messages[2], got %d", len(asst2.ToolCalls)) } if asst2.ToolCalls[0].Function.Name != "action_a" { t.Errorf("Messages[2].ToolCalls[0] = %q, want %q", asst2.ToolCalls[0].Function.Name, "action_a") } if asst2.ToolCalls[1].Function.Name != "action_b" { t.Errorf("Messages[2].ToolCalls[1] = %q, want %q", asst2.ToolCalls[1].Function.Name, "action_b") } }) } func TestDecodeImageURL(t *testing.T) { // Valid PNG base64 (1x1 red pixel) validPNG := "" t.Run("valid png", func(t *testing.T) { img, err := decodeImageURL(validPNG) if err != nil { t.Fatalf("unexpected error: %v", err) } if len(img) == 0 { t.Error("expected non-empty image data") } }) t.Run("valid jpeg", func(t *testing.T) { // Just test the prefix validation with minimal base64 _, err := decodeImageURL("") if err != nil { t.Fatalf("unexpected error: %v", err) } }) t.Run("blank mime type", func(t *testing.T) { _, err := decodeImageURL("data:;base64,dGVzdA==") if err != nil { t.Fatalf("unexpected error: %v", err) } }) t.Run("invalid mime type", func(t *testing.T) { _, err := decodeImageURL("") if err == nil { t.Error("expected error for unsupported mime type") } }) t.Run("invalid base64", func(t *testing.T) { _, err := decodeImageURL("-valid-base64!") if err == nil { t.Error("expected error for invalid base64") } }) t.Run("not a data url", func(t *testing.T) { _, err := decodeImageURL("https://example.com/image.png") if err == nil { t.Error("expected error for non-data URL") } }) } func TestFromResponsesRequest_Images(t *testing.T) { // 1x1 red PNG pixel pngBase64 := "iVBORw0KGgoAAAANSUhEUgAAAAEAAAABCAYAAAAfFcSJAAAADUlEQVR42mP8z8DwHwAFBQIAX8jx0gAAAABJRU5ErkJggg==" reqJSON := `{ "model": "llava", "input": [ {"type": "message", "role": "user", "content": [ {"type": "input_text", "text": "What is in this image?"}, {"type": "input_image", "detail": "auto", "image_url": "data:image/png;base64,` + pngBase64 + `"} ]} ] }` var req ResponsesRequest if err := json.Unmarshal([]byte(reqJSON), &req); err != nil { t.Fatalf("failed to unmarshal request: %v", err) } chatReq, err := FromResponsesRequest(req) if err != nil { t.Fatalf("failed to convert request: %v", err) } if len(chatReq.Messages) != 1 { t.Fatalf("expected 1 message, got %d", len(chatReq.Messages)) } msg := chatReq.Messages[0] if msg.Role != "user" { t.Errorf("expected role 'user', got %q", msg.Role) } if msg.Content != "What is in this image?" { t.Errorf("expected content 'What is in this image?', got %q", msg.Content) } if len(msg.Images) != 1 { t.Fatalf("expected 1 image, got %d", len(msg.Images)) } if len(msg.Images[0]) == 0 { t.Error("expected non-empty image data") } } func TestResponsesStreamConverter_TextOnly(t *testing.T) { converter := NewResponsesStreamConverter("resp_123", "msg_456", "gpt-oss:20b") // First chunk with content events := converter.Process(api.ChatResponse{ Message: api.Message{ Content: "Hello", }, }) // Should have: response.created, response.in_progress, output_item.added, content_part.added, output_text.delta if len(events) != 5 { t.Fatalf("expected 5 events, got %d", len(events)) } if events[0].Event != "response.created" { t.Errorf("events[0].Event = %q, want %q", events[0].Event, "response.created") } if events[1].Event != "response.in_progress" { t.Errorf("events[1].Event = %q, want %q", events[1].Event, "response.in_progress") } if events[2].Event != "response.output_item.added" { t.Errorf("events[2].Event = %q, want %q", events[2].Event, "response.output_item.added") } if events[3].Event != "response.content_part.added" { t.Errorf("events[3].Event = %q, want %q", events[3].Event, "response.content_part.added") } if events[4].Event != "response.output_text.delta" { t.Errorf("events[4].Event = %q, want %q", events[4].Event, "response.output_text.delta") } // Second chunk with more content events = converter.Process(api.ChatResponse{ Message: api.Message{ Content: " World", }, }) // Should only have output_text.delta (no more created/in_progress/added) if len(events) != 1 { t.Fatalf("expected 1 event, got %d", len(events)) } if events[0].Event != "response.output_text.delta" { t.Errorf("events[0].Event = %q, want %q", events[0].Event, "response.output_text.delta") } // Final chunk events = converter.Process(api.ChatResponse{ Message: api.Message{}, Done: true, }) // Should have: output_text.done, content_part.done, output_item.done, response.completed if len(events) != 4 { t.Fatalf("expected 4 events, got %d", len(events)) } if events[0].Event != "response.output_text.done" { t.Errorf("events[0].Event = %q, want %q", events[0].Event, "response.output_text.done") } // Check that accumulated text is present data := events[0].Data.(map[string]any) if data["text"] != "Hello World" { t.Errorf("accumulated text = %q, want %q", data["text"], "Hello World") } } func TestResponsesStreamConverter_ToolCalls(t *testing.T) { converter := NewResponsesStreamConverter("resp_123", "msg_456", "gpt-oss:20b") events := converter.Process(api.ChatResponse{ Message: api.Message{ ToolCalls: []api.ToolCall{ { ID: "call_abc", Function: api.ToolCallFunction{ Name: "get_weather", Arguments: api.ToolCallFunctionArguments{"city": "Paris"}, }, }, }, }, }) // Should have: created, in_progress, output_item.added, arguments.delta, arguments.done, output_item.done if len(events) != 6 { t.Fatalf("expected 6 events, got %d", len(events)) } if events[2].Event != "response.output_item.added" { t.Errorf("events[2].Event = %q, want %q", events[2].Event, "response.output_item.added") } if events[3].Event != "response.function_call_arguments.delta" { t.Errorf("events[3].Event = %q, want %q", events[3].Event, "response.function_call_arguments.delta") } if events[4].Event != "response.function_call_arguments.done" { t.Errorf("events[4].Event = %q, want %q", events[4].Event, "response.function_call_arguments.done") } if events[5].Event != "response.output_item.done" { t.Errorf("events[5].Event = %q, want %q", events[5].Event, "response.output_item.done") } } func TestResponsesStreamConverter_Reasoning(t *testing.T) { converter := NewResponsesStreamConverter("resp_123", "msg_456", "gpt-oss:20b") // First chunk with thinking events := converter.Process(api.ChatResponse{ Message: api.Message{ Thinking: "Let me think...", }, }) // Should have: created, in_progress, output_item.added (reasoning), reasoning_summary_text.delta if len(events) != 4 { t.Fatalf("expected 4 events, got %d", len(events)) } if events[2].Event != "response.output_item.added" { t.Errorf("events[2].Event = %q, want %q", events[2].Event, "response.output_item.added") } // Check it's a reasoning item data := events[2].Data.(map[string]any) item := data["item"].(map[string]any) if item["type"] != "reasoning" { t.Errorf("item type = %q, want %q", item["type"], "reasoning") } if events[3].Event != "response.reasoning_summary_text.delta" { t.Errorf("events[3].Event = %q, want %q", events[3].Event, "response.reasoning_summary_text.delta") } // Second chunk with text content (reasoning should close first) events = converter.Process(api.ChatResponse{ Message: api.Message{ Content: "The answer is 42", }, }) // Should have: reasoning_summary_text.done, output_item.done (reasoning), output_item.added (message), content_part.added, output_text.delta if len(events) != 5 { t.Fatalf("expected 5 events, got %d", len(events)) } if events[0].Event != "response.reasoning_summary_text.done" { t.Errorf("events[0].Event = %q, want %q", events[0].Event, "response.reasoning_summary_text.done") } if events[1].Event != "response.output_item.done" { t.Errorf("events[1].Event = %q, want %q", events[1].Event, "response.output_item.done") } // Check the reasoning done item has encrypted_content doneData := events[1].Data.(map[string]any) doneItem := doneData["item"].(map[string]any) if doneItem["encrypted_content"] != "Let me think..." { t.Errorf("encrypted_content = %q, want %q", doneItem["encrypted_content"], "Let me think...") } } func TestFromResponsesRequest_ReasoningMerge(t *testing.T) { t.Run("reasoning merged with following message", func(t *testing.T) { reqJSON := `{ "model": "qwen3", "input": [ {"type": "message", "role": "user", "content": [{"type": "input_text", "text": "solve 2+2"}]}, {"type": "reasoning", "id": "rs_123", "encrypted_content": "Let me think about this math problem...", "summary": [{"type": "summary_text", "text": "Thinking about math"}]}, {"type": "message", "role": "assistant", "content": [{"type": "input_text", "text": "The answer is 4"}]} ] }` var req ResponsesRequest if err := json.Unmarshal([]byte(reqJSON), &req); err != nil { t.Fatalf("failed to unmarshal request: %v", err) } chatReq, err := FromResponsesRequest(req) if err != nil { t.Fatalf("failed to convert request: %v", err) } // Should have 2 messages: user and assistant (with thinking merged) if len(chatReq.Messages) != 2 { t.Fatalf("expected 2 messages, got %d", len(chatReq.Messages)) } // Check user message if chatReq.Messages[0].Role != "user" { t.Errorf("Messages[0].Role = %q, want %q", chatReq.Messages[0].Role, "user") } // Check assistant message has both content and thinking assistantMsg := chatReq.Messages[1] if assistantMsg.Role != "assistant" { t.Errorf("Messages[1].Role = %q, want %q", assistantMsg.Role, "assistant") } if assistantMsg.Content != "The answer is 4" { t.Errorf("Messages[1].Content = %q, want %q", assistantMsg.Content, "The answer is 4") } if assistantMsg.Thinking != "Let me think about this math problem..." { t.Errorf("Messages[1].Thinking = %q, want %q", assistantMsg.Thinking, "Let me think about this math problem...") } }) t.Run("reasoning merged with following function call", func(t *testing.T) { reqJSON := `{ "model": "qwen3", "input": [ {"type": "message", "role": "user", "content": [{"type": "input_text", "text": "what is the weather?"}]}, {"type": "reasoning", "id": "rs_123", "encrypted_content": "I need to call a tool for this...", "summary": []}, {"type": "function_call", "call_id": "call_abc", "name": "get_weather", "arguments": "{\"city\":\"Paris\"}"} ] }` var req ResponsesRequest if err := json.Unmarshal([]byte(reqJSON), &req); err != nil { t.Fatalf("failed to unmarshal request: %v", err) } chatReq, err := FromResponsesRequest(req) if err != nil { t.Fatalf("failed to convert request: %v", err) } // Should have 2 messages: user and assistant (with thinking + tool call) if len(chatReq.Messages) != 2 { t.Fatalf("expected 2 messages, got %d", len(chatReq.Messages)) } // Check assistant message has both tool call and thinking assistantMsg := chatReq.Messages[1] if assistantMsg.Role != "assistant" { t.Errorf("Messages[1].Role = %q, want %q", assistantMsg.Role, "assistant") } if assistantMsg.Thinking != "I need to call a tool for this..." { t.Errorf("Messages[1].Thinking = %q, want %q", assistantMsg.Thinking, "I need to call a tool for this...") } if len(assistantMsg.ToolCalls) != 1 { t.Fatalf("expected 1 tool call, got %d", len(assistantMsg.ToolCalls)) } if assistantMsg.ToolCalls[0].Function.Name != "get_weather" { t.Errorf("ToolCalls[0].Function.Name = %q, want %q", assistantMsg.ToolCalls[0].Function.Name, "get_weather") } }) t.Run("multi-turn conversation with reasoning", func(t *testing.T) { // Simulates: user asks -> model thinks + responds -> user follows up reqJSON := `{ "model": "qwen3", "input": [ {"type": "message", "role": "user", "content": [{"type": "input_text", "text": "What is 2+2?"}]}, {"type": "reasoning", "id": "rs_001", "encrypted_content": "This is a simple arithmetic problem. 2+2=4.", "summary": [{"type": "summary_text", "text": "Calculating 2+2"}]}, {"type": "message", "role": "assistant", "content": [{"type": "input_text", "text": "The answer is 4."}]}, {"type": "message", "role": "user", "content": [{"type": "input_text", "text": "Now multiply that by 3"}]} ] }` var req ResponsesRequest if err := json.Unmarshal([]byte(reqJSON), &req); err != nil { t.Fatalf("failed to unmarshal request: %v", err) } chatReq, err := FromResponsesRequest(req) if err != nil { t.Fatalf("failed to convert request: %v", err) } // Should have 3 messages: // 1. user: "What is 2+2?" // 2. assistant: thinking + "The answer is 4." // 3. user: "Now multiply that by 3" if len(chatReq.Messages) != 3 { t.Fatalf("expected 3 messages, got %d", len(chatReq.Messages)) } // Check first user message if chatReq.Messages[0].Role != "user" || chatReq.Messages[0].Content != "What is 2+2?" { t.Errorf("Messages[0] = {Role: %q, Content: %q}, want {Role: \"user\", Content: \"What is 2+2?\"}", chatReq.Messages[0].Role, chatReq.Messages[0].Content) } // Check assistant message has merged thinking + content if chatReq.Messages[1].Role != "assistant" { t.Errorf("Messages[1].Role = %q, want \"assistant\"", chatReq.Messages[1].Role) } if chatReq.Messages[1].Content != "The answer is 4." { t.Errorf("Messages[1].Content = %q, want \"The answer is 4.\"", chatReq.Messages[1].Content) } if chatReq.Messages[1].Thinking != "This is a simple arithmetic problem. 2+2=4." { t.Errorf("Messages[1].Thinking = %q, want \"This is a simple arithmetic problem. 2+2=4.\"", chatReq.Messages[1].Thinking) } // Check second user message if chatReq.Messages[2].Role != "user" || chatReq.Messages[2].Content != "Now multiply that by 3" { t.Errorf("Messages[2] = {Role: %q, Content: %q}, want {Role: \"user\", Content: \"Now multiply that by 3\"}", chatReq.Messages[2].Role, chatReq.Messages[2].Content) } }) t.Run("multi-turn with tool calls and reasoning", func(t *testing.T) { // Simulates: user asks -> model thinks + calls tool -> tool responds -> model thinks + responds -> user follows up reqJSON := `{ "model": "qwen3", "input": [ {"type": "message", "role": "user", "content": [{"type": "input_text", "text": "What is the weather in Paris?"}]}, {"type": "reasoning", "id": "rs_001", "encrypted_content": "I need to call the weather API for Paris.", "summary": []}, {"type": "function_call", "call_id": "call_abc", "name": "get_weather", "arguments": "{\"city\":\"Paris\"}"}, {"type": "function_call_output", "call_id": "call_abc", "output": "Sunny, 72°F"}, {"type": "reasoning", "id": "rs_002", "encrypted_content": "The weather API returned sunny and 72°F. I should format this nicely.", "summary": []}, {"type": "message", "role": "assistant", "content": [{"type": "input_text", "text": "It's sunny and 72°F in Paris!"}]}, {"type": "message", "role": "user", "content": [{"type": "input_text", "text": "What about London?"}]} ] }` var req ResponsesRequest if err := json.Unmarshal([]byte(reqJSON), &req); err != nil { t.Fatalf("failed to unmarshal request: %v", err) } chatReq, err := FromResponsesRequest(req) if err != nil { t.Fatalf("failed to convert request: %v", err) } // Should have 5 messages: // 1. user: "What is the weather in Paris?" // 2. assistant: thinking + tool call // 3. tool: "Sunny, 72°F" // 4. assistant: thinking + "It's sunny and 72°F in Paris!" // 5. user: "What about London?" if len(chatReq.Messages) != 5 { t.Fatalf("expected 5 messages, got %d", len(chatReq.Messages)) } // Message 1: user if chatReq.Messages[0].Role != "user" { t.Errorf("Messages[0].Role = %q, want \"user\"", chatReq.Messages[0].Role) } // Message 2: assistant with thinking + tool call if chatReq.Messages[1].Role != "assistant" { t.Errorf("Messages[1].Role = %q, want \"assistant\"", chatReq.Messages[1].Role) } if chatReq.Messages[1].Thinking != "I need to call the weather API for Paris." { t.Errorf("Messages[1].Thinking = %q, want \"I need to call the weather API for Paris.\"", chatReq.Messages[1].Thinking) } if len(chatReq.Messages[1].ToolCalls) != 1 || chatReq.Messages[1].ToolCalls[0].Function.Name != "get_weather" { t.Errorf("Messages[1].ToolCalls not as expected") } // Message 3: tool response if chatReq.Messages[2].Role != "tool" || chatReq.Messages[2].Content != "Sunny, 72°F" { t.Errorf("Messages[2] = {Role: %q, Content: %q}, want {Role: \"tool\", Content: \"Sunny, 72°F\"}", chatReq.Messages[2].Role, chatReq.Messages[2].Content) } // Message 4: assistant with thinking + content if chatReq.Messages[3].Role != "assistant" { t.Errorf("Messages[3].Role = %q, want \"assistant\"", chatReq.Messages[3].Role) } if chatReq.Messages[3].Thinking != "The weather API returned sunny and 72°F. I should format this nicely." { t.Errorf("Messages[3].Thinking = %q, want correct thinking", chatReq.Messages[3].Thinking) } if chatReq.Messages[3].Content != "It's sunny and 72°F in Paris!" { t.Errorf("Messages[3].Content = %q, want \"It's sunny and 72°F in Paris!\"", chatReq.Messages[3].Content) } // Message 5: user follow-up if chatReq.Messages[4].Role != "user" || chatReq.Messages[4].Content != "What about London?" { t.Errorf("Messages[4] = {Role: %q, Content: %q}, want {Role: \"user\", Content: \"What about London?\"}", chatReq.Messages[4].Role, chatReq.Messages[4].Content) } }) t.Run("trailing reasoning creates separate message", func(t *testing.T) { reqJSON := `{ "model": "qwen3", "input": [ {"type": "message", "role": "user", "content": [{"type": "input_text", "text": "think about this"}]}, {"type": "reasoning", "id": "rs_123", "encrypted_content": "Still thinking...", "summary": []} ] }` var req ResponsesRequest if err := json.Unmarshal([]byte(reqJSON), &req); err != nil { t.Fatalf("failed to unmarshal request: %v", err) } chatReq, err := FromResponsesRequest(req) if err != nil { t.Fatalf("failed to convert request: %v", err) } // Should have 2 messages: user and assistant (thinking only) if len(chatReq.Messages) != 2 { t.Fatalf("expected 2 messages, got %d", len(chatReq.Messages)) } // Check assistant message has only thinking assistantMsg := chatReq.Messages[1] if assistantMsg.Role != "assistant" { t.Errorf("Messages[1].Role = %q, want %q", assistantMsg.Role, "assistant") } if assistantMsg.Thinking != "Still thinking..." { t.Errorf("Messages[1].Thinking = %q, want %q", assistantMsg.Thinking, "Still thinking...") } if assistantMsg.Content != "" { t.Errorf("Messages[1].Content = %q, want empty", assistantMsg.Content) } }) } func TestToResponse_WithReasoning(t *testing.T) { response := ToResponse("gpt-oss:20b", "resp_123", "msg_456", api.ChatResponse{ CreatedAt: time.Now(), Message: api.Message{ Thinking: "Analyzing the question...", Content: "The answer is 42", }, Done: true, }) // Should have 2 output items: reasoning + message if len(response.Output) != 2 { t.Fatalf("expected 2 output items, got %d", len(response.Output)) } // First item should be reasoning if response.Output[0].Type != "reasoning" { t.Errorf("Output[0].Type = %q, want %q", response.Output[0].Type, "reasoning") } if len(response.Output[0].Summary) != 1 { t.Fatalf("expected 1 summary item, got %d", len(response.Output[0].Summary)) } if response.Output[0].Summary[0].Text != "Analyzing the question..." { t.Errorf("Summary[0].Text = %q, want %q", response.Output[0].Summary[0].Text, "Analyzing the question...") } if response.Output[0].EncryptedContent != "Analyzing the question..." { t.Errorf("EncryptedContent = %q, want %q", response.Output[0].EncryptedContent, "Analyzing the question...") } // Second item should be message if response.Output[1].Type != "message" { t.Errorf("Output[1].Type = %q, want %q", response.Output[1].Type, "message") } if response.Output[1].Content[0].Text != "The answer is 42" { t.Errorf("Content[0].Text = %q, want %q", response.Output[1].Content[0].Text, "The answer is 42") } } func TestFromResponsesRequest_Instructions(t *testing.T) { reqJSON := `{ "model": "gpt-oss:20b", "instructions": "You are a helpful pirate. Always respond in pirate speak.", "input": "Hello" }` var req ResponsesRequest if err := json.Unmarshal([]byte(reqJSON), &req); err != nil { t.Fatalf("failed to unmarshal request: %v", err) } chatReq, err := FromResponsesRequest(req) if err != nil { t.Fatalf("failed to convert request: %v", err) } // Should have 2 messages: system (instructions) + user if len(chatReq.Messages) != 2 { t.Fatalf("expected 2 messages, got %d", len(chatReq.Messages)) } // First message should be system with instructions if chatReq.Messages[0].Role != "system" { t.Errorf("Messages[0].Role = %q, want %q", chatReq.Messages[0].Role, "system") } if chatReq.Messages[0].Content != "You are a helpful pirate. Always respond in pirate speak." { t.Errorf("Messages[0].Content = %q, want instructions", chatReq.Messages[0].Content) } // Second message should be user if chatReq.Messages[1].Role != "user" { t.Errorf("Messages[1].Role = %q, want %q", chatReq.Messages[1].Role, "user") } if chatReq.Messages[1].Content != "Hello" { t.Errorf("Messages[1].Content = %q, want %q", chatReq.Messages[1].Content, "Hello") } } func TestFromResponsesRequest_MaxOutputTokens(t *testing.T) { reqJSON := `{ "model": "gpt-oss:20b", "input": "Write a story", "max_output_tokens": 100 }` var req ResponsesRequest if err := json.Unmarshal([]byte(reqJSON), &req); err != nil { t.Fatalf("failed to unmarshal request: %v", err) } chatReq, err := FromResponsesRequest(req) if err != nil { t.Fatalf("failed to convert request: %v", err) } // Check that num_predict is set in options numPredict, ok := chatReq.Options["num_predict"] if !ok { t.Fatal("expected num_predict in options") } if numPredict != 100 { t.Errorf("num_predict = %v, want 100", numPredict) } } func TestFromResponsesRequest_TextFormatJsonSchema(t *testing.T) { reqJSON := `{ "model": "gpt-oss:20b", "input": "Give me info about John who is 30", "text": { "format": { "type": "json_schema", "name": "person", "strict": true, "schema": { "type": "object", "properties": { "name": {"type": "string"}, "age": {"type": "integer"} }, "required": ["name", "age"] } } } }` var req ResponsesRequest if err := json.Unmarshal([]byte(reqJSON), &req); err != nil { t.Fatalf("failed to unmarshal request: %v", err) } // Verify the text format was parsed if req.Text == nil || req.Text.Format == nil { t.Fatal("expected Text.Format to be set") } if req.Text.Format.Type != "json_schema" { t.Errorf("Text.Format.Type = %q, want %q", req.Text.Format.Type, "json_schema") } chatReq, err := FromResponsesRequest(req) if err != nil { t.Fatalf("failed to convert request: %v", err) } // Check that Format is set if chatReq.Format == nil { t.Fatal("expected Format to be set") } // Verify the schema is passed through var schema map[string]any if err := json.Unmarshal(chatReq.Format, &schema); err != nil { t.Fatalf("failed to unmarshal format: %v", err) } if schema["type"] != "object" { t.Errorf("schema type = %v, want %q", schema["type"], "object") } props, ok := schema["properties"].(map[string]any) if !ok { t.Fatal("expected properties in schema") } if _, ok := props["name"]; !ok { t.Error("expected 'name' in schema properties") } if _, ok := props["age"]; !ok { t.Error("expected 'age' in schema properties") } } func TestFromResponsesRequest_TextFormatText(t *testing.T) { // When format type is "text", Format should be nil (no constraint) reqJSON := `{ "model": "gpt-oss:20b", "input": "Hello", "text": { "format": { "type": "text" } } }` var req ResponsesRequest if err := json.Unmarshal([]byte(reqJSON), &req); err != nil { t.Fatalf("failed to unmarshal request: %v", err) } chatReq, err := FromResponsesRequest(req) if err != nil { t.Fatalf("failed to convert request: %v", err) } // Format should be nil for "text" type if chatReq.Format != nil { t.Errorf("expected Format to be nil for text type, got %s", string(chatReq.Format)) } } func TestResponsesInputMessage_ShorthandFormats(t *testing.T) { t.Run("string content shorthand", func(t *testing.T) { // Content can be a plain string instead of an array of content items jsonStr := `{"type": "message", "role": "user", "content": "Hello world"}` var msg ResponsesInputMessage if err := json.Unmarshal([]byte(jsonStr), &msg); err != nil { t.Fatalf("unexpected error: %v", err) } if msg.Role != "user" { t.Errorf("Role = %q, want %q", msg.Role, "user") } if len(msg.Content) != 1 { t.Fatalf("len(Content) = %d, want 1", len(msg.Content)) } textContent, ok := msg.Content[0].(ResponsesTextContent) if !ok { t.Fatalf("Content[0] type = %T, want ResponsesTextContent", msg.Content[0]) } if textContent.Text != "Hello world" { t.Errorf("Content[0].Text = %q, want %q", textContent.Text, "Hello world") } if textContent.Type != "input_text" { t.Errorf("Content[0].Type = %q, want %q", textContent.Type, "input_text") } }) t.Run("output_text content type", func(t *testing.T) { // Previous assistant responses come back with output_text content type jsonStr := `{"type": "message", "role": "assistant", "content": [{"type": "output_text", "text": "I am an assistant"}]}` var msg ResponsesInputMessage if err := json.Unmarshal([]byte(jsonStr), &msg); err != nil { t.Fatalf("unexpected error: %v", err) } if msg.Role != "assistant" { t.Errorf("Role = %q, want %q", msg.Role, "assistant") } if len(msg.Content) != 1 { t.Fatalf("len(Content) = %d, want 1", len(msg.Content)) } outputContent, ok := msg.Content[0].(ResponsesOutputTextContent) if !ok { t.Fatalf("Content[0] type = %T, want ResponsesOutputTextContent", msg.Content[0]) } if outputContent.Text != "I am an assistant" { t.Errorf("Content[0].Text = %q, want %q", outputContent.Text, "I am an assistant") } }) } func TestUnmarshalResponsesInputItem_ShorthandMessage(t *testing.T) { t.Run("message without type field", func(t *testing.T) { // When type is omitted but role is present, treat as message jsonStr := `{"role": "user", "content": "Hello"}` item, err := unmarshalResponsesInputItem([]byte(jsonStr)) if err != nil { t.Fatalf("unexpected error: %v", err) } msg, ok := item.(ResponsesInputMessage) if !ok { t.Fatalf("got type %T, want ResponsesInputMessage", item) } if msg.Role != "user" { t.Errorf("Role = %q, want %q", msg.Role, "user") } if len(msg.Content) != 1 { t.Fatalf("len(Content) = %d, want 1", len(msg.Content)) } }) t.Run("message with both type and role", func(t *testing.T) { // Explicit type should still work jsonStr := `{"type": "message", "role": "system", "content": "You are helpful"}` item, err := unmarshalResponsesInputItem([]byte(jsonStr)) if err != nil { t.Fatalf("unexpected error: %v", err) } msg, ok := item.(ResponsesInputMessage) if !ok { t.Fatalf("got type %T, want ResponsesInputMessage", item) } if msg.Role != "system" { t.Errorf("Role = %q, want %q", msg.Role, "system") } }) } func TestFromResponsesRequest_ShorthandFormats(t *testing.T) { t.Run("shorthand message without type", func(t *testing.T) { // Real-world format from OpenAI SDK reqJSON := `{ "model": "gpt-4.1", "input": [ {"role": "user", "content": "What is the weather in Tokyo?"} ] }` var req ResponsesRequest if err := json.Unmarshal([]byte(reqJSON), &req); err != nil { t.Fatalf("failed to unmarshal request: %v", err) } if len(req.Input.Items) != 1 { t.Fatalf("expected 1 input item, got %d", len(req.Input.Items)) } msg, ok := req.Input.Items[0].(ResponsesInputMessage) if !ok { t.Fatalf("Input.Items[0] type = %T, want ResponsesInputMessage", req.Input.Items[0]) } if msg.Role != "user" { t.Errorf("Role = %q, want %q", msg.Role, "user") } chatReq, err := FromResponsesRequest(req) if err != nil { t.Fatalf("failed to convert request: %v", err) } if len(chatReq.Messages) != 1 { t.Fatalf("expected 1 message, got %d", len(chatReq.Messages)) } if chatReq.Messages[0].Content != "What is the weather in Tokyo?" { t.Errorf("Content = %q, want %q", chatReq.Messages[0].Content, "What is the weather in Tokyo?") } }) t.Run("conversation with output_text from previous response", func(t *testing.T) { // Simulates a multi-turn conversation where previous assistant response is sent back reqJSON := `{ "model": "gpt-4.1", "input": [ {"role": "user", "content": "Hello"}, {"type": "message", "role": "assistant", "content": [{"type": "output_text", "text": "Hi there!"}]}, {"role": "user", "content": "How are you?"} ] }` var req ResponsesRequest if err := json.Unmarshal([]byte(reqJSON), &req); err != nil { t.Fatalf("failed to unmarshal request: %v", err) } chatReq, err := FromResponsesRequest(req) if err != nil { t.Fatalf("failed to convert request: %v", err) } if len(chatReq.Messages) != 3 { t.Fatalf("expected 3 messages, got %d", len(chatReq.Messages)) } // Check first user message if chatReq.Messages[0].Role != "user" || chatReq.Messages[0].Content != "Hello" { t.Errorf("Messages[0] = {Role: %q, Content: %q}, want {Role: \"user\", Content: \"Hello\"}", chatReq.Messages[0].Role, chatReq.Messages[0].Content) } // Check assistant message (output_text should be converted to content) if chatReq.Messages[1].Role != "assistant" || chatReq.Messages[1].Content != "Hi there!" { t.Errorf("Messages[1] = {Role: %q, Content: %q}, want {Role: \"assistant\", Content: \"Hi there!\"}", chatReq.Messages[1].Role, chatReq.Messages[1].Content) } // Check second user message if chatReq.Messages[2].Role != "user" || chatReq.Messages[2].Content != "How are you?" { t.Errorf("Messages[2] = {Role: %q, Content: %q}, want {Role: \"user\", Content: \"How are you?\"}", chatReq.Messages[2].Role, chatReq.Messages[2].Content) } }) } func TestResponsesStreamConverter_OutputIncludesContent(t *testing.T) { // Verify that response.output_item.done includes content field for messages converter := NewResponsesStreamConverter("resp_123", "msg_456", "gpt-oss:20b") // First chunk converter.Process(api.ChatResponse{ Message: api.Message{Content: "Hello World"}, }) // Final chunk events := converter.Process(api.ChatResponse{ Message: api.Message{}, Done: true, }) // Find the output_item.done event var outputItemDone map[string]any for _, event := range events { if event.Event == "response.output_item.done" { outputItemDone = event.Data.(map[string]any) break } } if outputItemDone == nil { t.Fatal("expected response.output_item.done event") } item := outputItemDone["item"].(map[string]any) if item["type"] != "message" { t.Errorf("item.type = %q, want %q", item["type"], "message") } content, ok := item["content"].([]map[string]any) if !ok { t.Fatalf("item.content type = %T, want []map[string]any", item["content"]) } if len(content) != 1 { t.Fatalf("len(content) = %d, want 1", len(content)) } if content[0]["type"] != "output_text" { t.Errorf("content[0].type = %q, want %q", content[0]["type"], "output_text") } if content[0]["text"] != "Hello World" { t.Errorf("content[0].text = %q, want %q", content[0]["text"], "Hello World") } } func TestResponsesStreamConverter_ResponseCompletedIncludesOutput(t *testing.T) { // Verify that response.completed includes the output array converter := NewResponsesStreamConverter("resp_123", "msg_456", "gpt-oss:20b") // Process some content converter.Process(api.ChatResponse{ Message: api.Message{Content: "Test response"}, }) // Final chunk events := converter.Process(api.ChatResponse{ Message: api.Message{}, Done: true, }) // Find the response.completed event var responseCompleted map[string]any for _, event := range events { if event.Event == "response.completed" { responseCompleted = event.Data.(map[string]any) break } } if responseCompleted == nil { t.Fatal("expected response.completed event") } response := responseCompleted["response"].(map[string]any) output, ok := response["output"].([]any) if !ok { t.Fatalf("response.output type = %T, want []any", response["output"]) } if len(output) != 1 { t.Fatalf("len(output) = %d, want 1", len(output)) } item := output[0].(map[string]any) if item["type"] != "message" { t.Errorf("output[0].type = %q, want %q", item["type"], "message") } } func TestResponsesStreamConverter_ResponseCreatedIncludesOutput(t *testing.T) { // Verify that response.created includes an empty output array converter := NewResponsesStreamConverter("resp_123", "msg_456", "gpt-oss:20b") events := converter.Process(api.ChatResponse{ Message: api.Message{Content: "Hi"}, }) // First event should be response.created if events[0].Event != "response.created" { t.Fatalf("events[0].Event = %q, want %q", events[0].Event, "response.created") } data := events[0].Data.(map[string]any) response := data["response"].(map[string]any) output, ok := response["output"].([]any) if !ok { t.Fatalf("response.output type = %T, want []any", response["output"]) } // Should be empty array initially if len(output) != 0 { t.Errorf("len(output) = %d, want 0", len(output)) } } func TestResponsesStreamConverter_SequenceNumbers(t *testing.T) { // Verify that events include incrementing sequence numbers converter := NewResponsesStreamConverter("resp_123", "msg_456", "gpt-oss:20b") events := converter.Process(api.ChatResponse{ Message: api.Message{Content: "Hello"}, }) for i, event := range events { data := event.Data.(map[string]any) seqNum, ok := data["sequence_number"].(int) if !ok { t.Fatalf("events[%d] missing sequence_number", i) } if seqNum != i { t.Errorf("events[%d].sequence_number = %d, want %d", i, seqNum, i) } } // Process more content, sequence should continue moreEvents := converter.Process(api.ChatResponse{ Message: api.Message{Content: " World"}, }) expectedSeq := len(events) for i, event := range moreEvents { data := event.Data.(map[string]any) seqNum := data["sequence_number"].(int) if seqNum != expectedSeq+i { t.Errorf("moreEvents[%d].sequence_number = %d, want %d", i, seqNum, expectedSeq+i) } } } func TestResponsesStreamConverter_FunctionCallStatus(t *testing.T) { // Verify that function call items include status field converter := NewResponsesStreamConverter("resp_123", "msg_456", "gpt-oss:20b") events := converter.Process(api.ChatResponse{ Message: api.Message{ ToolCalls: []api.ToolCall{ { ID: "call_abc", Function: api.ToolCallFunction{ Name: "get_weather", Arguments: api.ToolCallFunctionArguments{"city": "Paris"}, }, }, }, }, }) // Find output_item.added event var addedItem map[string]any var doneItem map[string]any for _, event := range events { data := event.Data.(map[string]any) if data["type"] == "response.output_item.added" { item := data["item"].(map[string]any) if item["type"] == "function_call" { addedItem = item } } if data["type"] == "response.output_item.done" { item := data["item"].(map[string]any) if item["type"] == "function_call" { doneItem = item } } } if addedItem == nil { t.Fatal("expected function_call output_item.added event") } if addedItem["status"] != "in_progress" { t.Errorf("output_item.added status = %q, want %q", addedItem["status"], "in_progress") } if doneItem == nil { t.Fatal("expected function_call output_item.done event") } if doneItem["status"] != "completed" { t.Errorf("output_item.done status = %q, want %q", doneItem["status"], "completed") } }