first commit

2026-04-26 21:52:23 +03:00
commit 880f412e2c
2662 changed files with 866266 additions and 0 deletions
--- a/core/internal/llmtests/automatic_function_calling.go
+++ b/core/internal/llmtests/automatic_function_calling.go
@@ -0,0 +1,182 @@
+package llmtests
+
+import (
+	"context"
+	"os"
+	"strings"
+	"testing"
+
+	bifrost "github.com/maximhq/bifrost/core"
+	"github.com/maximhq/bifrost/core/schemas"
+)
+
+// RunAutomaticFunctionCallingTest executes the automatic function calling test scenario using dual API testing framework
+func RunAutomaticFunctionCallingTest(t *testing.T, client *bifrost.Bifrost, ctx context.Context, testConfig ComprehensiveTestConfig) {
+	if !testConfig.Scenarios.AutomaticFunctionCall {
+		t.Logf("Automatic function calling not supported for provider %s", testConfig.Provider)
+		return
+	}
+
+	t.Run("AutomaticFunctionCalling", func(t *testing.T) {
+		if os.Getenv("SKIP_PARALLEL_TESTS") != "true" {
+			t.Parallel()
+		}
+
+		chatMessages := []schemas.ChatMessage{
+			CreateBasicChatMessage("Get the current time in UTC timezone"),
+		}
+		responsesMessages := []schemas.ResponsesMessage{
+			CreateBasicResponsesMessage("Get the current time in UTC timezone"),
+		}
+
+		// Get tools for both APIs using the new GetSampleTool function
+		chatTool := GetSampleChatTool(SampleToolTypeTime) // Chat Completions API
+		if chatTool == nil {
+			t.Fatalf("GetSampleChatTool returned nil for SampleToolTypeTime")
+		}
+
+		responsesTool := GetSampleResponsesTool(SampleToolTypeTime) // Responses API
+		if responsesTool == nil {
+			t.Fatalf("GetSampleResponsesTool returned nil for SampleToolTypeTime")
+		}
+
+		// Use specialized tool call retry configuration
+		retryConfig := ToolCallRetryConfig(string(SampleToolTypeTime))
+		retryContext := TestRetryContext{
+			ScenarioName: "AutomaticFunctionCalling",
+			ExpectedBehavior: map[string]interface{}{
+				"expected_tool_name": string(SampleToolTypeTime),
+				"is_forced_call":     true,
+				"timezone":           "UTC",
+			},
+			TestMetadata: map[string]interface{}{
+				"provider":    testConfig.Provider,
+				"model":       testConfig.ChatModel,
+				"tool_choice": "forced",
+			},
+		}
+
+		// Enhanced tool call validation for automatic/forced function calls (same for both APIs)
+		expectations := ToolCallExpectations(string(SampleToolTypeTime), []string{"timezone"})
+		expectations = ModifyExpectationsForProvider(expectations, testConfig.Provider)
+		expectations.ExpectedToolCalls[0].ArgumentTypes = map[string]string{
+			"timezone": "string",
+		}
+
+		// Create operations for both Chat Completions and Responses API
+		chatOperation := func() (*schemas.BifrostChatResponse, *schemas.BifrostError) {
+			bfCtx := schemas.NewBifrostContext(ctx, schemas.NoDeadline)
+			chatReq := &schemas.BifrostChatRequest{
+				Provider: testConfig.Provider,
+				Model:    testConfig.ChatModel,
+				Input:    chatMessages,
+				Params: &schemas.ChatParameters{
+					Tools: []schemas.ChatTool{
+						*chatTool,
+					},
+					ToolChoice: &schemas.ChatToolChoice{
+						ChatToolChoiceStruct: &schemas.ChatToolChoiceStruct{
+							Type: schemas.ChatToolChoiceTypeFunction,
+							Function: &schemas.ChatToolChoiceFunction{
+								Name: string(SampleToolTypeTime),
+							},
+						},
+					},
+				},
+				Fallbacks: testConfig.Fallbacks,
+			}
+
+			return client.ChatCompletionRequest(bfCtx, chatReq)
+		}
+
+		responsesOperation := func() (*schemas.BifrostResponsesResponse, *schemas.BifrostError) {
+			bfCtx := schemas.NewBifrostContext(ctx, schemas.NoDeadline)
+			responsesReq := &schemas.BifrostResponsesRequest{
+				Provider: testConfig.Provider,
+				Model:    testConfig.ChatModel,
+				Input:    responsesMessages,
+				Params: &schemas.ResponsesParameters{
+					Tools: []schemas.ResponsesTool{
+						*responsesTool,
+					},
+					ToolChoice: &schemas.ResponsesToolChoice{
+						ResponsesToolChoiceStruct: &schemas.ResponsesToolChoiceStruct{
+							Type: schemas.ResponsesToolChoiceTypeFunction,
+							Name: bifrost.Ptr(string(SampleToolTypeTime)),
+						},
+					},
+				},
+				Fallbacks: testConfig.Fallbacks,
+			}
+
+			return client.ResponsesRequest(bfCtx, responsesReq)
+		}
+
+		// Execute dual API test - passes only if BOTH APIs succeed
+		result := WithDualAPITestRetry(t,
+			retryConfig,
+			retryContext,
+			expectations,
+			"AutomaticFunctionCalling",
+			chatOperation,
+			responsesOperation)
+
+		// Validate both APIs succeeded
+		if !result.BothSucceeded {
+			var errors []string
+			if result.ChatCompletionsError != nil {
+				errors = append(errors, "Chat Completions: "+GetErrorMessage(result.ChatCompletionsError))
+			}
+			if result.ResponsesAPIError != nil {
+				errors = append(errors, "Responses API: "+GetErrorMessage(result.ResponsesAPIError))
+			}
+			if len(errors) == 0 {
+				errors = append(errors, "One or both APIs failed validation (see logs above)")
+			}
+			t.Fatalf("❌ AutomaticFunctionCalling dual API test failed: %v", errors)
+		}
+
+		// Additional validation specific to automatic function calling using universal tool extraction
+		validateChatAutomaticToolCall := func(response *schemas.BifrostChatResponse, apiName string) {
+			toolCalls := ExtractChatToolCalls(response)
+			validateAutomaticToolCall(t, toolCalls, apiName)
+		}
+
+		validateResponsesAutomaticToolCall := func(response *schemas.BifrostResponsesResponse, apiName string) {
+			toolCalls := ExtractResponsesToolCalls(response)
+			validateAutomaticToolCall(t, toolCalls, apiName)
+		}
+
+		// Validate both API responses
+		if result.ChatCompletionsResponse != nil {
+			validateChatAutomaticToolCall(result.ChatCompletionsResponse, "Chat Completions")
+		}
+
+		if result.ResponsesAPIResponse != nil {
+			validateResponsesAutomaticToolCall(result.ResponsesAPIResponse, "Responses")
+		}
+
+		t.Logf("🎉 Both Chat Completions and Responses APIs passed AutomaticFunctionCalling test!")
+	})
+}
+
+func validateAutomaticToolCall(t *testing.T, toolCalls []ToolCallInfo, apiName string) {
+	// Validation for tool call already happened inside WithDualAPITestRetry
+	// If we reach here, the tool call was successful
+	// This function just provides additional logging for tool call details
+	
+	for _, toolCall := range toolCalls {
+		if toolCall.Name == string(SampleToolTypeTime) {
+			t.Logf("✅ %s automatic function call: %s", apiName, toolCall.Arguments)
+
+			// Additional validation for timezone argument
+			lowerArgs := strings.ToLower(toolCall.Arguments)
+			if strings.Contains(lowerArgs, "utc") || strings.Contains(lowerArgs, "timezone") {
+				t.Logf("✅ %s tool call correctly includes timezone information", apiName)
+			} else {
+				t.Logf("⚠️ %s tool call may be missing timezone specification: %s", apiName, toolCall.Arguments)
+			}
+			break
+		}
+	}
+}