diff --git a/internal/translator/antigravity/claude/antigravity_claude_request.go b/internal/translator/antigravity/claude/antigravity_claude_request.go index 448aa976..b634436d 100644 --- a/internal/translator/antigravity/claude/antigravity_claude_request.go +++ b/internal/translator/antigravity/claude/antigravity_claude_request.go @@ -223,14 +223,65 @@ func ConvertClaudeRequestToAntigravity(modelName string, inputRawJSON []byte, _ functionResponseJSON, _ = sjson.Set(functionResponseJSON, "response.result", responseData) } else if functionResponseResult.IsArray() { frResults := functionResponseResult.Array() - if len(frResults) == 1 { - functionResponseJSON, _ = sjson.SetRaw(functionResponseJSON, "response.result", frResults[0].Raw) + nonImageCount := 0 + lastNonImageRaw := "" + filteredJSON := "[]" + imagePartsJSON := "[]" + for _, fr := range frResults { + if fr.Get("type").String() == "image" && fr.Get("source.type").String() == "base64" { + inlineDataJSON := `{}` + if mimeType := fr.Get("source.media_type").String(); mimeType != "" { + inlineDataJSON, _ = sjson.Set(inlineDataJSON, "mimeType", mimeType) + } + if data := fr.Get("source.data").String(); data != "" { + inlineDataJSON, _ = sjson.Set(inlineDataJSON, "data", data) + } + + imagePartJSON := `{}` + imagePartJSON, _ = sjson.SetRaw(imagePartJSON, "inlineData", inlineDataJSON) + imagePartsJSON, _ = sjson.SetRaw(imagePartsJSON, "-1", imagePartJSON) + continue + } + + nonImageCount++ + lastNonImageRaw = fr.Raw + filteredJSON, _ = sjson.SetRaw(filteredJSON, "-1", fr.Raw) + } + + if nonImageCount == 1 { + functionResponseJSON, _ = sjson.SetRaw(functionResponseJSON, "response.result", lastNonImageRaw) + } else if nonImageCount > 1 { + functionResponseJSON, _ = sjson.SetRaw(functionResponseJSON, "response.result", filteredJSON) } else { - functionResponseJSON, _ = sjson.SetRaw(functionResponseJSON, "response.result", functionResponseResult.Raw) + functionResponseJSON, _ = sjson.Set(functionResponseJSON, "response.result", "") + } + + // Place image data inside functionResponse.parts as inlineData + // instead of as sibling parts in the outer content, to avoid + // base64 data bloating the text context. + if gjson.Get(imagePartsJSON, "#").Int() > 0 { + functionResponseJSON, _ = sjson.SetRaw(functionResponseJSON, "parts", imagePartsJSON) } } else if functionResponseResult.IsObject() { - functionResponseJSON, _ = sjson.SetRaw(functionResponseJSON, "response.result", functionResponseResult.Raw) + if functionResponseResult.Get("type").String() == "image" && functionResponseResult.Get("source.type").String() == "base64" { + inlineDataJSON := `{}` + if mimeType := functionResponseResult.Get("source.media_type").String(); mimeType != "" { + inlineDataJSON, _ = sjson.Set(inlineDataJSON, "mimeType", mimeType) + } + if data := functionResponseResult.Get("source.data").String(); data != "" { + inlineDataJSON, _ = sjson.Set(inlineDataJSON, "data", data) + } + + imagePartJSON := `{}` + imagePartJSON, _ = sjson.SetRaw(imagePartJSON, "inlineData", inlineDataJSON) + imagePartsJSON := "[]" + imagePartsJSON, _ = sjson.SetRaw(imagePartsJSON, "-1", imagePartJSON) + functionResponseJSON, _ = sjson.SetRaw(functionResponseJSON, "parts", imagePartsJSON) + functionResponseJSON, _ = sjson.Set(functionResponseJSON, "response.result", "") + } else { + functionResponseJSON, _ = sjson.SetRaw(functionResponseJSON, "response.result", functionResponseResult.Raw) + } } else if functionResponseResult.Raw != "" { functionResponseJSON, _ = sjson.SetRaw(functionResponseJSON, "response.result", functionResponseResult.Raw) } else { @@ -248,7 +299,7 @@ func ConvertClaudeRequestToAntigravity(modelName string, inputRawJSON []byte, _ if sourceResult.Get("type").String() == "base64" { inlineDataJSON := `{}` if mimeType := sourceResult.Get("media_type").String(); mimeType != "" { - inlineDataJSON, _ = sjson.Set(inlineDataJSON, "mime_type", mimeType) + inlineDataJSON, _ = sjson.Set(inlineDataJSON, "mimeType", mimeType) } if data := sourceResult.Get("data").String(); data != "" { inlineDataJSON, _ = sjson.Set(inlineDataJSON, "data", data) diff --git a/internal/translator/antigravity/claude/antigravity_claude_request_test.go b/internal/translator/antigravity/claude/antigravity_claude_request_test.go index c28a14ec..865db668 100644 --- a/internal/translator/antigravity/claude/antigravity_claude_request_test.go +++ b/internal/translator/antigravity/claude/antigravity_claude_request_test.go @@ -413,8 +413,8 @@ func TestConvertClaudeRequestToAntigravity_ImageContent(t *testing.T) { if !inlineData.Exists() { t.Error("inlineData should exist") } - if inlineData.Get("mime_type").String() != "image/png" { - t.Error("mime_type mismatch") + if inlineData.Get("mimeType").String() != "image/png" { + t.Error("mimeType mismatch") } if !strings.Contains(inlineData.Get("data").String(), "iVBORw0KGgo") { t.Error("data mismatch") @@ -740,6 +740,429 @@ func TestConvertClaudeRequestToAntigravity_ToolResultNullContent(t *testing.T) { } } +func TestConvertClaudeRequestToAntigravity_ToolResultWithImage(t *testing.T) { + // tool_result with array content containing text + image should place + // image data inside functionResponse.parts as inlineData, not as a + // sibling part in the outer content (to avoid base64 context bloat). + inputJSON := []byte(`{ + "model": "claude-3-5-sonnet-20240620", + "messages": [ + { + "role": "user", + "content": [ + { + "type": "tool_result", + "tool_use_id": "Read-123-456", + "content": [ + { + "type": "text", + "text": "File content here" + }, + { + "type": "image", + "source": { + "type": "base64", + "media_type": "image/png", + "data": "iVBORw0KGgoAAAANSUhEUg==" + } + } + ] + } + ] + } + ] + }`) + + output := ConvertClaudeRequestToAntigravity("claude-sonnet-4-5", inputJSON, false) + outputStr := string(output) + + if !gjson.Valid(outputStr) { + t.Fatalf("Result is not valid JSON:\n%s", outputStr) + } + + // Image should be inside functionResponse.parts, not as outer sibling part + funcResp := gjson.Get(outputStr, "request.contents.0.parts.0.functionResponse") + if !funcResp.Exists() { + t.Fatal("functionResponse should exist") + } + + // Text content should be in response.result + resultText := funcResp.Get("response.result.text").String() + if resultText != "File content here" { + t.Errorf("Expected response.result.text = 'File content here', got '%s'", resultText) + } + + // Image should be in functionResponse.parts[0].inlineData + inlineData := funcResp.Get("parts.0.inlineData") + if !inlineData.Exists() { + t.Fatal("functionResponse.parts[0].inlineData should exist") + } + if inlineData.Get("mimeType").String() != "image/png" { + t.Errorf("Expected mimeType 'image/png', got '%s'", inlineData.Get("mimeType").String()) + } + if !strings.Contains(inlineData.Get("data").String(), "iVBORw0KGgo") { + t.Error("data mismatch") + } + + // Image should NOT be in outer parts (only functionResponse part should exist) + outerParts := gjson.Get(outputStr, "request.contents.0.parts") + if outerParts.IsArray() && len(outerParts.Array()) > 1 { + t.Errorf("Expected only 1 outer part (functionResponse), got %d", len(outerParts.Array())) + } +} + +func TestConvertClaudeRequestToAntigravity_ToolResultWithSingleImage(t *testing.T) { + // tool_result with single image object as content should place + // image data inside functionResponse.parts, not as outer sibling part. + inputJSON := []byte(`{ + "model": "claude-3-5-sonnet-20240620", + "messages": [ + { + "role": "user", + "content": [ + { + "type": "tool_result", + "tool_use_id": "Read-789-012", + "content": { + "type": "image", + "source": { + "type": "base64", + "media_type": "image/jpeg", + "data": "/9j/4AAQSkZJRgABAQ==" + } + } + } + ] + } + ] + }`) + + output := ConvertClaudeRequestToAntigravity("claude-sonnet-4-5", inputJSON, false) + outputStr := string(output) + + if !gjson.Valid(outputStr) { + t.Fatalf("Result is not valid JSON:\n%s", outputStr) + } + + funcResp := gjson.Get(outputStr, "request.contents.0.parts.0.functionResponse") + if !funcResp.Exists() { + t.Fatal("functionResponse should exist") + } + + // response.result should be empty (image only) + if funcResp.Get("response.result").String() != "" { + t.Errorf("Expected empty response.result for image-only content, got '%s'", funcResp.Get("response.result").String()) + } + + // Image should be in functionResponse.parts[0].inlineData + inlineData := funcResp.Get("parts.0.inlineData") + if !inlineData.Exists() { + t.Fatal("functionResponse.parts[0].inlineData should exist") + } + if inlineData.Get("mimeType").String() != "image/jpeg" { + t.Errorf("Expected mimeType 'image/jpeg', got '%s'", inlineData.Get("mimeType").String()) + } + + // Image should NOT be in outer parts + outerParts := gjson.Get(outputStr, "request.contents.0.parts") + if outerParts.IsArray() && len(outerParts.Array()) > 1 { + t.Errorf("Expected only 1 outer part, got %d", len(outerParts.Array())) + } +} + +func TestConvertClaudeRequestToAntigravity_ToolResultWithMultipleImagesAndTexts(t *testing.T) { + // tool_result with array content: 2 text items + 2 images + // All images go into functionResponse.parts, texts into response.result array + inputJSON := []byte(`{ + "model": "claude-3-5-sonnet-20240620", + "messages": [ + { + "role": "user", + "content": [ + { + "type": "tool_result", + "tool_use_id": "Multi-001", + "content": [ + {"type": "text", "text": "First text"}, + { + "type": "image", + "source": {"type": "base64", "media_type": "image/png", "data": "AAAA"} + }, + {"type": "text", "text": "Second text"}, + { + "type": "image", + "source": {"type": "base64", "media_type": "image/jpeg", "data": "BBBB"} + } + ] + } + ] + } + ] + }`) + + output := ConvertClaudeRequestToAntigravity("claude-sonnet-4-5", inputJSON, false) + outputStr := string(output) + + if !gjson.Valid(outputStr) { + t.Fatalf("Result is not valid JSON:\n%s", outputStr) + } + + funcResp := gjson.Get(outputStr, "request.contents.0.parts.0.functionResponse") + if !funcResp.Exists() { + t.Fatal("functionResponse should exist") + } + + // Multiple text items => response.result is an array + resultArr := funcResp.Get("response.result") + if !resultArr.IsArray() { + t.Fatalf("Expected response.result to be an array, got: %s", resultArr.Raw) + } + results := resultArr.Array() + if len(results) != 2 { + t.Fatalf("Expected 2 result items, got %d", len(results)) + } + + // Both images should be in functionResponse.parts + imgParts := funcResp.Get("parts").Array() + if len(imgParts) != 2 { + t.Fatalf("Expected 2 image parts in functionResponse.parts, got %d", len(imgParts)) + } + if imgParts[0].Get("inlineData.mimeType").String() != "image/png" { + t.Errorf("Expected first image mimeType 'image/png', got '%s'", imgParts[0].Get("inlineData.mimeType").String()) + } + if imgParts[0].Get("inlineData.data").String() != "AAAA" { + t.Errorf("Expected first image data 'AAAA', got '%s'", imgParts[0].Get("inlineData.data").String()) + } + if imgParts[1].Get("inlineData.mimeType").String() != "image/jpeg" { + t.Errorf("Expected second image mimeType 'image/jpeg', got '%s'", imgParts[1].Get("inlineData.mimeType").String()) + } + if imgParts[1].Get("inlineData.data").String() != "BBBB" { + t.Errorf("Expected second image data 'BBBB', got '%s'", imgParts[1].Get("inlineData.data").String()) + } + + // Only 1 outer part (the functionResponse itself) + outerParts := gjson.Get(outputStr, "request.contents.0.parts").Array() + if len(outerParts) != 1 { + t.Errorf("Expected 1 outer part, got %d", len(outerParts)) + } +} + +func TestConvertClaudeRequestToAntigravity_ToolResultWithOnlyMultipleImages(t *testing.T) { + // tool_result with only images (no text) — response.result should be empty string + inputJSON := []byte(`{ + "model": "claude-3-5-sonnet-20240620", + "messages": [ + { + "role": "user", + "content": [ + { + "type": "tool_result", + "tool_use_id": "ImgOnly-001", + "content": [ + { + "type": "image", + "source": {"type": "base64", "media_type": "image/png", "data": "PNG1"} + }, + { + "type": "image", + "source": {"type": "base64", "media_type": "image/gif", "data": "GIF1"} + } + ] + } + ] + } + ] + }`) + + output := ConvertClaudeRequestToAntigravity("claude-sonnet-4-5", inputJSON, false) + outputStr := string(output) + + if !gjson.Valid(outputStr) { + t.Fatalf("Result is not valid JSON:\n%s", outputStr) + } + + funcResp := gjson.Get(outputStr, "request.contents.0.parts.0.functionResponse") + if !funcResp.Exists() { + t.Fatal("functionResponse should exist") + } + + // No text => response.result should be empty string + if funcResp.Get("response.result").String() != "" { + t.Errorf("Expected empty response.result, got '%s'", funcResp.Get("response.result").String()) + } + + // Both images in functionResponse.parts + imgParts := funcResp.Get("parts").Array() + if len(imgParts) != 2 { + t.Fatalf("Expected 2 image parts, got %d", len(imgParts)) + } + if imgParts[0].Get("inlineData.mimeType").String() != "image/png" { + t.Error("first image mimeType mismatch") + } + if imgParts[1].Get("inlineData.mimeType").String() != "image/gif" { + t.Error("second image mimeType mismatch") + } + + // Only 1 outer part + outerParts := gjson.Get(outputStr, "request.contents.0.parts").Array() + if len(outerParts) != 1 { + t.Errorf("Expected 1 outer part, got %d", len(outerParts)) + } +} + +func TestConvertClaudeRequestToAntigravity_ToolResultImageNotBase64(t *testing.T) { + // image with source.type != "base64" should be treated as non-image (falls through) + inputJSON := []byte(`{ + "model": "claude-3-5-sonnet-20240620", + "messages": [ + { + "role": "user", + "content": [ + { + "type": "tool_result", + "tool_use_id": "NotB64-001", + "content": [ + {"type": "text", "text": "some output"}, + { + "type": "image", + "source": {"type": "url", "url": "https://example.com/img.png"} + } + ] + } + ] + } + ] + }`) + + output := ConvertClaudeRequestToAntigravity("claude-sonnet-4-5", inputJSON, false) + outputStr := string(output) + + if !gjson.Valid(outputStr) { + t.Fatalf("Result is not valid JSON:\n%s", outputStr) + } + + funcResp := gjson.Get(outputStr, "request.contents.0.parts.0.functionResponse") + if !funcResp.Exists() { + t.Fatal("functionResponse should exist") + } + + // Non-base64 image is treated as non-image, so it goes into the filtered results + // along with the text item. Since there are 2 non-image items, result is array. + resultArr := funcResp.Get("response.result") + if !resultArr.IsArray() { + t.Fatalf("Expected response.result to be an array (2 non-image items), got: %s", resultArr.Raw) + } + results := resultArr.Array() + if len(results) != 2 { + t.Fatalf("Expected 2 result items, got %d", len(results)) + } + + // No functionResponse.parts (no base64 images collected) + if funcResp.Get("parts").Exists() { + t.Error("functionResponse.parts should NOT exist when no base64 images") + } +} + +func TestConvertClaudeRequestToAntigravity_ToolResultImageMissingData(t *testing.T) { + // image with source.type=base64 but missing data field + inputJSON := []byte(`{ + "model": "claude-3-5-sonnet-20240620", + "messages": [ + { + "role": "user", + "content": [ + { + "type": "tool_result", + "tool_use_id": "NoData-001", + "content": [ + {"type": "text", "text": "output"}, + { + "type": "image", + "source": {"type": "base64", "media_type": "image/png"} + } + ] + } + ] + } + ] + }`) + + output := ConvertClaudeRequestToAntigravity("claude-sonnet-4-5", inputJSON, false) + outputStr := string(output) + + if !gjson.Valid(outputStr) { + t.Fatalf("Result is not valid JSON:\n%s", outputStr) + } + + funcResp := gjson.Get(outputStr, "request.contents.0.parts.0.functionResponse") + if !funcResp.Exists() { + t.Fatal("functionResponse should exist") + } + + // The image is still classified as base64 image (type check passes), + // but data field is missing => inlineData has mimeType but no data + imgParts := funcResp.Get("parts").Array() + if len(imgParts) != 1 { + t.Fatalf("Expected 1 image part, got %d", len(imgParts)) + } + if imgParts[0].Get("inlineData.mimeType").String() != "image/png" { + t.Error("mimeType should still be set") + } + if imgParts[0].Get("inlineData.data").Exists() { + t.Error("data should not exist when source.data is missing") + } +} + +func TestConvertClaudeRequestToAntigravity_ToolResultImageMissingMediaType(t *testing.T) { + // image with source.type=base64 but missing media_type field + inputJSON := []byte(`{ + "model": "claude-3-5-sonnet-20240620", + "messages": [ + { + "role": "user", + "content": [ + { + "type": "tool_result", + "tool_use_id": "NoMime-001", + "content": [ + {"type": "text", "text": "output"}, + { + "type": "image", + "source": {"type": "base64", "data": "AAAA"} + } + ] + } + ] + } + ] + }`) + + output := ConvertClaudeRequestToAntigravity("claude-sonnet-4-5", inputJSON, false) + outputStr := string(output) + + if !gjson.Valid(outputStr) { + t.Fatalf("Result is not valid JSON:\n%s", outputStr) + } + + funcResp := gjson.Get(outputStr, "request.contents.0.parts.0.functionResponse") + if !funcResp.Exists() { + t.Fatal("functionResponse should exist") + } + + // The image is still classified as base64 image, + // but media_type is missing => inlineData has data but no mimeType + imgParts := funcResp.Get("parts").Array() + if len(imgParts) != 1 { + t.Fatalf("Expected 1 image part, got %d", len(imgParts)) + } + if imgParts[0].Get("inlineData.mimeType").Exists() { + t.Error("mimeType should not exist when media_type is missing") + } + if imgParts[0].Get("inlineData.data").String() != "AAAA" { + t.Error("data should still be set") + } +} + func TestConvertClaudeRequestToAntigravity_ToolAndThinking_NoExistingSystem(t *testing.T) { // When tools + thinking but no system instruction, should create one with hint inputJSON := []byte(`{ diff --git a/internal/translator/antigravity/gemini/antigravity_gemini_request_test.go b/internal/translator/antigravity/gemini/antigravity_gemini_request_test.go index 8867a30e..da581d1a 100644 --- a/internal/translator/antigravity/gemini/antigravity_gemini_request_test.go +++ b/internal/translator/antigravity/gemini/antigravity_gemini_request_test.go @@ -93,3 +93,81 @@ func TestConvertGeminiRequestToAntigravity_ParallelFunctionCalls(t *testing.T) { } } } + +func TestFixCLIToolResponse_PreservesFunctionResponseParts(t *testing.T) { + // When functionResponse contains a "parts" field with inlineData (from Claude + // translator's image embedding), fixCLIToolResponse should preserve it as-is. + // parseFunctionResponseRaw returns response.Raw for valid JSON objects, + // so extra fields like "parts" survive the pipeline. + input := `{ + "model": "claude-opus-4-6-thinking", + "request": { + "contents": [ + { + "role": "model", + "parts": [ + { + "functionCall": {"name": "screenshot", "args": {}} + } + ] + }, + { + "role": "function", + "parts": [ + { + "functionResponse": { + "id": "tool-001", + "name": "screenshot", + "response": {"result": "Screenshot taken"}, + "parts": [ + {"inlineData": {"mimeType": "image/png", "data": "iVBOR"}} + ] + } + } + ] + } + ] + } + }` + + result, err := fixCLIToolResponse(input) + if err != nil { + t.Fatalf("fixCLIToolResponse failed: %v", err) + } + + // Find the function response content (role=function) + contents := gjson.Get(result, "request.contents").Array() + var funcContent gjson.Result + for _, c := range contents { + if c.Get("role").String() == "function" { + funcContent = c + break + } + } + if !funcContent.Exists() { + t.Fatal("function role content should exist in output") + } + + // The functionResponse should be preserved with its parts field + funcResp := funcContent.Get("parts.0.functionResponse") + if !funcResp.Exists() { + t.Fatal("functionResponse should exist in output") + } + + // Verify the parts field with inlineData is preserved + inlineParts := funcResp.Get("parts").Array() + if len(inlineParts) != 1 { + t.Fatalf("Expected 1 inlineData part in functionResponse.parts, got %d", len(inlineParts)) + } + if inlineParts[0].Get("inlineData.mimeType").String() != "image/png" { + t.Errorf("Expected mimeType 'image/png', got '%s'", inlineParts[0].Get("inlineData.mimeType").String()) + } + if inlineParts[0].Get("inlineData.data").String() != "iVBOR" { + t.Errorf("Expected data 'iVBOR', got '%s'", inlineParts[0].Get("inlineData.data").String()) + } + + // Verify response.result is also preserved + if funcResp.Get("response.result").String() != "Screenshot taken" { + t.Errorf("Expected response.result 'Screenshot taken', got '%s'", funcResp.Get("response.result").String()) + } +} diff --git a/internal/translator/antigravity/openai/chat-completions/antigravity_openai_request.go b/internal/translator/antigravity/openai/chat-completions/antigravity_openai_request.go index a8105c4e..85b28b8b 100644 --- a/internal/translator/antigravity/openai/chat-completions/antigravity_openai_request.go +++ b/internal/translator/antigravity/openai/chat-completions/antigravity_openai_request.go @@ -187,7 +187,7 @@ func ConvertOpenAIRequestToAntigravity(modelName string, inputRawJSON []byte, _ if len(pieces) == 2 && len(pieces[1]) > 7 { mime := pieces[0] data := pieces[1][7:] - node, _ = sjson.SetBytes(node, "parts."+itoa(p)+".inlineData.mime_type", mime) + node, _ = sjson.SetBytes(node, "parts."+itoa(p)+".inlineData.mimeType", mime) node, _ = sjson.SetBytes(node, "parts."+itoa(p)+".inlineData.data", data) node, _ = sjson.SetBytes(node, "parts."+itoa(p)+".thoughtSignature", geminiCLIFunctionThoughtSignature) p++ @@ -201,7 +201,7 @@ func ConvertOpenAIRequestToAntigravity(modelName string, inputRawJSON []byte, _ ext = sp[len(sp)-1] } if mimeType, ok := misc.MimeTypes[ext]; ok { - node, _ = sjson.SetBytes(node, "parts."+itoa(p)+".inlineData.mime_type", mimeType) + node, _ = sjson.SetBytes(node, "parts."+itoa(p)+".inlineData.mimeType", mimeType) node, _ = sjson.SetBytes(node, "parts."+itoa(p)+".inlineData.data", fileData) p++ } else { @@ -235,7 +235,7 @@ func ConvertOpenAIRequestToAntigravity(modelName string, inputRawJSON []byte, _ if len(pieces) == 2 && len(pieces[1]) > 7 { mime := pieces[0] data := pieces[1][7:] - node, _ = sjson.SetBytes(node, "parts."+itoa(p)+".inlineData.mime_type", mime) + node, _ = sjson.SetBytes(node, "parts."+itoa(p)+".inlineData.mimeType", mime) node, _ = sjson.SetBytes(node, "parts."+itoa(p)+".inlineData.data", data) node, _ = sjson.SetBytes(node, "parts."+itoa(p)+".thoughtSignature", geminiCLIFunctionThoughtSignature) p++