Apply SanitizeFunctionName on request and RestoreSanitizedToolName on response for: gemini/claude, gemini/openai/chat-completions, gemini/openai/responses, antigravity/openai/chat-completions, gemini-cli/openai/chat-completions. Also update SanitizedToolNameMap to handle OpenAI format (tools[].function.name) in addition to Claude format (tools[].name).
457 lines
16 KiB
Go
457 lines
16 KiB
Go
package responses
|
|
|
|
import (
|
|
"encoding/json"
|
|
"strings"
|
|
|
|
"github.com/router-for-me/CLIProxyAPI/v6/internal/translator/gemini/common"
|
|
"github.com/router-for-me/CLIProxyAPI/v6/internal/util"
|
|
"github.com/tidwall/gjson"
|
|
"github.com/tidwall/sjson"
|
|
)
|
|
|
|
const geminiResponsesThoughtSignature = "skip_thought_signature_validator"
|
|
|
|
func ConvertOpenAIResponsesRequestToGemini(modelName string, inputRawJSON []byte, stream bool) []byte {
|
|
rawJSON := inputRawJSON
|
|
|
|
// Note: modelName and stream parameters are part of the fixed method signature
|
|
_ = modelName // Unused but required by interface
|
|
_ = stream // Unused but required by interface
|
|
|
|
// Base Gemini API template (do not include thinkingConfig by default)
|
|
out := []byte(`{"contents":[]}`)
|
|
|
|
root := gjson.ParseBytes(rawJSON)
|
|
|
|
// Extract system instruction from OpenAI "instructions" field
|
|
if instructions := root.Get("instructions"); instructions.Exists() {
|
|
systemInstr := []byte(`{"parts":[{"text":""}]}`)
|
|
systemInstr, _ = sjson.SetBytes(systemInstr, "parts.0.text", instructions.String())
|
|
out, _ = sjson.SetRawBytes(out, "systemInstruction", systemInstr)
|
|
}
|
|
|
|
// Convert input messages to Gemini contents format
|
|
if input := root.Get("input"); input.Exists() && input.IsArray() {
|
|
items := input.Array()
|
|
|
|
// Normalize consecutive function calls and outputs so each call is immediately followed by its response
|
|
normalized := make([]gjson.Result, 0, len(items))
|
|
for i := 0; i < len(items); {
|
|
item := items[i]
|
|
itemType := item.Get("type").String()
|
|
itemRole := item.Get("role").String()
|
|
if itemType == "" && itemRole != "" {
|
|
itemType = "message"
|
|
}
|
|
|
|
if itemType == "function_call" {
|
|
var calls []gjson.Result
|
|
var outputs []gjson.Result
|
|
|
|
for i < len(items) {
|
|
next := items[i]
|
|
nextType := next.Get("type").String()
|
|
nextRole := next.Get("role").String()
|
|
if nextType == "" && nextRole != "" {
|
|
nextType = "message"
|
|
}
|
|
if nextType != "function_call" {
|
|
break
|
|
}
|
|
calls = append(calls, next)
|
|
i++
|
|
}
|
|
|
|
for i < len(items) {
|
|
next := items[i]
|
|
nextType := next.Get("type").String()
|
|
nextRole := next.Get("role").String()
|
|
if nextType == "" && nextRole != "" {
|
|
nextType = "message"
|
|
}
|
|
if nextType != "function_call_output" {
|
|
break
|
|
}
|
|
outputs = append(outputs, next)
|
|
i++
|
|
}
|
|
|
|
if len(calls) > 0 {
|
|
outputMap := make(map[string]gjson.Result, len(outputs))
|
|
for _, outItem := range outputs {
|
|
outputMap[outItem.Get("call_id").String()] = outItem
|
|
}
|
|
for _, call := range calls {
|
|
normalized = append(normalized, call)
|
|
callID := call.Get("call_id").String()
|
|
if resp, ok := outputMap[callID]; ok {
|
|
normalized = append(normalized, resp)
|
|
delete(outputMap, callID)
|
|
}
|
|
}
|
|
for _, outItem := range outputs {
|
|
if _, ok := outputMap[outItem.Get("call_id").String()]; ok {
|
|
normalized = append(normalized, outItem)
|
|
}
|
|
}
|
|
continue
|
|
}
|
|
}
|
|
|
|
if itemType == "function_call_output" {
|
|
normalized = append(normalized, item)
|
|
i++
|
|
continue
|
|
}
|
|
|
|
normalized = append(normalized, item)
|
|
i++
|
|
}
|
|
|
|
for _, item := range normalized {
|
|
itemType := item.Get("type").String()
|
|
itemRole := item.Get("role").String()
|
|
if itemType == "" && itemRole != "" {
|
|
itemType = "message"
|
|
}
|
|
|
|
switch itemType {
|
|
case "message":
|
|
if strings.EqualFold(itemRole, "system") {
|
|
if contentArray := item.Get("content"); contentArray.Exists() {
|
|
systemInstr := []byte(`{"parts":[]}`)
|
|
if systemInstructionResult := gjson.GetBytes(out, "systemInstruction"); systemInstructionResult.Exists() {
|
|
systemInstr = []byte(systemInstructionResult.Raw)
|
|
}
|
|
|
|
if contentArray.IsArray() {
|
|
contentArray.ForEach(func(_, contentItem gjson.Result) bool {
|
|
part := []byte(`{"text":""}`)
|
|
text := contentItem.Get("text").String()
|
|
part, _ = sjson.SetBytes(part, "text", text)
|
|
systemInstr, _ = sjson.SetRawBytes(systemInstr, "parts.-1", part)
|
|
return true
|
|
})
|
|
} else if contentArray.Type == gjson.String {
|
|
part := []byte(`{"text":""}`)
|
|
part, _ = sjson.SetBytes(part, "text", contentArray.String())
|
|
systemInstr, _ = sjson.SetRawBytes(systemInstr, "parts.-1", part)
|
|
}
|
|
|
|
if gjson.GetBytes(systemInstr, "parts.#").Int() > 0 {
|
|
out, _ = sjson.SetRawBytes(out, "systemInstruction", systemInstr)
|
|
}
|
|
}
|
|
continue
|
|
}
|
|
|
|
// Handle regular messages
|
|
// Note: In Responses format, model outputs may appear as content items with type "output_text"
|
|
// even when the message.role is "user". We split such items into distinct Gemini messages
|
|
// with roles derived from the content type to match docs/convert-2.md.
|
|
if contentArray := item.Get("content"); contentArray.Exists() && contentArray.IsArray() {
|
|
currentRole := ""
|
|
currentParts := make([][]byte, 0)
|
|
|
|
flush := func() {
|
|
if currentRole == "" || len(currentParts) == 0 {
|
|
currentParts = currentParts[:0]
|
|
return
|
|
}
|
|
one := []byte(`{"role":"","parts":[]}`)
|
|
one, _ = sjson.SetBytes(one, "role", currentRole)
|
|
for _, part := range currentParts {
|
|
one, _ = sjson.SetRawBytes(one, "parts.-1", part)
|
|
}
|
|
out, _ = sjson.SetRawBytes(out, "contents.-1", one)
|
|
currentParts = currentParts[:0]
|
|
}
|
|
|
|
contentArray.ForEach(func(_, contentItem gjson.Result) bool {
|
|
contentType := contentItem.Get("type").String()
|
|
if contentType == "" {
|
|
contentType = "input_text"
|
|
}
|
|
|
|
effRole := "user"
|
|
if itemRole != "" {
|
|
switch strings.ToLower(itemRole) {
|
|
case "assistant", "model":
|
|
effRole = "model"
|
|
default:
|
|
effRole = strings.ToLower(itemRole)
|
|
}
|
|
}
|
|
if contentType == "output_text" {
|
|
effRole = "model"
|
|
}
|
|
if effRole == "assistant" {
|
|
effRole = "model"
|
|
}
|
|
|
|
if currentRole != "" && effRole != currentRole {
|
|
flush()
|
|
currentRole = ""
|
|
}
|
|
if currentRole == "" {
|
|
currentRole = effRole
|
|
}
|
|
|
|
var partJSON []byte
|
|
switch contentType {
|
|
case "input_text", "output_text":
|
|
if text := contentItem.Get("text"); text.Exists() {
|
|
partJSON = []byte(`{"text":""}`)
|
|
partJSON, _ = sjson.SetBytes(partJSON, "text", text.String())
|
|
}
|
|
case "input_image":
|
|
imageURL := contentItem.Get("image_url").String()
|
|
if imageURL == "" {
|
|
imageURL = contentItem.Get("url").String()
|
|
}
|
|
if imageURL != "" {
|
|
mimeType := "application/octet-stream"
|
|
data := ""
|
|
if strings.HasPrefix(imageURL, "data:") {
|
|
trimmed := strings.TrimPrefix(imageURL, "data:")
|
|
mediaAndData := strings.SplitN(trimmed, ";base64,", 2)
|
|
if len(mediaAndData) == 2 {
|
|
if mediaAndData[0] != "" {
|
|
mimeType = mediaAndData[0]
|
|
}
|
|
data = mediaAndData[1]
|
|
} else {
|
|
mediaAndData = strings.SplitN(trimmed, ",", 2)
|
|
if len(mediaAndData) == 2 {
|
|
if mediaAndData[0] != "" {
|
|
mimeType = mediaAndData[0]
|
|
}
|
|
data = mediaAndData[1]
|
|
}
|
|
}
|
|
}
|
|
if data != "" {
|
|
partJSON = []byte(`{"inline_data":{"mime_type":"","data":""}}`)
|
|
partJSON, _ = sjson.SetBytes(partJSON, "inline_data.mime_type", mimeType)
|
|
partJSON, _ = sjson.SetBytes(partJSON, "inline_data.data", data)
|
|
}
|
|
}
|
|
case "input_audio":
|
|
audioData := contentItem.Get("data").String()
|
|
audioFormat := contentItem.Get("format").String()
|
|
if audioData != "" {
|
|
audioMimeMap := map[string]string{
|
|
"mp3": "audio/mpeg",
|
|
"wav": "audio/wav",
|
|
"ogg": "audio/ogg",
|
|
"flac": "audio/flac",
|
|
"aac": "audio/aac",
|
|
"webm": "audio/webm",
|
|
"pcm16": "audio/pcm",
|
|
"g711_ulaw": "audio/basic",
|
|
"g711_alaw": "audio/basic",
|
|
}
|
|
mimeType := "audio/wav"
|
|
if audioFormat != "" {
|
|
if mapped, ok := audioMimeMap[audioFormat]; ok {
|
|
mimeType = mapped
|
|
} else {
|
|
mimeType = "audio/" + audioFormat
|
|
}
|
|
}
|
|
partJSON = []byte(`{"inline_data":{"mime_type":"","data":""}}`)
|
|
partJSON, _ = sjson.SetBytes(partJSON, "inline_data.mime_type", mimeType)
|
|
partJSON, _ = sjson.SetBytes(partJSON, "inline_data.data", audioData)
|
|
}
|
|
}
|
|
|
|
if len(partJSON) > 0 {
|
|
currentParts = append(currentParts, partJSON)
|
|
}
|
|
return true
|
|
})
|
|
|
|
flush()
|
|
} else if contentArray.Type == gjson.String {
|
|
effRole := "user"
|
|
if itemRole != "" {
|
|
switch strings.ToLower(itemRole) {
|
|
case "assistant", "model":
|
|
effRole = "model"
|
|
default:
|
|
effRole = strings.ToLower(itemRole)
|
|
}
|
|
}
|
|
|
|
one := []byte(`{"role":"","parts":[{"text":""}]}`)
|
|
one, _ = sjson.SetBytes(one, "role", effRole)
|
|
one, _ = sjson.SetBytes(one, "parts.0.text", contentArray.String())
|
|
out, _ = sjson.SetRawBytes(out, "contents.-1", one)
|
|
}
|
|
|
|
case "function_call":
|
|
// Handle function calls - convert to model message with functionCall
|
|
name := util.SanitizeFunctionName(item.Get("name").String())
|
|
arguments := item.Get("arguments").String()
|
|
|
|
modelContent := []byte(`{"role":"model","parts":[]}`)
|
|
functionCall := []byte(`{"functionCall":{"name":"","args":{}}}`)
|
|
functionCall, _ = sjson.SetBytes(functionCall, "functionCall.name", name)
|
|
functionCall, _ = sjson.SetBytes(functionCall, "thoughtSignature", geminiResponsesThoughtSignature)
|
|
functionCall, _ = sjson.SetBytes(functionCall, "functionCall.id", item.Get("call_id").String())
|
|
|
|
// Parse arguments JSON string and set as args object
|
|
if arguments != "" {
|
|
argsResult := gjson.Parse(arguments)
|
|
functionCall, _ = sjson.SetRawBytes(functionCall, "functionCall.args", []byte(argsResult.Raw))
|
|
}
|
|
|
|
modelContent, _ = sjson.SetRawBytes(modelContent, "parts.-1", functionCall)
|
|
out, _ = sjson.SetRawBytes(out, "contents.-1", modelContent)
|
|
|
|
case "function_call_output":
|
|
// Handle function call outputs - convert to function message with functionResponse
|
|
callID := item.Get("call_id").String()
|
|
// Use .Raw to preserve the JSON encoding (includes quotes for strings)
|
|
outputRaw := item.Get("output").Str
|
|
|
|
functionContent := []byte(`{"role":"function","parts":[]}`)
|
|
functionResponse := []byte(`{"functionResponse":{"name":"","response":{}}}`)
|
|
|
|
// We need to extract the function name from the previous function_call
|
|
// For now, we'll use a placeholder or extract from context if available
|
|
functionName := "unknown" // This should ideally be matched with the corresponding function_call
|
|
|
|
// Find the corresponding function call name by matching call_id
|
|
// We need to look back through the input array to find the matching call
|
|
if inputArray := root.Get("input"); inputArray.Exists() && inputArray.IsArray() {
|
|
inputArray.ForEach(func(_, prevItem gjson.Result) bool {
|
|
if prevItem.Get("type").String() == "function_call" && prevItem.Get("call_id").String() == callID {
|
|
functionName = prevItem.Get("name").String()
|
|
return false // Stop iteration
|
|
}
|
|
return true
|
|
})
|
|
}
|
|
functionName = util.SanitizeFunctionName(functionName)
|
|
|
|
functionResponse, _ = sjson.SetBytes(functionResponse, "functionResponse.name", functionName)
|
|
functionResponse, _ = sjson.SetBytes(functionResponse, "functionResponse.id", callID)
|
|
|
|
// Set the raw JSON output directly (preserves string encoding)
|
|
if outputRaw != "" && outputRaw != "null" {
|
|
output := gjson.Parse(outputRaw)
|
|
if output.Type == gjson.JSON && json.Valid([]byte(output.Raw)) {
|
|
functionResponse, _ = sjson.SetRawBytes(functionResponse, "functionResponse.response.result", []byte(output.Raw))
|
|
} else {
|
|
functionResponse, _ = sjson.SetBytes(functionResponse, "functionResponse.response.result", outputRaw)
|
|
}
|
|
}
|
|
functionContent, _ = sjson.SetRawBytes(functionContent, "parts.-1", functionResponse)
|
|
out, _ = sjson.SetRawBytes(out, "contents.-1", functionContent)
|
|
|
|
case "reasoning":
|
|
thoughtContent := []byte(`{"role":"model","parts":[]}`)
|
|
thought := []byte(`{"text":"","thoughtSignature":"","thought":true}`)
|
|
thought, _ = sjson.SetBytes(thought, "text", item.Get("summary.0.text").String())
|
|
thought, _ = sjson.SetBytes(thought, "thoughtSignature", item.Get("encrypted_content").String())
|
|
|
|
thoughtContent, _ = sjson.SetRawBytes(thoughtContent, "parts.-1", thought)
|
|
out, _ = sjson.SetRawBytes(out, "contents.-1", thoughtContent)
|
|
}
|
|
}
|
|
} else if input.Exists() && input.Type == gjson.String {
|
|
// Simple string input conversion to user message
|
|
userContent := []byte(`{"role":"user","parts":[{"text":""}]}`)
|
|
userContent, _ = sjson.SetBytes(userContent, "parts.0.text", input.String())
|
|
out, _ = sjson.SetRawBytes(out, "contents.-1", userContent)
|
|
}
|
|
|
|
// Convert tools to Gemini functionDeclarations format
|
|
if tools := root.Get("tools"); tools.Exists() && tools.IsArray() {
|
|
geminiTools := []byte(`[{"functionDeclarations":[]}]`)
|
|
|
|
tools.ForEach(func(_, tool gjson.Result) bool {
|
|
if tool.Get("type").String() == "function" {
|
|
funcDecl := []byte(`{"name":"","description":"","parametersJsonSchema":{}}`)
|
|
|
|
if name := tool.Get("name"); name.Exists() {
|
|
funcDecl, _ = sjson.SetBytes(funcDecl, "name", util.SanitizeFunctionName(name.String()))
|
|
}
|
|
if desc := tool.Get("description"); desc.Exists() {
|
|
funcDecl, _ = sjson.SetBytes(funcDecl, "description", desc.String())
|
|
}
|
|
if params := tool.Get("parameters"); params.Exists() {
|
|
funcDecl, _ = sjson.SetRawBytes(funcDecl, "parametersJsonSchema", []byte(params.Raw))
|
|
}
|
|
|
|
geminiTools, _ = sjson.SetRawBytes(geminiTools, "0.functionDeclarations.-1", funcDecl)
|
|
}
|
|
return true
|
|
})
|
|
|
|
// Only add tools if there are function declarations
|
|
if funcDecls := gjson.GetBytes(geminiTools, "0.functionDeclarations"); funcDecls.Exists() && len(funcDecls.Array()) > 0 {
|
|
out, _ = sjson.SetRawBytes(out, "tools", geminiTools)
|
|
}
|
|
}
|
|
|
|
// Handle generation config from OpenAI format
|
|
if maxOutputTokens := root.Get("max_output_tokens"); maxOutputTokens.Exists() {
|
|
genConfig := []byte(`{"maxOutputTokens":0}`)
|
|
genConfig, _ = sjson.SetBytes(genConfig, "maxOutputTokens", maxOutputTokens.Int())
|
|
out, _ = sjson.SetRawBytes(out, "generationConfig", genConfig)
|
|
}
|
|
|
|
// Handle temperature if present
|
|
if temperature := root.Get("temperature"); temperature.Exists() {
|
|
if !gjson.GetBytes(out, "generationConfig").Exists() {
|
|
out, _ = sjson.SetRawBytes(out, "generationConfig", []byte(`{}`))
|
|
}
|
|
out, _ = sjson.SetBytes(out, "generationConfig.temperature", temperature.Float())
|
|
}
|
|
|
|
// Handle top_p if present
|
|
if topP := root.Get("top_p"); topP.Exists() {
|
|
if !gjson.GetBytes(out, "generationConfig").Exists() {
|
|
out, _ = sjson.SetRawBytes(out, "generationConfig", []byte(`{}`))
|
|
}
|
|
out, _ = sjson.SetBytes(out, "generationConfig.topP", topP.Float())
|
|
}
|
|
|
|
// Handle stop sequences
|
|
if stopSequences := root.Get("stop_sequences"); stopSequences.Exists() && stopSequences.IsArray() {
|
|
if !gjson.GetBytes(out, "generationConfig").Exists() {
|
|
out, _ = sjson.SetRawBytes(out, "generationConfig", []byte(`{}`))
|
|
}
|
|
var sequences []string
|
|
stopSequences.ForEach(func(_, seq gjson.Result) bool {
|
|
sequences = append(sequences, seq.String())
|
|
return true
|
|
})
|
|
out, _ = sjson.SetBytes(out, "generationConfig.stopSequences", sequences)
|
|
}
|
|
|
|
// Apply thinking configuration: convert OpenAI Responses API reasoning.effort to Gemini thinkingConfig.
|
|
// Inline translation-only mapping; capability checks happen later in ApplyThinking.
|
|
re := root.Get("reasoning.effort")
|
|
if re.Exists() {
|
|
effort := strings.ToLower(strings.TrimSpace(re.String()))
|
|
if effort != "" {
|
|
thinkingPath := "generationConfig.thinkingConfig"
|
|
if effort == "auto" {
|
|
out, _ = sjson.SetBytes(out, thinkingPath+".thinkingBudget", -1)
|
|
out, _ = sjson.SetBytes(out, thinkingPath+".includeThoughts", true)
|
|
} else {
|
|
out, _ = sjson.SetBytes(out, thinkingPath+".thinkingLevel", effort)
|
|
out, _ = sjson.SetBytes(out, thinkingPath+".includeThoughts", effort != "none")
|
|
}
|
|
}
|
|
}
|
|
|
|
result := out
|
|
result = common.AttachDefaultSafetySettings(result, "safetySettings")
|
|
return result
|
|
}
|