2024-02-29 01:08:18 +08:00
|
|
|
|
package claude
|
2023-07-22 16:18:03 +08:00
|
|
|
|
|
2023-07-22 17:12:13 +08:00
|
|
|
|
import (
|
2025-03-12 19:29:15 +08:00
|
|
|
|
"bytes"
|
2023-07-22 17:36:40 +08:00
|
|
|
|
"encoding/json"
|
2023-07-22 17:12:13 +08:00
|
|
|
|
"fmt"
|
2023-07-22 17:36:40 +08:00
|
|
|
|
"io"
|
|
|
|
|
|
"net/http"
|
2023-07-22 17:12:13 +08:00
|
|
|
|
"one-api/common"
|
2024-02-29 01:08:18 +08:00
|
|
|
|
"one-api/dto"
|
2024-06-27 00:16:39 +08:00
|
|
|
|
relaycommon "one-api/relay/common"
|
2025-03-05 19:47:41 +08:00
|
|
|
|
"one-api/relay/helper"
|
2024-02-29 01:08:18 +08:00
|
|
|
|
"one-api/service"
|
2025-02-27 20:49:34 +08:00
|
|
|
|
"one-api/setting/model_setting"
|
2023-07-22 17:12:13 +08:00
|
|
|
|
"strings"
|
2024-09-05 00:53:00 +08:00
|
|
|
|
|
|
|
|
|
|
"github.com/gin-gonic/gin"
|
2023-07-22 17:12:13 +08:00
|
|
|
|
)
|
|
|
|
|
|
|
2023-07-22 16:18:03 +08:00
|
|
|
|
// stopReasonClaude2OpenAI translates a Claude stop_reason into the matching
// OpenAI finish_reason.
//
// "stop_sequence" and "end_turn" both become "stop", "max_tokens" becomes
// "length" and "tool_use" becomes "tool_calls", which are the values OpenAI
// clients expect. Any other value (including the empty string) is returned
// unchanged so callers can still detect "no stop reason yet".
func stopReasonClaude2OpenAI(reason string) string {
	switch reason {
	case "stop_sequence", "end_turn":
		return "stop"
	case "max_tokens":
		return "length"
	case "tool_use":
		return "tool_calls"
	default:
		return reason
	}
}
|
2023-07-22 17:12:13 +08:00
|
|
|
|
|
2025-03-12 21:31:46 +08:00
|
|
|
|
func RequestOpenAI2ClaudeComplete(textRequest dto.GeneralOpenAIRequest) *dto.ClaudeRequest {
|
2024-07-18 00:36:05 +08:00
|
|
|
|
|
2025-03-12 21:31:46 +08:00
|
|
|
|
claudeRequest := dto.ClaudeRequest{
|
2024-04-23 12:19:23 +08:00
|
|
|
|
Model: textRequest.Model,
|
|
|
|
|
|
Prompt: "",
|
|
|
|
|
|
StopSequences: nil,
|
|
|
|
|
|
Temperature: textRequest.Temperature,
|
|
|
|
|
|
TopP: textRequest.TopP,
|
|
|
|
|
|
TopK: textRequest.TopK,
|
|
|
|
|
|
Stream: textRequest.Stream,
|
2023-07-22 17:12:13 +08:00
|
|
|
|
}
|
2024-04-28 20:45:34 +08:00
|
|
|
|
if claudeRequest.MaxTokensToSample == 0 {
|
|
|
|
|
|
claudeRequest.MaxTokensToSample = 4096
|
2023-07-22 17:12:13 +08:00
|
|
|
|
}
|
|
|
|
|
|
prompt := ""
|
|
|
|
|
|
for _, message := range textRequest.Messages {
|
|
|
|
|
|
if message.Role == "user" {
|
|
|
|
|
|
prompt += fmt.Sprintf("\n\nHuman: %s", message.Content)
|
|
|
|
|
|
} else if message.Role == "assistant" {
|
|
|
|
|
|
prompt += fmt.Sprintf("\n\nAssistant: %s", message.Content)
|
2023-07-27 23:26:56 +08:00
|
|
|
|
} else if message.Role == "system" {
|
2024-03-06 17:41:55 +08:00
|
|
|
|
if prompt == "" {
|
|
|
|
|
|
prompt = message.StringContent()
|
|
|
|
|
|
}
|
2023-07-22 17:12:13 +08:00
|
|
|
|
}
|
|
|
|
|
|
}
|
2023-07-27 23:26:56 +08:00
|
|
|
|
prompt += "\n\nAssistant:"
|
2023-07-22 17:12:13 +08:00
|
|
|
|
claudeRequest.Prompt = prompt
|
|
|
|
|
|
return &claudeRequest
|
|
|
|
|
|
}
|
|
|
|
|
|
|
2025-03-12 21:31:46 +08:00
|
|
|
|
func RequestOpenAI2ClaudeMessage(textRequest dto.GeneralOpenAIRequest) (*dto.ClaudeRequest, error) {
|
|
|
|
|
|
claudeTools := make([]dto.Tool, 0, len(textRequest.Tools))
|
2024-07-18 00:36:05 +08:00
|
|
|
|
|
|
|
|
|
|
for _, tool := range textRequest.Tools {
|
|
|
|
|
|
if params, ok := tool.Function.Parameters.(map[string]any); ok {
|
2025-03-12 21:31:46 +08:00
|
|
|
|
claudeTool := dto.Tool{
|
2024-07-18 00:36:05 +08:00
|
|
|
|
Name: tool.Function.Name,
|
|
|
|
|
|
Description: tool.Function.Description,
|
2024-08-13 17:54:24 +08:00
|
|
|
|
}
|
|
|
|
|
|
claudeTool.InputSchema = make(map[string]interface{})
|
|
|
|
|
|
claudeTool.InputSchema["type"] = params["type"].(string)
|
|
|
|
|
|
claudeTool.InputSchema["properties"] = params["properties"]
|
|
|
|
|
|
claudeTool.InputSchema["required"] = params["required"]
|
|
|
|
|
|
for s, a := range params {
|
|
|
|
|
|
if s == "type" || s == "properties" || s == "required" {
|
|
|
|
|
|
continue
|
|
|
|
|
|
}
|
|
|
|
|
|
claudeTool.InputSchema[s] = a
|
|
|
|
|
|
}
|
|
|
|
|
|
claudeTools = append(claudeTools, claudeTool)
|
2024-07-18 00:36:05 +08:00
|
|
|
|
}
|
|
|
|
|
|
}
|
|
|
|
|
|
|
2025-03-12 21:31:46 +08:00
|
|
|
|
claudeRequest := dto.ClaudeRequest{
|
2024-03-08 18:25:57 +08:00
|
|
|
|
Model: textRequest.Model,
|
|
|
|
|
|
MaxTokens: textRequest.MaxTokens,
|
|
|
|
|
|
StopSequences: nil,
|
|
|
|
|
|
Temperature: textRequest.Temperature,
|
|
|
|
|
|
TopP: textRequest.TopP,
|
2024-04-01 14:33:58 +08:00
|
|
|
|
TopK: textRequest.TopK,
|
2024-03-08 18:25:57 +08:00
|
|
|
|
Stream: textRequest.Stream,
|
2024-07-18 00:36:05 +08:00
|
|
|
|
Tools: claudeTools,
|
2024-03-08 18:25:57 +08:00
|
|
|
|
}
|
2025-02-25 14:10:43 +08:00
|
|
|
|
|
2025-02-27 22:10:29 +08:00
|
|
|
|
if claudeRequest.MaxTokens == 0 {
|
2025-02-28 17:53:08 +08:00
|
|
|
|
claudeRequest.MaxTokens = uint(model_setting.GetClaudeSettings().GetDefaultMaxTokens(textRequest.Model))
|
2025-02-27 22:10:29 +08:00
|
|
|
|
}
|
|
|
|
|
|
|
2025-02-27 20:49:34 +08:00
|
|
|
|
if model_setting.GetClaudeSettings().ThinkingAdapterEnabled &&
|
|
|
|
|
|
strings.HasSuffix(textRequest.Model, "-thinking") {
|
2025-02-25 14:10:43 +08:00
|
|
|
|
|
|
|
|
|
|
// 因为BudgetTokens 必须大于1024
|
|
|
|
|
|
if claudeRequest.MaxTokens < 1280 {
|
|
|
|
|
|
claudeRequest.MaxTokens = 1280
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
// BudgetTokens 为 max_tokens 的 80%
|
2025-03-12 21:31:46 +08:00
|
|
|
|
claudeRequest.Thinking = &dto.Thinking{
|
2025-02-25 14:10:43 +08:00
|
|
|
|
Type: "enabled",
|
2025-02-27 20:49:34 +08:00
|
|
|
|
BudgetTokens: int(float64(claudeRequest.MaxTokens) * model_setting.GetClaudeSettings().ThinkingAdapterBudgetTokensPercentage),
|
2025-02-25 14:10:43 +08:00
|
|
|
|
}
|
2025-02-25 22:01:05 +08:00
|
|
|
|
// TODO: 临时处理
|
|
|
|
|
|
// https://docs.anthropic.com/en/docs/build-with-claude/extended-thinking#important-considerations-when-using-extended-thinking
|
2025-02-25 16:52:45 +08:00
|
|
|
|
claudeRequest.TopP = 0
|
2025-02-25 22:01:05 +08:00
|
|
|
|
claudeRequest.Temperature = common.GetPointer[float64](1.0)
|
2025-02-25 14:10:43 +08:00
|
|
|
|
claudeRequest.Model = strings.TrimSuffix(textRequest.Model, "-thinking")
|
|
|
|
|
|
}
|
|
|
|
|
|
|
2024-07-11 18:44:45 +08:00
|
|
|
|
if textRequest.Stop != nil {
|
|
|
|
|
|
// stop maybe string/array string, convert to array string
|
|
|
|
|
|
switch textRequest.Stop.(type) {
|
|
|
|
|
|
case string:
|
|
|
|
|
|
claudeRequest.StopSequences = []string{textRequest.Stop.(string)}
|
|
|
|
|
|
case []interface{}:
|
|
|
|
|
|
stopSequences := make([]string, 0)
|
|
|
|
|
|
for _, stop := range textRequest.Stop.([]interface{}) {
|
|
|
|
|
|
stopSequences = append(stopSequences, stop.(string))
|
|
|
|
|
|
}
|
|
|
|
|
|
claudeRequest.StopSequences = stopSequences
|
|
|
|
|
|
}
|
|
|
|
|
|
}
|
2024-04-23 13:08:37 +08:00
|
|
|
|
formatMessages := make([]dto.Message, 0)
|
2024-09-05 00:53:00 +08:00
|
|
|
|
lastMessage := dto.Message{
|
|
|
|
|
|
Role: "tool",
|
|
|
|
|
|
}
|
2024-04-25 20:37:50 +08:00
|
|
|
|
for i, message := range textRequest.Messages {
|
2024-04-23 13:08:37 +08:00
|
|
|
|
if message.Role == "" {
|
2024-04-25 22:57:11 +08:00
|
|
|
|
textRequest.Messages[i].Role = "user"
|
2024-04-23 13:08:37 +08:00
|
|
|
|
}
|
|
|
|
|
|
fmtMessage := dto.Message{
|
|
|
|
|
|
Role: message.Role,
|
|
|
|
|
|
Content: message.Content,
|
|
|
|
|
|
}
|
2024-09-05 00:53:00 +08:00
|
|
|
|
if message.Role == "tool" {
|
|
|
|
|
|
fmtMessage.ToolCallId = message.ToolCallId
|
|
|
|
|
|
}
|
|
|
|
|
|
if message.Role == "assistant" && message.ToolCalls != nil {
|
|
|
|
|
|
fmtMessage.ToolCalls = message.ToolCalls
|
|
|
|
|
|
}
|
|
|
|
|
|
if lastMessage.Role == message.Role && lastMessage.Role != "tool" {
|
2024-04-23 13:08:37 +08:00
|
|
|
|
if lastMessage.IsStringContent() && message.IsStringContent() {
|
|
|
|
|
|
content, _ := json.Marshal(strings.Trim(fmt.Sprintf("%s %s", lastMessage.StringContent(), message.StringContent()), "\""))
|
|
|
|
|
|
fmtMessage.Content = content
|
|
|
|
|
|
// delete last message
|
|
|
|
|
|
formatMessages = formatMessages[:len(formatMessages)-1]
|
|
|
|
|
|
}
|
|
|
|
|
|
}
|
|
|
|
|
|
if fmtMessage.Content == nil {
|
|
|
|
|
|
content, _ := json.Marshal("...")
|
|
|
|
|
|
fmtMessage.Content = content
|
|
|
|
|
|
}
|
|
|
|
|
|
formatMessages = append(formatMessages, fmtMessage)
|
2024-09-05 00:53:00 +08:00
|
|
|
|
lastMessage = fmtMessage
|
2024-04-23 13:08:37 +08:00
|
|
|
|
}
|
|
|
|
|
|
|
2025-03-12 21:31:46 +08:00
|
|
|
|
claudeMessages := make([]dto.ClaudeMessage, 0)
|
2024-08-24 17:15:55 +08:00
|
|
|
|
isFirstMessage := true
|
2024-04-23 13:08:37 +08:00
|
|
|
|
for _, message := range formatMessages {
|
2024-03-08 18:25:57 +08:00
|
|
|
|
if message.Role == "system" {
|
2024-04-25 20:37:50 +08:00
|
|
|
|
if message.IsStringContent() {
|
|
|
|
|
|
claudeRequest.System = message.StringContent()
|
|
|
|
|
|
} else {
|
|
|
|
|
|
contents := message.ParseContent()
|
|
|
|
|
|
content := ""
|
|
|
|
|
|
for _, ctx := range contents {
|
|
|
|
|
|
if ctx.Type == "text" {
|
|
|
|
|
|
content += ctx.Text
|
|
|
|
|
|
}
|
|
|
|
|
|
}
|
|
|
|
|
|
claudeRequest.System = content
|
|
|
|
|
|
}
|
2024-03-08 18:25:57 +08:00
|
|
|
|
} else {
|
2024-08-24 17:15:55 +08:00
|
|
|
|
if isFirstMessage {
|
|
|
|
|
|
isFirstMessage = false
|
|
|
|
|
|
if message.Role != "user" {
|
|
|
|
|
|
// fix: first message is assistant, add user message
|
2025-03-12 21:31:46 +08:00
|
|
|
|
claudeMessage := dto.ClaudeMessage{
|
2024-08-24 17:15:55 +08:00
|
|
|
|
Role: "user",
|
2025-03-12 21:31:46 +08:00
|
|
|
|
Content: []dto.ClaudeMediaMessage{
|
2024-08-24 17:15:55 +08:00
|
|
|
|
{
|
|
|
|
|
|
Type: "text",
|
2025-03-12 21:31:46 +08:00
|
|
|
|
Text: common.GetPointer[string]("..."),
|
2024-08-24 17:15:55 +08:00
|
|
|
|
},
|
|
|
|
|
|
},
|
|
|
|
|
|
}
|
|
|
|
|
|
claudeMessages = append(claudeMessages, claudeMessage)
|
|
|
|
|
|
}
|
|
|
|
|
|
}
|
2025-03-12 21:31:46 +08:00
|
|
|
|
claudeMessage := dto.ClaudeMessage{
|
2024-03-08 18:25:57 +08:00
|
|
|
|
Role: message.Role,
|
|
|
|
|
|
}
|
2024-09-05 00:53:00 +08:00
|
|
|
|
if message.Role == "tool" {
|
|
|
|
|
|
if len(claudeMessages) > 0 && claudeMessages[len(claudeMessages)-1].Role == "user" {
|
|
|
|
|
|
lastMessage := claudeMessages[len(claudeMessages)-1]
|
|
|
|
|
|
if content, ok := lastMessage.Content.(string); ok {
|
2025-03-12 21:31:46 +08:00
|
|
|
|
lastMessage.Content = []dto.ClaudeMediaMessage{
|
2024-09-05 00:53:00 +08:00
|
|
|
|
{
|
|
|
|
|
|
Type: "text",
|
2025-03-12 21:31:46 +08:00
|
|
|
|
Text: common.GetPointer[string](content),
|
2024-09-05 00:53:00 +08:00
|
|
|
|
},
|
|
|
|
|
|
}
|
|
|
|
|
|
}
|
2025-03-12 21:31:46 +08:00
|
|
|
|
lastMessage.Content = append(lastMessage.Content.([]dto.ClaudeMediaMessage), dto.ClaudeMediaMessage{
|
2024-09-05 00:53:00 +08:00
|
|
|
|
Type: "tool_result",
|
|
|
|
|
|
ToolUseId: message.ToolCallId,
|
2025-03-12 21:31:46 +08:00
|
|
|
|
Content: message.Content,
|
2024-09-05 00:53:00 +08:00
|
|
|
|
})
|
|
|
|
|
|
claudeMessages[len(claudeMessages)-1] = lastMessage
|
|
|
|
|
|
continue
|
|
|
|
|
|
} else {
|
|
|
|
|
|
claudeMessage.Role = "user"
|
2025-03-12 21:31:46 +08:00
|
|
|
|
claudeMessage.Content = []dto.ClaudeMediaMessage{
|
2024-09-05 00:53:00 +08:00
|
|
|
|
{
|
|
|
|
|
|
Type: "tool_result",
|
|
|
|
|
|
ToolUseId: message.ToolCallId,
|
2025-03-12 21:31:46 +08:00
|
|
|
|
Content: message.Content,
|
2024-09-05 00:53:00 +08:00
|
|
|
|
},
|
|
|
|
|
|
}
|
|
|
|
|
|
}
|
|
|
|
|
|
} else if message.IsStringContent() && message.ToolCalls == nil {
|
2024-03-08 18:25:57 +08:00
|
|
|
|
claudeMessage.Content = message.StringContent()
|
|
|
|
|
|
} else {
|
2025-03-12 21:31:46 +08:00
|
|
|
|
claudeMediaMessages := make([]dto.ClaudeMediaMessage, 0)
|
2024-03-08 18:25:57 +08:00
|
|
|
|
for _, mediaMessage := range message.ParseContent() {
|
2025-03-12 21:31:46 +08:00
|
|
|
|
claudeMediaMessage := dto.ClaudeMediaMessage{
|
2024-03-08 18:25:57 +08:00
|
|
|
|
Type: mediaMessage.Type,
|
|
|
|
|
|
}
|
|
|
|
|
|
if mediaMessage.Type == "text" {
|
2025-03-12 21:31:46 +08:00
|
|
|
|
claudeMediaMessage.Text = common.GetPointer[string](mediaMessage.Text)
|
2024-03-08 18:25:57 +08:00
|
|
|
|
} else {
|
|
|
|
|
|
imageUrl := mediaMessage.ImageUrl.(dto.MessageImageUrl)
|
|
|
|
|
|
claudeMediaMessage.Type = "image"
|
2025-03-12 21:31:46 +08:00
|
|
|
|
claudeMediaMessage.Source = &dto.ClaudeMessageSource{
|
2024-03-08 18:25:57 +08:00
|
|
|
|
Type: "base64",
|
|
|
|
|
|
}
|
|
|
|
|
|
// 判断是否是url
|
|
|
|
|
|
if strings.HasPrefix(imageUrl.Url, "http") {
|
|
|
|
|
|
// 是url,获取图片的类型和base64编码的数据
|
2024-12-29 00:00:24 +08:00
|
|
|
|
fileData, err := service.GetFileBase64FromUrl(imageUrl.Url)
|
|
|
|
|
|
if err != nil {
|
|
|
|
|
|
return nil, fmt.Errorf("get file base64 from url failed: %s", err.Error())
|
|
|
|
|
|
}
|
|
|
|
|
|
claudeMediaMessage.Source.MediaType = fileData.MimeType
|
|
|
|
|
|
claudeMediaMessage.Source.Data = fileData.Base64Data
|
2024-03-08 18:25:57 +08:00
|
|
|
|
} else {
|
2024-05-28 17:59:53 +08:00
|
|
|
|
_, format, base64String, err := service.DecodeBase64ImageData(imageUrl.Url)
|
2024-03-08 18:25:57 +08:00
|
|
|
|
if err != nil {
|
|
|
|
|
|
return nil, err
|
|
|
|
|
|
}
|
|
|
|
|
|
claudeMediaMessage.Source.MediaType = "image/" + format
|
|
|
|
|
|
claudeMediaMessage.Source.Data = base64String
|
|
|
|
|
|
}
|
|
|
|
|
|
}
|
|
|
|
|
|
claudeMediaMessages = append(claudeMediaMessages, claudeMediaMessage)
|
|
|
|
|
|
}
|
2024-09-05 00:53:00 +08:00
|
|
|
|
if message.ToolCalls != nil {
|
2024-12-22 16:20:30 +08:00
|
|
|
|
for _, toolCall := range message.ParseToolCalls() {
|
2024-09-05 00:53:00 +08:00
|
|
|
|
inputObj := make(map[string]any)
|
|
|
|
|
|
if err := json.Unmarshal([]byte(toolCall.Function.Arguments), &inputObj); err != nil {
|
|
|
|
|
|
common.SysError("tool call function arguments is not a map[string]any: " + fmt.Sprintf("%v", toolCall.Function.Arguments))
|
|
|
|
|
|
continue
|
|
|
|
|
|
}
|
2025-03-12 21:31:46 +08:00
|
|
|
|
claudeMediaMessages = append(claudeMediaMessages, dto.ClaudeMediaMessage{
|
2024-09-05 00:53:00 +08:00
|
|
|
|
Type: "tool_use",
|
|
|
|
|
|
Id: toolCall.ID,
|
|
|
|
|
|
Name: toolCall.Function.Name,
|
|
|
|
|
|
Input: inputObj,
|
|
|
|
|
|
})
|
|
|
|
|
|
}
|
|
|
|
|
|
}
|
2024-03-08 18:25:57 +08:00
|
|
|
|
claudeMessage.Content = claudeMediaMessages
|
|
|
|
|
|
}
|
|
|
|
|
|
claudeMessages = append(claudeMessages, claudeMessage)
|
|
|
|
|
|
}
|
|
|
|
|
|
}
|
|
|
|
|
|
claudeRequest.Prompt = ""
|
|
|
|
|
|
claudeRequest.Messages = claudeMessages
|
|
|
|
|
|
return &claudeRequest, nil
|
|
|
|
|
|
}
|
2024-03-06 17:41:55 +08:00
|
|
|
|
|
2025-03-12 21:31:46 +08:00
|
|
|
|
func StreamResponseClaude2OpenAI(reqMode int, claudeResponse *dto.ClaudeResponse) *dto.ChatCompletionsStreamResponse {
|
2024-02-29 01:08:18 +08:00
|
|
|
|
var response dto.ChatCompletionsStreamResponse
|
2023-07-22 17:12:13 +08:00
|
|
|
|
response.Object = "chat.completion.chunk"
|
|
|
|
|
|
response.Model = claudeResponse.Model
|
2024-03-08 19:43:33 +08:00
|
|
|
|
response.Choices = make([]dto.ChatCompletionsStreamResponseChoice, 0)
|
2025-02-26 23:56:10 +08:00
|
|
|
|
tools := make([]dto.ToolCallResponse, 0)
|
2024-03-08 19:43:33 +08:00
|
|
|
|
var choice dto.ChatCompletionsStreamResponseChoice
|
|
|
|
|
|
if reqMode == RequestModeCompletion {
|
2024-04-25 23:57:39 +08:00
|
|
|
|
choice.Delta.SetContentString(claudeResponse.Completion)
|
2024-03-08 19:43:33 +08:00
|
|
|
|
finishReason := stopReasonClaude2OpenAI(claudeResponse.StopReason)
|
|
|
|
|
|
if finishReason != "null" {
|
|
|
|
|
|
choice.FinishReason = &finishReason
|
|
|
|
|
|
}
|
|
|
|
|
|
} else {
|
|
|
|
|
|
if claudeResponse.Type == "message_start" {
|
|
|
|
|
|
response.Id = claudeResponse.Message.Id
|
|
|
|
|
|
response.Model = claudeResponse.Message.Model
|
2025-03-12 19:29:15 +08:00
|
|
|
|
//claudeUsage = &claudeResponse.Message.Usage
|
2024-04-25 23:57:39 +08:00
|
|
|
|
choice.Delta.SetContentString("")
|
|
|
|
|
|
choice.Delta.Role = "assistant"
|
2024-04-26 02:56:35 +08:00
|
|
|
|
} else if claudeResponse.Type == "content_block_start" {
|
2024-07-18 00:36:05 +08:00
|
|
|
|
if claudeResponse.ContentBlock != nil {
|
|
|
|
|
|
//choice.Delta.SetContentString(claudeResponse.ContentBlock.Text)
|
|
|
|
|
|
if claudeResponse.ContentBlock.Type == "tool_use" {
|
2025-02-26 23:56:10 +08:00
|
|
|
|
tools = append(tools, dto.ToolCallResponse{
|
2024-07-18 00:36:05 +08:00
|
|
|
|
ID: claudeResponse.ContentBlock.Id,
|
|
|
|
|
|
Type: "function",
|
2025-02-26 23:56:10 +08:00
|
|
|
|
Function: dto.FunctionResponse{
|
2024-07-18 00:36:05 +08:00
|
|
|
|
Name: claudeResponse.ContentBlock.Name,
|
|
|
|
|
|
Arguments: "",
|
|
|
|
|
|
},
|
|
|
|
|
|
})
|
|
|
|
|
|
}
|
|
|
|
|
|
} else {
|
2025-03-12 19:29:15 +08:00
|
|
|
|
return nil
|
2024-07-18 00:36:05 +08:00
|
|
|
|
}
|
2024-03-08 19:43:33 +08:00
|
|
|
|
} else if claudeResponse.Type == "content_block_delta" {
|
2024-07-18 00:36:05 +08:00
|
|
|
|
if claudeResponse.Delta != nil {
|
2025-03-12 21:31:46 +08:00
|
|
|
|
choice.Index = *claudeResponse.Index
|
2025-03-12 21:35:57 +08:00
|
|
|
|
choice.Delta.Content = claudeResponse.Delta.Text
|
2025-02-25 14:10:43 +08:00
|
|
|
|
switch claudeResponse.Delta.Type {
|
|
|
|
|
|
case "input_json_delta":
|
2025-02-26 23:56:10 +08:00
|
|
|
|
tools = append(tools, dto.ToolCallResponse{
|
|
|
|
|
|
Function: dto.FunctionResponse{
|
2025-03-13 19:32:08 +08:00
|
|
|
|
Arguments: *claudeResponse.Delta.PartialJson,
|
2024-07-18 00:36:05 +08:00
|
|
|
|
},
|
|
|
|
|
|
})
|
2025-02-25 14:10:43 +08:00
|
|
|
|
case "signature_delta":
|
|
|
|
|
|
// 加密的不处理
|
|
|
|
|
|
signatureContent := "\n"
|
|
|
|
|
|
choice.Delta.ReasoningContent = &signatureContent
|
|
|
|
|
|
case "thinking_delta":
|
|
|
|
|
|
thinkingContent := claudeResponse.Delta.Thinking
|
|
|
|
|
|
choice.Delta.ReasoningContent = &thinkingContent
|
2024-07-18 00:36:05 +08:00
|
|
|
|
}
|
|
|
|
|
|
}
|
2024-03-08 19:43:33 +08:00
|
|
|
|
} else if claudeResponse.Type == "message_delta" {
|
|
|
|
|
|
finishReason := stopReasonClaude2OpenAI(*claudeResponse.Delta.StopReason)
|
|
|
|
|
|
if finishReason != "null" {
|
|
|
|
|
|
choice.FinishReason = &finishReason
|
|
|
|
|
|
}
|
2025-03-12 19:29:15 +08:00
|
|
|
|
//claudeUsage = &claudeResponse.Usage
|
2024-04-23 11:44:40 +08:00
|
|
|
|
} else if claudeResponse.Type == "message_stop" {
|
2025-03-12 19:29:15 +08:00
|
|
|
|
return nil
|
2024-04-25 23:57:39 +08:00
|
|
|
|
} else {
|
2025-03-12 19:29:15 +08:00
|
|
|
|
return nil
|
2024-03-08 19:43:33 +08:00
|
|
|
|
}
|
|
|
|
|
|
}
|
2024-07-18 00:36:05 +08:00
|
|
|
|
if len(tools) > 0 {
|
|
|
|
|
|
choice.Delta.Content = nil // compatible with other OpenAI derivative applications, like LobeOpenAICompatibleFactory ...
|
|
|
|
|
|
choice.Delta.ToolCalls = tools
|
|
|
|
|
|
}
|
2024-03-08 19:43:33 +08:00
|
|
|
|
response.Choices = append(response.Choices, choice)
|
2024-04-25 23:57:39 +08:00
|
|
|
|
|
2025-03-12 19:29:15 +08:00
|
|
|
|
return &response
|
2023-07-22 17:12:13 +08:00
|
|
|
|
}
|
|
|
|
|
|
|
2025-03-12 21:31:46 +08:00
|
|
|
|
func ResponseClaude2OpenAI(reqMode int, claudeResponse *dto.ClaudeResponse) *dto.OpenAITextResponse {
|
2024-03-08 18:25:57 +08:00
|
|
|
|
choices := make([]dto.OpenAITextResponseChoice, 0)
|
2024-02-29 01:08:18 +08:00
|
|
|
|
fullTextResponse := dto.OpenAITextResponse{
|
2023-07-22 17:12:13 +08:00
|
|
|
|
Id: fmt.Sprintf("chatcmpl-%s", common.GetUUID()),
|
|
|
|
|
|
Object: "chat.completion",
|
|
|
|
|
|
Created: common.GetTimestamp(),
|
|
|
|
|
|
}
|
2024-07-18 00:36:05 +08:00
|
|
|
|
var responseText string
|
2025-03-14 17:48:26 +08:00
|
|
|
|
var responseThinking string
|
2024-07-18 00:36:05 +08:00
|
|
|
|
if len(claudeResponse.Content) > 0 {
|
2025-03-14 17:48:26 +08:00
|
|
|
|
responseText = claudeResponse.Content[0].GetText()
|
|
|
|
|
|
responseThinking = claudeResponse.Content[0].Thinking
|
2024-07-18 00:36:05 +08:00
|
|
|
|
}
|
2025-02-26 23:56:10 +08:00
|
|
|
|
tools := make([]dto.ToolCallResponse, 0)
|
2025-02-25 14:10:43 +08:00
|
|
|
|
thinkingContent := ""
|
|
|
|
|
|
|
2024-03-08 18:25:57 +08:00
|
|
|
|
if reqMode == RequestModeCompletion {
|
|
|
|
|
|
content, _ := json.Marshal(strings.TrimPrefix(claudeResponse.Completion, " "))
|
|
|
|
|
|
choice := dto.OpenAITextResponseChoice{
|
|
|
|
|
|
Index: 0,
|
|
|
|
|
|
Message: dto.Message{
|
|
|
|
|
|
Role: "assistant",
|
|
|
|
|
|
Content: content,
|
|
|
|
|
|
Name: nil,
|
|
|
|
|
|
},
|
|
|
|
|
|
FinishReason: stopReasonClaude2OpenAI(claudeResponse.StopReason),
|
|
|
|
|
|
}
|
|
|
|
|
|
choices = append(choices, choice)
|
|
|
|
|
|
} else {
|
|
|
|
|
|
fullTextResponse.Id = claudeResponse.Id
|
2024-07-18 00:36:05 +08:00
|
|
|
|
for _, message := range claudeResponse.Content {
|
2025-02-25 14:10:43 +08:00
|
|
|
|
switch message.Type {
|
|
|
|
|
|
case "tool_use":
|
2024-07-18 00:36:05 +08:00
|
|
|
|
args, _ := json.Marshal(message.Input)
|
2025-02-26 23:56:10 +08:00
|
|
|
|
tools = append(tools, dto.ToolCallResponse{
|
2024-07-18 00:36:05 +08:00
|
|
|
|
ID: message.Id,
|
|
|
|
|
|
Type: "function", // compatible with other OpenAI derivative applications
|
2025-02-26 23:56:10 +08:00
|
|
|
|
Function: dto.FunctionResponse{
|
2024-07-18 00:36:05 +08:00
|
|
|
|
Name: message.Name,
|
|
|
|
|
|
Arguments: string(args),
|
|
|
|
|
|
},
|
|
|
|
|
|
})
|
2025-02-25 14:10:43 +08:00
|
|
|
|
case "thinking":
|
|
|
|
|
|
// 加密的不管, 只输出明文的推理过程
|
|
|
|
|
|
thinkingContent = message.Thinking
|
|
|
|
|
|
case "text":
|
2025-03-15 19:10:12 +08:00
|
|
|
|
responseText = message.GetText()
|
2024-03-08 18:25:57 +08:00
|
|
|
|
}
|
|
|
|
|
|
}
|
|
|
|
|
|
}
|
2024-07-18 00:36:05 +08:00
|
|
|
|
choice := dto.OpenAITextResponseChoice{
|
|
|
|
|
|
Index: 0,
|
|
|
|
|
|
Message: dto.Message{
|
|
|
|
|
|
Role: "assistant",
|
|
|
|
|
|
},
|
|
|
|
|
|
FinishReason: stopReasonClaude2OpenAI(claudeResponse.StopReason),
|
|
|
|
|
|
}
|
|
|
|
|
|
choice.SetStringContent(responseText)
|
2025-03-14 17:48:26 +08:00
|
|
|
|
if len(responseThinking) > 0 {
|
|
|
|
|
|
choice.ReasoningContent = responseThinking
|
|
|
|
|
|
}
|
2024-07-18 00:36:05 +08:00
|
|
|
|
if len(tools) > 0 {
|
2024-12-22 16:20:30 +08:00
|
|
|
|
choice.Message.SetToolCalls(tools)
|
2024-07-18 00:36:05 +08:00
|
|
|
|
}
|
2025-02-25 14:10:43 +08:00
|
|
|
|
choice.Message.ReasoningContent = thinkingContent
|
2024-09-11 19:12:55 +08:00
|
|
|
|
fullTextResponse.Model = claudeResponse.Model
|
2024-07-18 00:36:05 +08:00
|
|
|
|
choices = append(choices, choice)
|
2024-03-08 18:25:57 +08:00
|
|
|
|
fullTextResponse.Choices = choices
|
2023-07-22 17:12:13 +08:00
|
|
|
|
return &fullTextResponse
|
|
|
|
|
|
}
|
2023-07-22 17:36:40 +08:00
|
|
|
|
|
2025-03-12 19:29:15 +08:00
|
|
|
|
type ClaudeResponseInfo struct {
|
|
|
|
|
|
ResponseId string
|
|
|
|
|
|
Created int64
|
|
|
|
|
|
Model string
|
|
|
|
|
|
ResponseText strings.Builder
|
|
|
|
|
|
Usage *dto.Usage
|
|
|
|
|
|
}
|
|
|
|
|
|
|
2025-03-12 21:31:46 +08:00
|
|
|
|
func FormatClaudeResponseInfo(requestMode int, claudeResponse *dto.ClaudeResponse, oaiResponse *dto.ChatCompletionsStreamResponse, claudeInfo *ClaudeResponseInfo) bool {
|
2025-03-12 19:29:15 +08:00
|
|
|
|
if requestMode == RequestModeCompletion {
|
|
|
|
|
|
claudeInfo.ResponseText.WriteString(claudeResponse.Completion)
|
|
|
|
|
|
} else {
|
|
|
|
|
|
if claudeResponse.Type == "message_start" {
|
|
|
|
|
|
// message_start, 获取usage
|
|
|
|
|
|
claudeInfo.ResponseId = claudeResponse.Message.Id
|
|
|
|
|
|
claudeInfo.Model = claudeResponse.Message.Model
|
|
|
|
|
|
claudeInfo.Usage.PromptTokens = claudeResponse.Message.Usage.InputTokens
|
|
|
|
|
|
} else if claudeResponse.Type == "content_block_delta" {
|
2025-03-12 21:35:57 +08:00
|
|
|
|
if claudeResponse.Delta.Text != nil {
|
|
|
|
|
|
claudeInfo.ResponseText.WriteString(*claudeResponse.Delta.Text)
|
|
|
|
|
|
}
|
2025-03-12 19:29:15 +08:00
|
|
|
|
} else if claudeResponse.Type == "message_delta" {
|
|
|
|
|
|
claudeInfo.Usage.CompletionTokens = claudeResponse.Usage.OutputTokens
|
2025-03-14 17:00:39 +08:00
|
|
|
|
if claudeResponse.Usage.InputTokens > 0 {
|
|
|
|
|
|
claudeInfo.Usage.PromptTokens = claudeResponse.Usage.InputTokens
|
|
|
|
|
|
}
|
|
|
|
|
|
claudeInfo.Usage.TotalTokens = claudeInfo.Usage.PromptTokens + claudeResponse.Usage.OutputTokens
|
2025-03-12 19:29:15 +08:00
|
|
|
|
} else if claudeResponse.Type == "content_block_start" {
|
|
|
|
|
|
} else {
|
|
|
|
|
|
return false
|
|
|
|
|
|
}
|
|
|
|
|
|
}
|
2025-03-12 19:46:08 +08:00
|
|
|
|
if oaiResponse != nil {
|
|
|
|
|
|
oaiResponse.Id = claudeInfo.ResponseId
|
|
|
|
|
|
oaiResponse.Created = claudeInfo.Created
|
|
|
|
|
|
oaiResponse.Model = claudeInfo.Model
|
|
|
|
|
|
}
|
2025-03-12 19:29:15 +08:00
|
|
|
|
return true
|
|
|
|
|
|
}
|
|
|
|
|
|
|
2024-08-27 20:19:51 +08:00
|
|
|
|
func ClaudeStreamHandler(c *gin.Context, resp *http.Response, info *relaycommon.RelayInfo, requestMode int) (*dto.OpenAIErrorWithStatusCode, *dto.Usage) {
|
2025-03-12 21:31:46 +08:00
|
|
|
|
|
|
|
|
|
|
if info.RelayFormat == relaycommon.RelayFormatOpenAI {
|
|
|
|
|
|
return toOpenAIStreamHandler(c, resp, info, requestMode)
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
usage := &dto.Usage{}
|
|
|
|
|
|
responseText := strings.Builder{}
|
|
|
|
|
|
|
|
|
|
|
|
helper.StreamScannerHandler(c, resp, info, func(data string) bool {
|
|
|
|
|
|
var claudeResponse dto.ClaudeResponse
|
|
|
|
|
|
err := json.NewDecoder(bytes.NewReader(common.StringToByteSlice(data))).Decode(&claudeResponse)
|
|
|
|
|
|
if err != nil {
|
|
|
|
|
|
common.SysError("error unmarshalling stream response: " + err.Error())
|
|
|
|
|
|
return true
|
|
|
|
|
|
}
|
|
|
|
|
|
if requestMode == RequestModeCompletion {
|
|
|
|
|
|
responseText.WriteString(claudeResponse.Completion)
|
|
|
|
|
|
} else {
|
|
|
|
|
|
if claudeResponse.Type == "message_start" {
|
|
|
|
|
|
// message_start, 获取usage
|
|
|
|
|
|
info.UpstreamModelName = claudeResponse.Message.Model
|
|
|
|
|
|
usage.PromptTokens = claudeResponse.Message.Usage.InputTokens
|
|
|
|
|
|
usage.PromptTokensDetails.CachedTokens = claudeResponse.Message.Usage.CacheReadInputTokens
|
|
|
|
|
|
usage.PromptTokensDetails.CachedCreationTokens = claudeResponse.Message.Usage.CacheCreationInputTokens
|
|
|
|
|
|
usage.CompletionTokens = claudeResponse.Message.Usage.OutputTokens
|
|
|
|
|
|
} else if claudeResponse.Type == "content_block_delta" {
|
|
|
|
|
|
responseText.WriteString(claudeResponse.Delta.GetText())
|
|
|
|
|
|
} else if claudeResponse.Type == "message_delta" {
|
|
|
|
|
|
if claudeResponse.Usage.InputTokens > 0 {
|
|
|
|
|
|
// 不叠加,只取最新的
|
|
|
|
|
|
usage.PromptTokens = claudeResponse.Usage.InputTokens
|
|
|
|
|
|
}
|
|
|
|
|
|
usage.CompletionTokens = claudeResponse.Usage.OutputTokens
|
|
|
|
|
|
usage.TotalTokens = usage.PromptTokens + usage.CompletionTokens
|
|
|
|
|
|
}
|
|
|
|
|
|
}
|
|
|
|
|
|
helper.ClaudeChunkData(c, claudeResponse, data)
|
|
|
|
|
|
return true
|
|
|
|
|
|
})
|
|
|
|
|
|
|
|
|
|
|
|
if requestMode == RequestModeCompletion {
|
|
|
|
|
|
usage, _ = service.ResponseText2Usage(responseText.String(), info.UpstreamModelName, info.PromptTokens)
|
|
|
|
|
|
} else {
|
|
|
|
|
|
// 说明流模式建立失败,可能为官方出错
|
|
|
|
|
|
if usage.PromptTokens == 0 {
|
|
|
|
|
|
//usage.PromptTokens = info.PromptTokens
|
|
|
|
|
|
}
|
|
|
|
|
|
if usage.CompletionTokens == 0 {
|
|
|
|
|
|
usage, _ = service.ResponseText2Usage(responseText.String(), info.UpstreamModelName, usage.PromptTokens)
|
|
|
|
|
|
}
|
|
|
|
|
|
}
|
|
|
|
|
|
return nil, usage
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
func toOpenAIStreamHandler(c *gin.Context, resp *http.Response, info *relaycommon.RelayInfo, requestMode int) (*dto.OpenAIErrorWithStatusCode, *dto.Usage) {
|
2023-07-22 17:36:40 +08:00
|
|
|
|
responseId := fmt.Sprintf("chatcmpl-%s", common.GetUUID())
|
2025-03-12 19:29:15 +08:00
|
|
|
|
claudeInfo := &ClaudeResponseInfo{
|
|
|
|
|
|
ResponseId: responseId,
|
|
|
|
|
|
Created: common.GetTimestamp(),
|
|
|
|
|
|
Model: info.UpstreamModelName,
|
|
|
|
|
|
ResponseText: strings.Builder{},
|
|
|
|
|
|
Usage: &dto.Usage{},
|
|
|
|
|
|
}
|
2024-07-19 01:07:37 +08:00
|
|
|
|
|
2025-03-05 19:47:41 +08:00
|
|
|
|
helper.StreamScannerHandler(c, resp, info, func(data string) bool {
|
2025-03-12 21:31:46 +08:00
|
|
|
|
var claudeResponse dto.ClaudeResponse
|
2025-03-12 19:29:15 +08:00
|
|
|
|
err := json.NewDecoder(bytes.NewReader(common.StringToByteSlice(data))).Decode(&claudeResponse)
|
2024-07-19 01:07:37 +08:00
|
|
|
|
if err != nil {
|
|
|
|
|
|
common.SysError("error unmarshalling stream response: " + err.Error())
|
2025-03-05 19:47:41 +08:00
|
|
|
|
return true
|
2023-07-22 17:36:40 +08:00
|
|
|
|
}
|
2024-07-19 01:07:37 +08:00
|
|
|
|
|
2025-03-12 19:29:15 +08:00
|
|
|
|
response := StreamResponseClaude2OpenAI(requestMode, &claudeResponse)
|
|
|
|
|
|
|
|
|
|
|
|
if !FormatClaudeResponseInfo(requestMode, &claudeResponse, response, claudeInfo) {
|
2025-03-05 19:47:41 +08:00
|
|
|
|
return true
|
2023-07-22 17:36:40 +08:00
|
|
|
|
}
|
2024-03-08 19:43:33 +08:00
|
|
|
|
|
2025-03-05 19:47:41 +08:00
|
|
|
|
err = helper.ObjectData(c, response)
|
2024-07-19 01:07:37 +08:00
|
|
|
|
if err != nil {
|
|
|
|
|
|
common.LogError(c, "send_stream_response_failed: "+err.Error())
|
2023-07-22 17:36:40 +08:00
|
|
|
|
}
|
2025-03-05 19:47:41 +08:00
|
|
|
|
return true
|
|
|
|
|
|
})
|
2024-07-19 01:07:37 +08:00
|
|
|
|
|
2024-03-08 19:43:33 +08:00
|
|
|
|
if requestMode == RequestModeCompletion {
|
2025-03-12 19:29:15 +08:00
|
|
|
|
claudeInfo.Usage, _ = service.ResponseText2Usage(claudeInfo.ResponseText.String(), info.UpstreamModelName, info.PromptTokens)
|
2024-03-09 13:25:47 +08:00
|
|
|
|
} else {
|
2025-03-12 19:29:15 +08:00
|
|
|
|
if claudeInfo.Usage.PromptTokens == 0 {
|
|
|
|
|
|
//上游出错
|
2024-06-15 01:30:51 +08:00
|
|
|
|
}
|
2025-03-12 19:29:15 +08:00
|
|
|
|
if claudeInfo.Usage.CompletionTokens == 0 {
|
|
|
|
|
|
claudeInfo.Usage, _ = service.ResponseText2Usage(claudeInfo.ResponseText.String(), info.UpstreamModelName, claudeInfo.Usage.PromptTokens)
|
2024-03-09 13:25:47 +08:00
|
|
|
|
}
|
2023-07-22 17:36:40 +08:00
|
|
|
|
}
|
2024-07-08 02:00:39 +08:00
|
|
|
|
if info.ShouldIncludeUsage {
|
2025-03-12 19:29:15 +08:00
|
|
|
|
response := helper.GenerateFinalUsageResponse(responseId, claudeInfo.Created, info.UpstreamModelName, *claudeInfo.Usage)
|
2025-03-05 19:47:41 +08:00
|
|
|
|
err := helper.ObjectData(c, response)
|
2024-07-08 02:00:39 +08:00
|
|
|
|
if err != nil {
|
|
|
|
|
|
common.SysError("send final response failed: " + err.Error())
|
|
|
|
|
|
}
|
2024-07-08 01:45:43 +08:00
|
|
|
|
}
|
2025-03-05 19:47:41 +08:00
|
|
|
|
helper.Done(c)
|
2025-03-12 19:29:15 +08:00
|
|
|
|
return nil, claudeInfo.Usage
|
2023-07-22 17:36:40 +08:00
|
|
|
|
}
|
|
|
|
|
|
|
2024-08-27 20:19:51 +08:00
|
|
|
|
func ClaudeHandler(c *gin.Context, resp *http.Response, requestMode int, info *relaycommon.RelayInfo) (*dto.OpenAIErrorWithStatusCode, *dto.Usage) {
|
2023-07-22 17:36:40 +08:00
|
|
|
|
responseBody, err := io.ReadAll(resp.Body)
|
|
|
|
|
|
if err != nil {
|
2024-02-29 01:08:18 +08:00
|
|
|
|
return service.OpenAIErrorWrapper(err, "read_response_body_failed", http.StatusInternalServerError), nil
|
2023-07-22 17:36:40 +08:00
|
|
|
|
}
|
|
|
|
|
|
err = resp.Body.Close()
|
|
|
|
|
|
if err != nil {
|
2024-02-29 01:08:18 +08:00
|
|
|
|
return service.OpenAIErrorWrapper(err, "close_response_body_failed", http.StatusInternalServerError), nil
|
2023-07-22 17:36:40 +08:00
|
|
|
|
}
|
2025-03-14 17:48:26 +08:00
|
|
|
|
if common.DebugEnabled {
|
|
|
|
|
|
println("responseBody: ", string(responseBody))
|
|
|
|
|
|
}
|
2025-03-12 21:31:46 +08:00
|
|
|
|
var claudeResponse dto.ClaudeResponse
|
2023-07-22 17:36:40 +08:00
|
|
|
|
err = json.Unmarshal(responseBody, &claudeResponse)
|
|
|
|
|
|
if err != nil {
|
2024-02-29 01:08:18 +08:00
|
|
|
|
return service.OpenAIErrorWrapper(err, "unmarshal_response_body_failed", http.StatusInternalServerError), nil
|
2023-07-22 17:36:40 +08:00
|
|
|
|
}
|
|
|
|
|
|
if claudeResponse.Error.Type != "" {
|
2024-02-29 01:08:18 +08:00
|
|
|
|
return &dto.OpenAIErrorWithStatusCode{
|
2024-03-06 17:41:55 +08:00
|
|
|
|
Error: dto.OpenAIError{
|
2023-07-22 17:36:40 +08:00
|
|
|
|
Message: claudeResponse.Error.Message,
|
|
|
|
|
|
Type: claudeResponse.Error.Type,
|
|
|
|
|
|
Param: "",
|
|
|
|
|
|
Code: claudeResponse.Error.Type,
|
|
|
|
|
|
},
|
|
|
|
|
|
StatusCode: resp.StatusCode,
|
|
|
|
|
|
}, nil
|
|
|
|
|
|
}
|
2024-03-08 18:25:57 +08:00
|
|
|
|
usage := dto.Usage{}
|
|
|
|
|
|
if requestMode == RequestModeCompletion {
|
2025-03-12 21:31:46 +08:00
|
|
|
|
completionTokens, err := service.CountTextToken(claudeResponse.Completion, info.OriginModelName)
|
|
|
|
|
|
if err != nil {
|
|
|
|
|
|
return service.OpenAIErrorWrapper(err, "count_token_text_failed", http.StatusInternalServerError), nil
|
|
|
|
|
|
}
|
2024-08-27 20:19:51 +08:00
|
|
|
|
usage.PromptTokens = info.PromptTokens
|
2024-03-08 18:25:57 +08:00
|
|
|
|
usage.CompletionTokens = completionTokens
|
2024-08-27 20:19:51 +08:00
|
|
|
|
usage.TotalTokens = info.PromptTokens + completionTokens
|
2024-03-08 18:25:57 +08:00
|
|
|
|
} else {
|
|
|
|
|
|
usage.PromptTokens = claudeResponse.Usage.InputTokens
|
|
|
|
|
|
usage.CompletionTokens = claudeResponse.Usage.OutputTokens
|
|
|
|
|
|
usage.TotalTokens = claudeResponse.Usage.InputTokens + claudeResponse.Usage.OutputTokens
|
2025-03-12 21:31:46 +08:00
|
|
|
|
usage.PromptTokensDetails.CachedTokens = claudeResponse.Usage.CacheReadInputTokens
|
|
|
|
|
|
usage.PromptTokensDetails.CachedCreationTokens = claudeResponse.Usage.CacheCreationInputTokens
|
2023-07-22 17:36:40 +08:00
|
|
|
|
}
|
2025-03-12 21:31:46 +08:00
|
|
|
|
var responseData []byte
|
|
|
|
|
|
switch info.RelayFormat {
|
|
|
|
|
|
case relaycommon.RelayFormatOpenAI:
|
|
|
|
|
|
openaiResponse := ResponseClaude2OpenAI(requestMode, &claudeResponse)
|
|
|
|
|
|
openaiResponse.Usage = usage
|
|
|
|
|
|
responseData, err = json.Marshal(openaiResponse)
|
|
|
|
|
|
if err != nil {
|
|
|
|
|
|
return service.OpenAIErrorWrapper(err, "marshal_response_body_failed", http.StatusInternalServerError), nil
|
|
|
|
|
|
}
|
|
|
|
|
|
case relaycommon.RelayFormatClaude:
|
|
|
|
|
|
responseData = responseBody
|
2023-07-22 17:36:40 +08:00
|
|
|
|
}
|
|
|
|
|
|
c.Writer.Header().Set("Content-Type", "application/json")
|
|
|
|
|
|
c.Writer.WriteHeader(resp.StatusCode)
|
2025-03-12 21:31:46 +08:00
|
|
|
|
_, err = c.Writer.Write(responseData)
|
2023-07-22 17:36:40 +08:00
|
|
|
|
return nil, &usage
|
|
|
|
|
|
}
|