new-api/service/token_counter.go

package service

import (
	"encoding/json"
	"errors"
	"fmt"
	"github.com/tiktoken-go/tokenizer"
	"github.com/tiktoken-go/tokenizer/codec"
	"image"
	"log"
	"math"
	"one-api/common"
	"one-api/constant"
	"one-api/dto"
	relaycommon "one-api/relay/common"
	"strings"
	"sync"
	"unicode/utf8"
)

// defaultTokenEncoder is the fallback encoder. It is assigned by
// InitTokenEncoders and used by getTokenEncoder when no model-specific
// encoder can be resolved.
var defaultTokenEncoder tokenizer.Codec

// tokenEncoderMap caches one encoder per model name. Entries are added lazily
// by getTokenEncoder the first time a model is requested.
var tokenEncoderMap = make(map[string]tokenizer.Codec)

// tokenEncoderMutex protects tokenEncoderMap for concurrent access
var tokenEncoderMutex sync.RWMutex

// InitTokenEncoders assigns the Cl100kBase codec to defaultTokenEncoder,
// writing a system log line before and after the assignment.
func InitTokenEncoders() {
	const (
		startMsg = "initializing token encoders"
		doneMsg  = "token encoders initialized"
	)
	common.SysLog(startMsg)
	defaultTokenEncoder = codec.NewCl100kBase()
	common.SysLog(doneMsg)
}

// getTokenEncoder returns the encoder for model, resolving and caching it on
// first use. When the tokenizer library does not recognise the model, the
// default encoder is cached under that name instead, so the failing lookup is
// not repeated on later calls.
func getTokenEncoder(model string) tokenizer.Codec {
	// Fast path: consult the cache under the shared read lock.
	tokenEncoderMutex.RLock()
	cached, ok := tokenEncoderMap[model]
	tokenEncoderMutex.RUnlock()
	if ok {
		return cached
	}

	// Slow path: take the write lock for the rest of the function.
	tokenEncoderMutex.Lock()
	defer tokenEncoderMutex.Unlock()

	// Another goroutine may have filled the entry between the two locks.
	if cached, ok = tokenEncoderMap[model]; ok {
		return cached
	}

	resolved, err := tokenizer.ForModel(tokenizer.Model(model))
	if err != nil {
		// Unknown model: fall back to the default encoder.
		resolved = defaultTokenEncoder
	}
	tokenEncoderMap[model] = resolved
	return resolved
}

// getTokenNum returns how many token ids tokenEncoder produces for text.
// An empty text short-circuits to 0 without calling the encoder. Only the
// first result of Encode is used; the remaining results (including any error)
// are deliberately discarded, so a failed encode is reported as however many
// ids were returned.
func getTokenNum(tokenEncoder tokenizer.Codec, text string) int {
	if len(text) == 0 {
		return 0
	}
	tokenIDs, _, _ := tokenEncoder.Encode(text)
	return len(tokenIDs)
}

// getImageToken estimates the number of prompt tokens to bill for one image
// part of a chat message.
//
// Fixed results are returned, in this order of precedence, for: the "glm-4v"
// model (1047), detail "low" (base tokens), non-stream requests when
// constant.GetMediaTokenNotStream is off, media counting being disabled via
// constant.GetMediaToken, and Gemini / Vertex AI / Anthropic channels (each
// 3x base tokens). Otherwise the image is decoded and billed per 512px tile
// after the shorter side is capped at 768px.
//
// Side effects: imageUrl.Detail is rewritten to "high" when it was "auto" or
// empty, and imageUrl.MimeType is set to the decoded format.
//
// An error is returned when imageUrl is nil, when decoding fails, or when the
// decoded dimensions are zero and the payload is not recognised as a file.
func getImageToken(info *relaycommon.RelayInfo, imageUrl *dto.MessageImageUrl, model string, stream bool) (int, error) {
	if imageUrl == nil {
		return 0, fmt.Errorf("image_url_is_nil")
	}

	baseTokens := 85
	switch {
	case model == "glm-4v":
		return 1047, nil
	case imageUrl.Detail == "low":
		return baseTokens, nil
	case !(constant.GetMediaTokenNotStream || stream):
		return 3 * baseTokens, nil
	}

	// Keep in step with One API's image billing: "auto" and unspecified
	// detail are both treated as "high".
	switch imageUrl.Detail {
	case "auto", "":
		imageUrl.Detail = "high"
	}

	tileTokens := 170
	if strings.HasPrefix(model, "gpt-4o-mini") {
		tileTokens, baseTokens = 5667, 2833
	}

	// Whether image tokens are measured at all.
	if !constant.GetMediaToken {
		return 3 * baseTokens, nil
	}
	channel := info.ChannelType
	if channel == common.ChannelTypeGemini || channel == common.ChannelTypeVertexAi || channel == common.ChannelTypeAnthropic {
		return 3 * baseTokens, nil
	}

	var (
		cfg     image.Config
		mime    string
		payload string
		err     error
	)
	if strings.HasPrefix(imageUrl.Url, "http") {
		cfg, mime, err = DecodeUrlImageData(imageUrl.Url)
	} else {
		common.SysLog("decoding image")
		cfg, mime, payload, err = DecodeBase64ImageData(imageUrl.Url)
	}
	if err != nil {
		return 0, err
	}
	imageUrl.MimeType = mime

	if cfg.Width == 0 || cfg.Height == 0 {
		// Not an image. A base64 payload with a known format is treated as a
		// generic file and billed at the flat rate.
		if mime != "" && payload != "" {
			return 3 * baseTokens, nil
		}
		return 0, fmt.Errorf("fail to decode base64 config: %s", imageUrl.Url)
	}

	log.Printf("format: %s, width: %d, height: %d", mime, cfg.Width, cfg.Height)
	shortSide, otherSide := cfg.Width, cfg.Height
	if cfg.Height < cfg.Width {
		shortSide, otherSide = cfg.Height, cfg.Width
	}

	// Scale factor: if the shorter side exceeds 768 it is reduced to 768.
	scale := 1.0
	if shortSide > 768 {
		scale = float64(shortSide) / 768
		shortSide = 768
	}
	// Shrink the other side by the same factor, rounding up.
	otherSide = int(math.Ceil(float64(otherSide) / scale))
	log.Printf("shortSide: %d, otherSide: %d, scale: %f", shortSide, otherSide, scale)

	// Tiles per side = side length / 512, rounded up.
	tilesShort := (shortSide + 511) / 512
	tilesOther := (otherSide + 511) / 512
	tiles := tilesShort * tilesOther
	log.Printf("tiles: %d", tiles)
	return tiles*tileTokens + baseTokens, nil
}

// CountTokenChatRequest returns the estimated prompt token count of an
// OpenAI-style chat request: the tokens of all messages plus, when tools are
// supplied, the tokens of every tool definition and a fixed 8-token overhead.
//
// For each tool the function name, description and the "%v" rendering of its
// parameters are concatenated, and the combined text of all tools is tokenized
// once. Any error from message or tool counting is returned with a zero count.
func CountTokenChatRequest(info *relaycommon.RelayInfo, request dto.GeneralOpenAIRequest) (int, error) {
	msgTokens, err := CountTokenMessages(info, request.Messages, request.Model, request.Stream)
	if err != nil {
		return 0, err
	}
	tkm := msgTokens

	if request.Tools != nil {
		// Accumulate across ALL tools. The previous code reassigned the buffer
		// on every iteration, so only the last tool was ever counted.
		var toolText strings.Builder
		for _, tool := range request.Tools {
			toolText.WriteString(tool.Function.Name)
			toolText.WriteString(tool.Function.Description)
			if tool.Function.Parameters != nil {
				fmt.Fprintf(&toolText, "%v", tool.Function.Parameters)
			}
		}
		toolTokens, err := CountTokenInput(toolText.String(), request.Model)
		if err != nil {
			return 0, err
		}
		tkm += 8
		tkm += toolTokens
	}

	return tkm, nil
}

// CountTokenClaudeRequest returns the estimated prompt token count of a
// Claude request: message tokens, plus system prompt tokens when System is
// not the empty string, plus tool definition tokens when a non-empty tool
// list is present.
//
// request.Tools, when non-nil, must be a list ([]any); any other shape is
// rejected with an error. Errors from parsing or counting the tools are
// wrapped with a "tools:" prefix and carry the underlying cause.
func CountTokenClaudeRequest(request dto.ClaudeRequest, model string) (int, error) {
	tkm := 0

	// Count tokens in messages
	msgTokens, err := CountTokenClaudeMessages(request.Messages, model, request.Stream)
	if err != nil {
		return 0, err
	}
	tkm += msgTokens

	// Count tokens in system message
	if request.System != "" {
		systemTokens, err := CountTokenInput(request.System, model)
		if err != nil {
			return 0, err
		}
		tkm += systemTokens
	}

	if request.Tools != nil {
		tools, ok := request.Tools.([]any)
		if !ok {
			return 0, errors.New("tools: Input should be a valid list")
		}
		if len(tools) > 0 {
			// Report the error produced by each step. The previous code
			// formatted the outer err, which is always nil at this point.
			parsedTools, err := common.Any2Type[[]dto.Tool](request.Tools)
			if err != nil {
				return 0, fmt.Errorf("tools: Input should be a valid list: %w", err)
			}
			toolTokens, err := CountTokenClaudeTools(parsedTools, model)
			if err != nil {
				return 0, fmt.Errorf("tools: %w", err)
			}
			tkm += toolTokens
		}
	}

	return tkm, nil
}

// CountTokenClaudeMessages estimates the token count of a list of Claude
// messages using the encoder resolved for model.
//
// Every message contributes its role, its content and a fixed allowance of 2
// tokens for formatting (an assumption that may need tuning against Claude's
// real framing). Structured content is counted per part: text is tokenized,
// each image is a flat 1000, tool_use counts the tool name plus its
// JSON-encoded input, and tool_result counts its JSON-encoded content. Parts
// of any other type add nothing. The stream argument is currently unused.
//
// An error is returned only when a message's content cannot be parsed.
func CountTokenClaudeMessages(messages []dto.ClaudeMessage, model string, stream bool) (int, error) {
	enc := getTokenEncoder(model)

	// Start from the per-message formatting allowance.
	total := len(messages) * 2

	for _, msg := range messages {
		total += getTokenNum(enc, msg.Role)

		if msg.IsStringContent() {
			total += getTokenNum(enc, msg.GetStringContent())
			continue
		}

		parts, err := msg.ParseContent()
		if err != nil {
			return 0, err
		}
		for _, part := range parts {
			switch {
			case part.Type == "text":
				total += getTokenNum(enc, part.GetText())
			case part.Type == "image":
				// Flat estimate; no per-image size calculation is done here.
				total += 1000
			case part.Type == "tool_use" && part.Input != nil:
				total += getTokenNum(enc, part.Name)
				// Marshal errors are ignored: a failed encode counts as empty.
				encodedInput, _ := json.Marshal(part.Input)
				total += getTokenNum(enc, string(encodedInput))
			case part.Type == "tool_result" && part.Content != nil:
				encodedContent, _ := json.Marshal(part.Content)
				total += getTokenNum(enc, string(encodedContent))
			}
		}
	}

	return total, nil
}

// CountTokenClaudeTools estimates the token count of Claude tool definitions.
// Each tool contributes its name, its description, its JSON-encoded input
// schema and a fixed allowance of 3 tokens for formatting (an assumption that
// may need tuning against Claude's real framing).
//
// An error is returned when a tool's input schema cannot be marshalled.
func CountTokenClaudeTools(tools []dto.Tool, model string) (int, error) {
	enc := getTokenEncoder(model)

	// Start from the per-tool formatting allowance.
	total := len(tools) * 3

	for _, t := range tools {
		schema, err := json.Marshal(t.InputSchema)
		if err != nil {
			return 0, fmt.Errorf("marshal_tool_schema_fail: %s", err.Error())
		}
		total += getTokenNum(enc, t.Name) +
			getTokenNum(enc, t.Description) +
			getTokenNum(enc, string(schema))
	}

	return total, nil
}

// CountTokenRealtime returns the (text, audio) token counts attributable to a
// single realtime event. Which fields are inspected depends on request.Type:
//
//   - session update: the session instructions (text)
//   - response audio delta: request.Delta decoded as output audio
//   - audio transcription / function call arguments delta: request.Delta (text)
//   - input audio buffer append: request.Audio decoded as input audio
//   - conversation item created: every "input_text" part of a "message" item
//   - response done: unless info.IsFirstRequest is set, each entry of
//     info.RealtimeTools plus 8 tokens per entry (text)
//
// Any other event type yields (0, 0, nil). On error both counts are zero.
func CountTokenRealtime(info *relaycommon.RelayInfo, request dto.RealtimeEvent, model string) (int, int, error) {
	var textToken, audioToken int

	switch request.Type {
	case dto.RealtimeEventTypeSessionUpdate:
		if request.Session != nil {
			n, err := CountTextToken(request.Session.Instructions, model)
			if err != nil {
				return 0, 0, err
			}
			textToken += n
		}

	case dto.RealtimeEventResponseAudioDelta:
		n, err := CountAudioTokenOutput(request.Delta, info.OutputAudioFormat)
		if err != nil {
			return 0, 0, fmt.Errorf("error counting audio token: %v", err)
		}
		audioToken += n

	case dto.RealtimeEventResponseAudioTranscriptionDelta, dto.RealtimeEventResponseFunctionCallArgumentsDelta:
		n, err := CountTextToken(request.Delta, model)
		if err != nil {
			return 0, 0, fmt.Errorf("error counting text token: %v", err)
		}
		textToken += n

	case dto.RealtimeEventInputAudioBufferAppend:
		n, err := CountAudioTokenInput(request.Audio, info.InputAudioFormat)
		if err != nil {
			return 0, 0, fmt.Errorf("error counting audio token: %v", err)
		}
		audioToken += n

	case dto.RealtimeEventConversationItemCreated:
		// Only "message" items carry countable text.
		if request.Item == nil || request.Item.Type != "message" {
			break
		}
		for _, part := range request.Item.Content {
			if part.Type != "input_text" {
				continue
			}
			n, err := CountTextToken(part.Text, model)
			if err != nil {
				return 0, 0, err
			}
			textToken += n
		}

	case dto.RealtimeEventTypeResponseDone:
		// Tool definitions are skipped while this is the first request.
		if info.IsFirstRequest {
			break
		}
		for _, tool := range info.RealtimeTools {
			n, err := CountTokenInput(tool, model)
			if err != nil {
				return 0, 0, err
			}
			textToken += 8 + n
		}
	}

	return textToken, audioToken, nil
}

// CountTokenMessages estimates the prompt token count of OpenAI-style chat
// messages, following the scheme described in:
//
//	https://github.com/openai/openai-cookbook/blob/main/examples/How_to_count_tokens_with_tiktoken.ipynb
//	https://github.com/pkoukk/tiktoken-go/issues/6
//
// Every message follows <|start|>{role/name}\n{content}<|end|>\n, so each one
// costs a fixed overhead plus its role. When the message has content, its
// name (if set) and every content part are added: images via getImageToken,
// input audio as a flat 100, files and videos as a flat 5000 each, and any
// other part by tokenizing its text. A final 3 tokens account for the reply
// being primed with <|start|>assistant<|message|>.
//
// An error is returned only when an image part cannot be counted.
func CountTokenMessages(info *relaycommon.RelayInfo, messages []dto.Message, model string, stream bool) (int, error) {
	enc := getTokenEncoder(model)

	tokensPerMessage, tokensPerName := 3, 1
	if model == "gpt-3.5-turbo-0301" {
		// If there's a name, the role is omitted, hence the negative value.
		tokensPerMessage, tokensPerName = 4, -1
	}

	// Start from the reply-priming overhead.
	total := 3

	for _, msg := range messages {
		total += tokensPerMessage + getTokenNum(enc, msg.Role)
		if msg.Content == nil {
			continue
		}
		if msg.Name != nil {
			total += tokensPerName + getTokenNum(enc, *msg.Name)
		}

		for _, part := range msg.ParseContent() {
			switch part.Type {
			case dto.ContentTypeImageURL:
				imageTokens, err := getImageToken(info, part.GetImageMedia(), model, stream)
				if err != nil {
					return 0, err
				}
				total += imageTokens
				log.Printf("image token num: %d", imageTokens)
			case dto.ContentTypeInputAudio:
				// TODO: compute the real audio token count.
				total += 100
			case dto.ContentTypeFile, dto.ContentTypeVideoUrl:
				total += 5000
			default:
				total += getTokenNum(enc, part.Text)
			}
		}
	}

	return total, nil
}

// CountTokenInput flattens input to a single string and returns its token
// count for model. Strings are used as-is; []string elements are concatenated
// with no separator; []interface{} elements are rendered with "%v" and
// concatenated; any other value is rendered as a whole with "%v".
func CountTokenInput(input any, model string) (int, error) {
	var text string
	switch v := input.(type) {
	case string:
		text = v
	case []string:
		text = strings.Join(v, "")
	case []interface{}:
		var b strings.Builder
		for _, item := range v {
			fmt.Fprintf(&b, "%v", item)
		}
		text = b.String()
	default:
		text = fmt.Sprintf("%v", input)
	}
	return CountTextToken(text, model)
}

// CountTokenStreamChoices sums the token counts of a batch of streamed
// choices: for each choice, the delta's content string plus the function name
// and arguments of every tool call in the delta. Counting errors are ignored
// and contribute whatever count was returned alongside them.
func CountTokenStreamChoices(messages []dto.ChatCompletionsStreamResponseChoice, model string) int {
	total := 0
	add := func(piece any) {
		n, _ := CountTokenInput(piece, model)
		total += n
	}

	for _, choice := range messages {
		add(choice.Delta.GetContentString())
		for _, call := range choice.Delta.ToolCalls {
			add(call.Function.Name)
			add(call.Function.Arguments)
		}
	}
	return total
}

// CountTTSToken returns the billable size of a text-to-speech input. Models
// whose name starts with "tts" are measured in runes (Unicode code points);
// every other model is measured in tokens via CountTextToken.
func CountTTSToken(text string, model string) (int, error) {
	if !strings.HasPrefix(model, "tts") {
		return CountTextToken(text, model)
	}
	return utf8.RuneCountInString(text), nil
}

// CountAudioTokenInput converts base64-encoded input audio into a token count
// derived from the duration reported by parseAudio. Empty audio is 0 tokens.
// The conversion is duration / 60 * 100 / 0.06, truncated to an int.
// NOTE(review): the duration is presumably in seconds and the constants look
// like a price-derived ratio; confirm against parseAudio and the pricing table.
func CountAudioTokenInput(audioBase64 string, audioFormat string) (int, error) {
	if len(audioBase64) == 0 {
		return 0, nil
	}
	length, err := parseAudio(audioBase64, audioFormat)
	if err != nil {
		return 0, err
	}
	tokens := int(length / 60 * 100 / 0.06)
	return tokens, nil
}

// CountAudioTokenOutput converts base64-encoded output audio into a token
// count derived from the duration reported by parseAudio. Empty audio is 0
// tokens. The conversion is duration / 60 * 200 / 0.24, truncated to an int.
// NOTE(review): the duration is presumably in seconds and the constants look
// like a price-derived ratio; confirm against parseAudio and the pricing table.
func CountAudioTokenOutput(audioBase64 string, audioFormat string) (int, error) {
	if len(audioBase64) == 0 {
		return 0, nil
	}
	length, err := parseAudio(audioBase64, audioFormat)
	if err != nil {
		return 0, err
	}
	tokens := int(length / 60 * 200 / 0.24)
	return tokens, nil
}

//func CountAudioToken(sec float64, audioType string) {
//	if audioType == "input" {
//
//	}
//}

// CountTextToken 统计文本的token数量，仅当文本包含敏感词，返回错误，同时返回token数量
func CountTextToken(text string, model string) (int, error) {
	var err error
	tokenEncoder := getTokenEncoder(model)
	return getTokenNum(tokenEncoder, text), err
}
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+								package service
-												fix: make the token number calculation more accurate (#101)

* Make token calculation more accurate.

* fix: make the token number calculation more accurate

---------

Co-authored-by: JustSong <songquanpeng@foxmail.com>
											
										
										
											2023-05-19 09:41:26 +08:00
 								import (
-												feat: claude relay

											
										
										
											2025-03-12 21:31:46 +08:00
+									"encoding/json"
-												fix image token calculate

											
										
										
											2023-11-17 20:32:11 +08:00
+									"errors"
-												fix: make the token number calculation more accurate (#101)

* Make token calculation more accurate.

* fix: make the token number calculation more accurate

---------

Co-authored-by: JustSong <songquanpeng@foxmail.com>
											
										
										
											2023-05-19 09:41:26 +08:00
+									"fmt"
-												🔧 fix(token_counter): update token encoder implementation and dependencies

											
										
										
											2025-06-10 18:04:49 +08:00
+									"github.com/tiktoken-go/tokenizer"
-												🔧 fix(token_counter): refactor token encoder initialization and retrieval logic

											
										
										
											2025-06-10 18:51:26 +08:00
+									"github.com/tiktoken-go/tokenizer/codec"
-												fix image token calculate

											
										
										
											2023-11-17 20:32:11 +08:00
+									"image"
 									"log"
 									"math"
-												fix: make the token number calculation more accurate (#101)

* Make token calculation more accurate.

* fix: make the token number calculation more accurate

---------

Co-authored-by: JustSong <songquanpeng@foxmail.com>
											
										
										
											2023-05-19 09:41:26 +08:00
+									"one-api/common"
-												feat: 媒体请求计费选项

											
										
										
											2024-07-18 17:04:19 +08:00
+									"one-api/constant"
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+									"one-api/dto"
-												feat: realtime

(cherry picked from commit d4966246e68dbdcdab45ec5c5141362834d74425)

											
										
										
											2024-10-06 14:13:41 +08:00
+									relaycommon "one-api/relay/common"
-												perf: lazy initialization for token encoders (close #566)

											
										
										
											2023-09-29 17:56:11 +08:00
+									"strings"
-												🔧 fix(token_counter): enhance token encoder caching and concurrency handling

											
										
										
											2025-06-10 18:55:21 +08:00
+									"sync"
-												support tts

											
										
										
											2023-11-15 21:05:14 +08:00
+									"unicode/utf8"
-												fix: make the token number calculation more accurate (#101)

* Make token calculation more accurate.

* fix: make the token number calculation more accurate

---------

Co-authored-by: JustSong <songquanpeng@foxmail.com>
											
										
										
											2023-05-19 09:41:26 +08:00
+								)
-												perf: lazy initialization for token encoders (close #566)

											
										
										
											2023-09-29 17:56:11 +08:00
+								// tokenEncoderMap won't grow after initialization
-												🔧 fix(token_counter): update token encoder implementation and dependencies

											
										
										
											2025-06-10 18:04:49 +08:00
+								var defaultTokenEncoder tokenizer.Codec
-												fix: make the token number calculation more accurate (#101)

* Make token calculation more accurate.

* fix: make the token number calculation more accurate

---------

Co-authored-by: JustSong <songquanpeng@foxmail.com>
											
										
										
											2023-05-19 09:41:26 +08:00
-												🔧 fix(token_counter): enhance token encoder caching and concurrency handling

											
										
										
											2025-06-10 18:55:21 +08:00
+								// tokenEncoderMap is used to store token encoders for different models
 								var tokenEncoderMap = make(map[string]tokenizer.Codec)
 								// tokenEncoderMutex protects tokenEncoderMap for concurrent access
 								var tokenEncoderMutex sync.RWMutex
-												perf: initialize all token encoder when starting (close #459, close $460)

											
										
										
											2023-08-26 13:02:02 +08:00
+								func InitTokenEncoders() {
 									common.SysLog("initializing token encoders")
-												🔧 fix(token_counter): refactor token encoder initialization and retrieval logic

											
										
										
											2025-06-10 18:51:26 +08:00
+									defaultTokenEncoder = codec.NewCl100kBase()
-												perf: initialize all token encoder when starting (close #459, close $460)

											
										
										
											2023-08-26 13:02:02 +08:00
+									common.SysLog("token encoders initialized")
 								}
-												🔧 fix(token_counter): update token encoder implementation and dependencies

											
										
										
											2025-06-10 18:04:49 +08:00
+								func getTokenEncoder(model string) tokenizer.Codec {
-												🔧 fix(token_counter): enhance token encoder caching and concurrency handling

											
										
										
											2025-06-10 18:55:21 +08:00
+									// First, try to get the encoder from cache with read lock
 									tokenEncoderMutex.RLock()
 									if encoder, exists := tokenEncoderMap[model]; exists {
 										tokenEncoderMutex.RUnlock()
 										return encoder
 									}
 									tokenEncoderMutex.RUnlock()
 									// If not in cache, create new encoder with write lock
 									tokenEncoderMutex.Lock()
 									defer tokenEncoderMutex.Unlock()
 									// Double-check if another goroutine already created the encoder
 									if encoder, exists := tokenEncoderMap[model]; exists {
 										return encoder
 									}
 									// Create new encoder
-												🔧 fix(token_counter): refactor token encoder initialization and retrieval logic

											
										
										
											2025-06-10 18:51:26 +08:00
+									modelCodec, err := tokenizer.ForModel(tokenizer.Model(model))
-												🔧 fix(token_counter): update token encoder implementation and dependencies

											
										
										
											2025-06-10 18:04:49 +08:00
+									if err != nil {
-												🔧 fix(token_counter): enhance token encoder caching and concurrency handling

											
										
										
											2025-06-10 18:55:21 +08:00
+										// Cache the default encoder for this model to avoid repeated failures
 										tokenEncoderMap[model] = defaultTokenEncoder
-												🔧 fix(token_counter): update token encoder implementation and dependencies

											
										
										
											2025-06-10 18:04:49 +08:00
+										return defaultTokenEncoder
-												fix: make the token number calculation more accurate (#101)

* Make token calculation more accurate.

* fix: make the token number calculation more accurate

---------

Co-authored-by: JustSong <songquanpeng@foxmail.com>
											
										
										
											2023-05-19 09:41:26 +08:00
+									}
-												🔧 fix(token_counter): enhance token encoder caching and concurrency handling

											
										
										
											2025-06-10 18:55:21 +08:00
 									// Cache the new encoder
 									tokenEncoderMap[model] = modelCodec
-												🔧 fix(token_counter): refactor token encoder initialization and retrieval logic

											
										
										
											2025-06-10 18:51:26 +08:00
+									return modelCodec
-												fix: make the token number calculation more accurate (#101)

* Make token calculation more accurate.

* fix: make the token number calculation more accurate

---------

Co-authored-by: JustSong <songquanpeng@foxmail.com>
											
										
										
											2023-05-19 09:41:26 +08:00
+								}
-												🔧 fix(token_counter): update token encoder implementation and dependencies

											
										
										
											2025-06-10 18:04:49 +08:00
+								func getTokenNum(tokenEncoder tokenizer.Codec, text string) int {
-												feat: Enhance token counting and content parsing for messages

											
										
										
											2025-02-24 14:18:15 +08:00
+									if text == "" {
 										return 0
 									}
-												🔧 fix(token_counter): update token encoder implementation and dependencies

											
										
										
											2025-06-10 18:04:49 +08:00
+									ids, _, _ := tokenEncoder.Encode(text)
 									return len(ids)
-												feat: able to approximate token (close #207)

											
										
										
											2023-07-04 19:54:13 +08:00
+								}
-												feat: add multi-file type support for Gemini and Claude

- Add file data DTO for structured file handling
- Implement file decoder service
- Update Claude and Gemini relay channels to handle various file types
- Reorganize worker service to cf_worker for clarity
- Update token counter and image service for new file types

											
										
										
											2024-12-29 00:00:24 +08:00
+								func getImageToken(info *relaycommon.RelayInfo, imageUrl *dto.MessageImageUrl, model string, stream bool) (int, error) {
-												feat: support dify upload image file

											
										
										
											2025-03-15 19:10:12 +08:00
+									if imageUrl == nil {
 										return 0, fmt.Errorf("image_url_is_nil")
 									}
-												feat: support gpt-4o-mini image tokens

											
										
										
											2024-07-19 12:59:37 +08:00
+									baseTokens := 85
-												chore: token counter

											
										
										
											2024-05-18 15:14:49 +08:00
+									if model == "glm-4v" {
 										return 1047, nil
 									}
-												feat: update token encoder

											
										
										
											2024-05-30 23:15:06 +08:00
+									if imageUrl.Detail == "low" {
-												feat: support gpt-4o-mini image tokens

											
										
										
											2024-07-19 12:59:37 +08:00
+										return baseTokens, nil
-												feat: update token encoder

											
										
										
											2024-05-30 23:15:06 +08:00
+									}
-												feat: 媒体请求计费选项

											
										
										
											2024-07-18 17:04:19 +08:00
+									if !constant.GetMediaTokenNotStream && !stream {
-												feat: support dify upload image file

											
										
										
											2025-03-15 19:10:12 +08:00
+										return 3 * baseTokens, nil
-												feat: 媒体请求计费选项

											
										
										
											2024-07-18 17:04:19 +08:00
+									}
-												feat: support dify upload image file

											
										
										
											2025-03-15 19:10:12 +08:00
-												feat: update tiktoken

											
										
										
											2024-05-30 21:39:58 +08:00
+									// 同步One API的图片计费逻辑
 									if imageUrl.Detail == "auto" || imageUrl.Detail == "" {
 										imageUrl.Detail = "high"
 									}
-												feat: support gpt-4o-mini image tokens

											
										
										
											2024-07-19 12:59:37 +08:00
 									tileTokens := 170
 									if strings.HasPrefix(model, "gpt-4o-mini") {
 										tileTokens = 5667
 										baseTokens = 2833
 									}
-												fix: retry prompt tokens

											
										
										
											2025-01-02 16:33:00 +08:00
+									// 是否统计图片token
 									if !constant.GetMediaToken {
 										return 3 * baseTokens, nil
 									}
 									if info.ChannelType == common.ChannelTypeGemini || info.ChannelType == common.ChannelTypeVertexAi || info.ChannelType == common.ChannelTypeAnthropic {
 										return 3 * baseTokens, nil
 									}
-												support base64 image

											
										
										
											2023-11-19 18:59:35 +08:00
+									var config image.Config
 									var err error
-												support gemini-pro-vision

											
										
										
											2023-12-27 16:32:54 +08:00
+									var format string
-												feat: enhance image decoding logic to handle base64 file types and improve error handling

											
										
										
											2025-05-15 14:51:33 +08:00
+									var b64str string
-												support base64 image

											
										
										
											2023-11-19 18:59:35 +08:00
+									if strings.HasPrefix(imageUrl.Url, "http") {
-												feat: 支持设置worker访问请求中的图片地址

											
										
										
											2024-05-28 17:59:53 +08:00
+										config, format, err = DecodeUrlImageData(imageUrl.Url)
-												support base64 image

											
										
										
											2023-11-19 18:59:35 +08:00
+									} else {
 										common.SysLog(fmt.Sprintf("decoding image"))
-												feat: enhance image decoding logic to handle base64 file types and improve error handling

											
										
										
											2025-05-15 14:51:33 +08:00
+										config, format, b64str, err = DecodeBase64ImageData(imageUrl.Url)
-												support base64 image

											
										
										
											2023-11-19 18:59:35 +08:00
+									}
-												fix image token calculate

											
										
										
											2023-11-17 20:32:11 +08:00
+									if err != nil {
 										return 0, err
 									}
-												feat: support dify upload image file

											
										
										
											2025-03-15 19:10:12 +08:00
+									imageUrl.MimeType = format
-												fix image token calculate

											
										
										
											2023-11-17 20:32:11 +08:00
 									if config.Width == 0 || config.Height == 0 {
-												feat: enhance image decoding logic to handle base64 file types and improve error handling

											
										
										
											2025-05-15 14:51:33 +08:00
+										// not an image
 										if format != "" && b64str != "" {
 											// file type
 											return 3 * baseTokens, nil
 										}
 										return 0, errors.New(fmt.Sprintf("fail to decode base64 config: %s", imageUrl.Url))
-												fix image token calculate

											
										
										
											2023-11-17 20:32:11 +08:00
+									}
 									shortSide := config.Width
 									otherSide := config.Height
-												support gemini-pro-vision

											
										
										
											2023-12-27 16:32:54 +08:00
+									log.Printf("format: %s, width: %d, height: %d", format, config.Width, config.Height)
-												fix image token calculate

											
										
										
											2023-11-17 20:32:11 +08:00
+									// 缩放倍数
 									scale := 1.0
 									if config.Height < shortSide {
 										shortSide = config.Height
 										otherSide = config.Width
 									}
 									// 将最小变的尺寸缩小到768以下，如果大于768，则缩放到768
 									if shortSide > 768 {
 										scale = float64(shortSide) / 768
 										shortSide = 768
 									}
 									// 将另一边按照相同的比例缩小，向上取整
 									otherSide = int(math.Ceil(float64(otherSide) / scale))
 									log.Printf("shortSide: %d, otherSide: %d, scale: %f", shortSide, otherSide, scale)
 									// 计算图片的token数量(边的长度除以512，向上取整)
 									tiles := (shortSide + 511) / 512 * ((otherSide + 511) / 512)
 									log.Printf("tiles: %d", tiles)
-												feat: support gpt-4o-mini image tokens

											
										
										
											2024-07-19 12:59:37 +08:00
+									return tiles*tileTokens + baseTokens, nil
-												fix image token calculate

											
										
										
											2023-11-17 20:32:11 +08:00
+								}
-												feat: add multi-file type support for Gemini and Claude

- Add file data DTO for structured file handling
- Implement file decoder service
- Update Claude and Gemini relay channels to handle various file types
- Reorganize worker service to cf_worker for clarity
- Update token counter and image service for new file types

											
										
										
											2024-12-29 00:00:24 +08:00
+								func CountTokenChatRequest(info *relaycommon.RelayInfo, request dto.GeneralOpenAIRequest) (int, error) {
-												feat: 完善函数计费

											
										
										
											2024-04-23 23:01:06 +08:00
+									tkm := 0
-												feat: add multi-file type support for Gemini and Claude

- Add file data DTO for structured file handling
- Implement file decoder service
- Update Claude and Gemini relay channels to handle various file types
- Reorganize worker service to cf_worker for clarity
- Update token counter and image service for new file types

											
										
										
											2024-12-29 00:00:24 +08:00
+									msgTokens, err := CountTokenMessages(info, request.Messages, request.Model, request.Stream)
-												feat: 完善函数计费

											
										
										
											2024-04-23 23:01:06 +08:00
+									if err != nil {
-												refactor: 重构敏感词

											
										
										
											2024-05-23 23:59:55 +08:00
+										return 0, err
-												feat: 完善函数计费

											
										
										
											2024-04-23 23:01:06 +08:00
+									}
 									tkm += msgTokens
 									if request.Tools != nil {
-												fix: gemini&claude tool call format #795 #766

											
										
										
											2025-02-26 23:56:10 +08:00
+										openaiTools := request.Tools
-												feat: 完善函数计费

											
										
										
											2024-04-23 23:01:06 +08:00
+										countStr := ""
 										for _, tool := range openaiTools {
 											countStr = tool.Function.Name
 											if tool.Function.Description != "" {
 												countStr += tool.Function.Description
 											}
 											if tool.Function.Parameters != nil {
 												countStr += fmt.Sprintf("%v", tool.Function.Parameters)
 											}
 										}
-												feat: add multi-file type support for Gemini and Claude

- Add file data DTO for structured file handling
- Implement file decoder service
- Update Claude and Gemini relay channels to handle various file types
- Reorganize worker service to cf_worker for clarity
- Update token counter and image service for new file types

											
										
										
											2024-12-29 00:00:24 +08:00
+										toolTokens, err := CountTokenInput(countStr, request.Model)
-												feat: 完善函数计费

											
										
										
											2024-04-23 23:01:06 +08:00
+										if err != nil {
-												refactor: 重构敏感词

											
										
										
											2024-05-23 23:59:55 +08:00
+											return 0, err
-												feat: 完善函数计费

											
										
										
											2024-04-23 23:01:06 +08:00
+										}
 										tkm += 8
 										tkm += toolTokens
 									}
-												refactor: 重构敏感词

											
										
										
											2024-05-23 23:59:55 +08:00
+									return tkm, nil
-												feat: 完善函数计费

											
										
										
											2024-04-23 23:01:06 +08:00
+								}
-												feat: claude relay

											
										
										
											2025-03-12 21:31:46 +08:00
+								func CountTokenClaudeRequest(request dto.ClaudeRequest, model string) (int, error) {
 									tkm := 0
 									// Count tokens in messages
 									msgTokens, err := CountTokenClaudeMessages(request.Messages, model, request.Stream)
 									if err != nil {
 										return 0, err
 									}
 									tkm += msgTokens
 									// Count tokens in system message
 									if request.System != "" {
 										systemTokens, err := CountTokenInput(request.System, model)
 										if err != nil {
 											return 0, err
 										}
 										tkm += systemTokens
 									}
 									if request.Tools != nil {
 										// check is array
 										if tools, ok := request.Tools.([]any); ok {
 											if len(tools) > 0 {
 												parsedTools, err1 := common.Any2Type[[]dto.Tool](request.Tools)
 												if err1 != nil {
 													return 0, fmt.Errorf("tools: Input should be a valid list: %v", err)
 												}
 												toolTokens, err2 := CountTokenClaudeTools(parsedTools, model)
 												if err2 != nil {
 													return 0, fmt.Errorf("tools: %v", err)
 												}
 												tkm += toolTokens
 											}
 										} else {
 											return 0, errors.New("tools: Input should be a valid list")
 										}
 									}
 									return tkm, nil
 								}
 								func CountTokenClaudeMessages(messages []dto.ClaudeMessage, model string, stream bool) (int, error) {
 									tokenEncoder := getTokenEncoder(model)
 									tokenNum := 0
 									for _, message := range messages {
 										// Count tokens for role
 										tokenNum += getTokenNum(tokenEncoder, message.Role)
 										if message.IsStringContent() {
 											tokenNum += getTokenNum(tokenEncoder, message.GetStringContent())
 										} else {
 											content, err := message.ParseContent()
 											if err != nil {
 												return 0, err
 											}
 											for _, mediaMessage := range content {
 												switch mediaMessage.Type {
 												case "text":
 													tokenNum += getTokenNum(tokenEncoder, mediaMessage.GetText())
 												case "image":
 													//imageTokenNum, err := getClaudeImageToken(mediaMsg.Source, model, stream)
 													//if err != nil {
 													//	return 0, err
 													//}
 													tokenNum += 1000
 												case "tool_use":
-												refactor: message content 改成 any

refactor: message content 改成 any

											
										
										
											2025-06-07 23:05:01 +08:00
+													if mediaMessage.Input != nil {
 														tokenNum += getTokenNum(tokenEncoder, mediaMessage.Name)
 														inputJSON, _ := json.Marshal(mediaMessage.Input)
 														tokenNum += getTokenNum(tokenEncoder, string(inputJSON))
 													}
-												feat: claude relay

											
										
										
											2025-03-12 21:31:46 +08:00
+												case "tool_result":
-												refactor: message content 改成 any

refactor: message content 改成 any

											
										
										
											2025-06-07 23:05:01 +08:00
+													if mediaMessage.Content != nil {
 														contentJSON, _ := json.Marshal(mediaMessage.Content)
 														tokenNum += getTokenNum(tokenEncoder, string(contentJSON))
 													}
-												feat: claude relay

											
										
										
											2025-03-12 21:31:46 +08:00
+												}
 											}
 										}
 									}
 									// Add a constant for message formatting (this may need adjustment based on Claude's exact formatting)
 									tokenNum += len(messages) * 2 // Assuming 2 tokens per message for formatting
 									return tokenNum, nil
 								}
 								// CountTokenClaudeTools estimates the token count of Claude tool definitions
 								// using the encoder selected for model.
 								//
 								// For each tool it counts the name, the description and the JSON encoding of
 								// the input schema, then adds three tokens per tool as a formatting estimate.
 								// An error is returned when a tool's input schema cannot be marshalled.
 								func CountTokenClaudeTools(tools []dto.Tool, model string) (int, error) {
 									tokenEncoder := getTokenEncoder(model)
 									tokenNum := 0
 									for _, tool := range tools {
 										tokenNum += getTokenNum(tokenEncoder, tool.Name)
 										tokenNum += getTokenNum(tokenEncoder, tool.Description)
 										schemaJSON, err := json.Marshal(tool.InputSchema)
 										if err != nil {
 											return 0, fmt.Errorf("marshal_tool_schema_fail: %w", err)
 										}
 										tokenNum += getTokenNum(tokenEncoder, string(schemaJSON))
 									}
 									// Add a constant for tool formatting (this may need adjustment based on Claude's exact formatting).
 									tokenNum += len(tools) * 3 // Assuming 3 tokens per tool for formatting
 									return tokenNum, nil
 								}
-												feat: realtime

(cherry picked from commit d4966246e68dbdcdab45ec5c5141362834d74425)

											
										
										
											2024-10-06 14:13:41 +08:00
+								func CountTokenRealtime(info *relaycommon.RelayInfo, request dto.RealtimeEvent, model string) (int, int, error) {
 									audioToken := 0
 									textToken := 0
 									switch request.Type {
 									case dto.RealtimeEventTypeSessionUpdate:
 										if request.Session != nil {
 											msgTokens, err := CountTextToken(request.Session.Instructions, model)
-												feat: realtime

(cherry picked from commit a5529df3e1a4c08a120e8c05203a7d885b0fe8d8)

											
										
										
											2024-10-04 16:08:18 +08:00
+											if err != nil {
-												feat: realtime

(cherry picked from commit d4966246e68dbdcdab45ec5c5141362834d74425)

											
										
										
											2024-10-06 14:13:41 +08:00
+												return 0, 0, err
-												feat: realtime

(cherry picked from commit a5529df3e1a4c08a120e8c05203a7d885b0fe8d8)

											
										
										
											2024-10-04 16:08:18 +08:00
+											}
-												feat: realtime

(cherry picked from commit d4966246e68dbdcdab45ec5c5141362834d74425)

											
										
										
											2024-10-06 14:13:41 +08:00
+											textToken += msgTokens
 										}
 									case dto.RealtimeEventResponseAudioDelta:
 										// count audio token
 										atk, err := CountAudioTokenOutput(request.Delta, info.OutputAudioFormat)
 										if err != nil {
 											return 0, 0, fmt.Errorf("error counting audio token: %v", err)
 										}
 										audioToken += atk
 									case dto.RealtimeEventResponseAudioTranscriptionDelta, dto.RealtimeEventResponseFunctionCallArgumentsDelta:
 										// count text token
 										tkm, err := CountTextToken(request.Delta, model)
 										if err != nil {
 											return 0, 0, fmt.Errorf("error counting text token: %v", err)
 										}
 										textToken += tkm
 									case dto.RealtimeEventInputAudioBufferAppend:
 										// count audio token
 										atk, err := CountAudioTokenInput(request.Audio, info.InputAudioFormat)
 										if err != nil {
 											return 0, 0, fmt.Errorf("error counting audio token: %v", err)
 										}
 										audioToken += atk
-												feat: azure realtime

(cherry picked from commit 75ff3d98f06103dc2df1f8817bd3fcbf433e0f20)

											
										
										
											2024-10-07 17:18:11 +08:00
+									case dto.RealtimeEventConversationItemCreated:
 										if request.Item != nil {
 											switch request.Item.Type {
 											case "message":
 												for _, content := range request.Item.Content {
 													if content.Type == "input_text" {
 														tokens, err := CountTextToken(content.Text, model)
 														if err != nil {
 															return 0, 0, err
 														}
 														textToken += tokens
 													}
 												}
 											}
 										}
-												feat: realtime

(cherry picked from commit d4966246e68dbdcdab45ec5c5141362834d74425)

											
										
										
											2024-10-06 14:13:41 +08:00
+									case dto.RealtimeEventTypeResponseDone:
 										// count tools token
 										if !info.IsFirstRequest {
 											if info.RealtimeTools != nil && len(info.RealtimeTools) > 0 {
 												for _, tool := range info.RealtimeTools {
 													toolTokens, err := CountTokenInput(tool, model)
 													if err != nil {
 														return 0, 0, err
 													}
 													textToken += 8
 													textToken += toolTokens
-												feat: realtime

(cherry picked from commit a5529df3e1a4c08a120e8c05203a7d885b0fe8d8)

											
										
										
											2024-10-04 16:08:18 +08:00
+												}
 											}
 										}
 									}
-												feat: realtime

(cherry picked from commit d4966246e68dbdcdab45ec5c5141362834d74425)

											
										
										
											2024-10-06 14:13:41 +08:00
+									return textToken, audioToken, nil
-												feat: realtime

(cherry picked from commit a5529df3e1a4c08a120e8c05203a7d885b0fe8d8)

											
										
										
											2024-10-04 16:08:18 +08:00
+								}
-												feat: add multi-file type support for Gemini and Claude

- Add file data DTO for structured file handling
- Implement file decoder service
- Update Claude and Gemini relay channels to handle various file types
- Reorganize worker service to cf_worker for clarity
- Update token counter and image service for new file types

											
										
										
											2024-12-29 00:00:24 +08:00
+								func CountTokenMessages(info *relaycommon.RelayInfo, messages []dto.Message, model string, stream bool) (int, error) {
-												support gpt-4-1106-vision-preview

											
										
										
											2023-11-17 18:24:37 +08:00
+									//recover when panic
-												fix: make the token number calculation more accurate (#101)

* Make token calculation more accurate.

* fix: make the token number calculation more accurate

---------

Co-authored-by: JustSong <songquanpeng@foxmail.com>
											
										
										
											2023-05-19 09:41:26 +08:00
+									tokenEncoder := getTokenEncoder(model)
 									// Reference:
 									// https://github.com/openai/openai-cookbook/blob/main/examples/How_to_count_tokens_with_tiktoken.ipynb
 									// https://github.com/pkoukk/tiktoken-go/issues/6
 									//
 									// Every message follows <|start|>{role/name}\n{content}<|end|>\n
 									var tokensPerMessage int
 									var tokensPerName int
-												chore: update countTokenMessages (#238)


											
										
										
											2023-07-03 09:42:34 +08:00
+									if model == "gpt-3.5-turbo-0301" {
-												fix: make the token number calculation more accurate (#101)

* Make token calculation more accurate.

* fix: make the token number calculation more accurate

---------

Co-authored-by: JustSong <songquanpeng@foxmail.com>
											
										
										
											2023-05-19 09:41:26 +08:00
+										tokensPerMessage = 4
 										tokensPerName = -1 // If there's a name, the role is omitted
 									} else {
 										tokensPerMessage = 3
 										tokensPerName = 1
 									}
 									tokenNum := 0
 									for _, message := range messages {
 										tokenNum += tokensPerMessage
-												feat: able to approximate token (close #207)

											
										
										
											2023-07-04 19:54:13 +08:00
+										tokenNum += getTokenNum(tokenEncoder, message.Role)
-												refactor: message content 改成 any

refactor: message content 改成 any

											
										
										
											2025-06-07 23:05:01 +08:00
+										if message.Content != nil {
-												feat: Enhance token counting and content parsing for messages

											
										
										
											2025-02-24 14:18:15 +08:00
+											if message.Name != nil {
 												tokenNum += tokensPerName
 												tokenNum += getTokenNum(tokenEncoder, *message.Name)
 											}
 											arrayContent := message.ParseContent()
 											for _, m := range arrayContent {
 												if m.Type == dto.ContentTypeImageURL {
-												feat: support dify upload image file

											
										
										
											2025-03-15 19:10:12 +08:00
+													imageUrl := m.GetImageMedia()
 													imageTokenNum, err := getImageToken(info, imageUrl, model, stream)
-												feat: Enhance token counting and content parsing for messages

											
										
										
											2025-02-24 14:18:15 +08:00
+													if err != nil {
 														return 0, err
-												fix: fix tool calls

											
										
										
											2024-01-31 01:41:38 +08:00
+													}
-												feat: Enhance token counting and content parsing for messages

											
										
										
											2025-02-24 14:18:15 +08:00
+													tokenNum += imageTokenNum
 													log.Printf("image token num: %d", imageTokenNum)
 												} else if m.Type == dto.ContentTypeInputAudio {
 													// TODO: 音频token数量计算
 													tokenNum += 100
-												feat: enhance file handling and logging in the application

											
										
										
											2025-04-11 16:23:54 +08:00
+												} else if m.Type == dto.ContentTypeFile {
 													tokenNum += 5000
-												feat: add video URL support in MediaContent and update token counting logic

											
										
										
											2025-05-03 21:12:07 +08:00
+												} else if m.Type == dto.ContentTypeVideoUrl {
 													tokenNum += 5000
-												feat: Enhance token counting and content parsing for messages

											
										
										
											2025-02-24 14:18:15 +08:00
+												} else {
 													tokenNum += getTokenNum(tokenEncoder, m.Text)
-												support gpt-4-1106-vision-preview

											
										
										
											2023-11-17 18:24:37 +08:00
+												}
 											}
-												fix: make the token number calculation more accurate (#101)

* Make token calculation more accurate.

* fix: make the token number calculation more accurate

---------

Co-authored-by: JustSong <songquanpeng@foxmail.com>
											
										
										
											2023-05-19 09:41:26 +08:00
+										}
 									}
 									tokenNum += 3 // Every reply is primed with <|start|>assistant<|message|>
-												refactor: 重构敏感词

											
										
										
											2024-05-23 23:59:55 +08:00
+									return tokenNum, nil
-												fix: make the token number calculation more accurate (#101)

* Make token calculation more accurate.

* fix: make the token number calculation more accurate

---------

Co-authored-by: JustSong <songquanpeng@foxmail.com>
											
										
										
											2023-05-19 09:41:26 +08:00
+								}
-												refactor: 重构敏感词

											
										
										
											2024-05-23 23:59:55 +08:00
+								func CountTokenInput(input any, model string) (int, error) {
-												恢复渠道优先级可设置为负数

											
										
										
											2023-12-26 23:49:43 +08:00
+									switch v := input.(type) {
-												fix: now the input field can be array type now (close #149)

											
										
										
											2023-06-12 16:11:57 +08:00
+									case string:
-												feat: realtime

(cherry picked from commit d4966246e68dbdcdab45ec5c5141362834d74425)

											
										
										
											2024-10-06 14:13:41 +08:00
+										return CountTextToken(v, model)
-												fix: now the input field can be array type now (close #149)

											
										
										
											2023-06-12 16:11:57 +08:00
+									case []string:
 										text := ""
-												恢复渠道优先级可设置为负数

											
										
										
											2023-12-26 23:49:43 +08:00
+										for _, s := range v {
-												fix: now the input field can be array type now (close #149)

											
										
										
											2023-06-12 16:11:57 +08:00
+											text += s
 										}
-												feat: realtime

(cherry picked from commit d4966246e68dbdcdab45ec5c5141362834d74425)

											
										
										
											2024-10-06 14:13:41 +08:00
+										return CountTextToken(text, model)
-												feat: Improve embedding request handling and support across channels

- Update EmbeddingRequest DTO to support more flexible input types
- Add input parsing method to handle various input formats
- Implement ConvertEmbeddingRequest for multiple channel adaptors
- Remove relayMode parameter from EmbeddingHelper
- Add input validation for embedding requests
- Simplify embedding request conversion for different channels

											
										
										
											2025-02-12 14:39:36 +08:00
+									case []interface{}:
 										text := ""
 										for _, item := range v {
 											text += fmt.Sprintf("%v", item)
 										}
 										return CountTextToken(text, model)
-												fix: now the input field can be array type now (close #149)

											
										
										
											2023-06-12 16:11:57 +08:00
+									}
-												refactor: 重构敏感词

											
										
										
											2024-05-23 23:59:55 +08:00
+									return CountTokenInput(fmt.Sprintf("%v", input), model)
-												fix: now the input field can be array type now (close #149)

											
										
										
											2023-06-12 16:11:57 +08:00
+								}
-												feat: 启用函数计费

											
										
										
											2024-04-22 16:35:56 +08:00
+								func CountTokenStreamChoices(messages []dto.ChatCompletionsStreamResponseChoice, model string) int {
 									tokens := 0
 									for _, message := range messages {
-												refactor: 重构敏感词

											
										
										
											2024-05-23 23:59:55 +08:00
+										tkm, _ := CountTokenInput(message.Delta.GetContentString(), model)
-												feat: 启用函数计费

											
										
										
											2024-04-22 16:35:56 +08:00
+										tokens += tkm
 										if message.Delta.ToolCalls != nil {
 											for _, tool := range message.Delta.ToolCalls {
-												refactor: 重构敏感词

											
										
										
											2024-05-23 23:59:55 +08:00
+												tkm, _ := CountTokenInput(tool.Function.Name, model)
-												feat: 启用函数计费

											
										
										
											2024-04-22 16:35:56 +08:00
+												tokens += tkm
-												refactor: 重构敏感词

											
										
										
											2024-05-23 23:59:55 +08:00
+												tkm, _ = CountTokenInput(tool.Function.Arguments, model)
-												feat: 启用函数计费

											
										
										
											2024-04-22 16:35:56 +08:00
+												tokens += tkm
 											}
 										}
 									}
 									return tokens
 								}
-												feat: realtime

(cherry picked from commit d4966246e68dbdcdab45ec5c5141362834d74425)

											
										
										
											2024-10-06 14:13:41 +08:00
+								func CountTTSToken(text string, model string) (int, error) {
-												support tts

											
										
										
											2023-11-15 21:05:14 +08:00
+									if strings.HasPrefix(model, "tts") {
-												refactor: 重构敏感词

											
										
										
											2024-05-23 23:59:55 +08:00
+										return utf8.RuneCountInString(text), nil
-												support tts

											
										
										
											2023-11-15 21:05:14 +08:00
+									} else {
-												feat: realtime

(cherry picked from commit d4966246e68dbdcdab45ec5c5141362834d74425)

											
										
										
											2024-10-06 14:13:41 +08:00
+										return CountTextToken(text, model)
 									}
 								}
 								func CountAudioTokenInput(audioBase64 string, audioFormat string) (int, error) {
 									if audioBase64 == "" {
 										return 0, nil
 									}
 									duration, err := parseAudio(audioBase64, audioFormat)
 									if err != nil {
 										return 0, err
-												support tts

											
										
										
											2023-11-15 21:05:14 +08:00
+									}
-												feat: realtime

(cherry picked from commit d4966246e68dbdcdab45ec5c5141362834d74425)

											
										
										
											2024-10-06 14:13:41 +08:00
+									return int(duration / 60 * 100 / 0.06), nil
-												support tts

											
										
										
											2023-11-15 21:05:14 +08:00
+								}
-												feat: realtime

(cherry picked from commit d4966246e68dbdcdab45ec5c5141362834d74425)

											
										
										
											2024-10-06 14:13:41 +08:00
+								func CountAudioTokenOutput(audioBase64 string, audioFormat string) (int, error) {
 									if audioBase64 == "" {
 										return 0, nil
 									}
 									duration, err := parseAudio(audioBase64, audioFormat)
 									if err != nil {
 										return 0, err
 									}
 									return int(duration / 60 * 200 / 0.24), nil
 								}
 								//func CountAudioToken(sec float64, audioType string) {
 								//	if audioType == "input" {
 								//
 								//	}
 								//}
 								// CountTextToken 统计文本的token数量，仅当文本包含敏感词，返回错误，同时返回token数量
 								func CountTextToken(text string, model string) (int, error) {
-												feat: 初步兼容敏感词过滤

											
										
										
											2024-03-20 17:07:42 +08:00
+									var err error
-												fix: make the token number calculation more accurate (#101)

* Make token calculation more accurate.

* fix: make the token number calculation more accurate

---------

Co-authored-by: JustSong <songquanpeng@foxmail.com>
											
										
										
											2023-05-19 09:41:26 +08:00
+									tokenEncoder := getTokenEncoder(model)
-												refactor: 重构敏感词

											
										
										
											2024-05-23 23:59:55 +08:00
+									return getTokenNum(tokenEncoder, text), err
-												fix: make the token number calculation more accurate (#101)

* Make token calculation more accurate.

* fix: make the token number calculation more accurate

---------

Co-authored-by: JustSong <songquanpeng@foxmail.com>
											
										
										
											2023-05-19 09:41:26 +08:00
+								}