new-api/relay/relay-text.go

package relay

import (
	"bytes"
	"encoding/json"
	"errors"
	"fmt"
	"io"
	"math"
	"net/http"
	"one-api/common"
	"one-api/constant"
	"one-api/dto"
	"one-api/model"
	relaycommon "one-api/relay/common"
	relayconstant "one-api/relay/constant"
	"one-api/relay/helper"
	"one-api/service"
	"one-api/setting"
	"strings"
	"time"

	"github.com/bytedance/gopkg/util/gopool"
	"github.com/shopspring/decimal"

	"github.com/gin-gonic/gin"
)

// getAndValidateTextRequest decodes the request body into a
// dto.GeneralOpenAIRequest and checks the fields required by the current
// relay mode.
//
// When the request carries no model, moderation requests default to
// "text-moderation-latest" and embedding requests take the model from the
// "model" route parameter. On success relayInfo.IsStream is set from the
// request's Stream flag.
//
// It returns an error when the body cannot be decoded, when max_tokens exceeds
// math.MaxInt32/2, when no model can be determined, or when a field required
// by the relay mode is missing.
func getAndValidateTextRequest(c *gin.Context, relayInfo *relaycommon.RelayInfo) (*dto.GeneralOpenAIRequest, error) {
	textRequest := &dto.GeneralOpenAIRequest{}
	if err := common.UnmarshalBodyReusable(c, textRequest); err != nil {
		return nil, err
	}

	// Fill in a default model for the modes that allow omitting it.
	if textRequest.Model == "" {
		switch relayInfo.RelayMode {
		case relayconstant.RelayModeModerations:
			textRequest.Model = "text-moderation-latest"
		case relayconstant.RelayModeEmbeddings:
			textRequest.Model = c.Param("model")
		}
	}

	if textRequest.MaxTokens > math.MaxInt32/2 {
		return nil, errors.New("max_tokens is invalid")
	}
	if textRequest.Model == "" {
		return nil, errors.New("model is required")
	}

	switch relayInfo.RelayMode {
	case relayconstant.RelayModeCompletions:
		// An omitted prompt decodes to a nil interface value, which does not
		// compare equal to "", so nil has to be rejected explicitly (the
		// moderations branch below does the same for Input).
		if textRequest.Prompt == nil || textRequest.Prompt == "" {
			return nil, errors.New("field prompt is required")
		}
	case relayconstant.RelayModeChatCompletions:
		if len(textRequest.Messages) == 0 {
			return nil, errors.New("field messages is required")
		}
	case relayconstant.RelayModeEmbeddings:
		// No field is validated for embeddings here.
	case relayconstant.RelayModeModerations:
		if textRequest.Input == nil || textRequest.Input == "" {
			return nil, errors.New("field input is required")
		}
	case relayconstant.RelayModeEdits:
		if textRequest.Instruction == "" {
			return nil, errors.New("field instruction is required")
		}
	}

	relayInfo.IsStream = textRequest.Stream
	return textRequest, nil
}

// TextHelper relays one text request to the upstream channel and settles the
// quota for it.
//
// The steps are: decode and validate the request, optionally run the
// sensitive-word check, apply model mapping, determine the prompt token count
// (reusing a value stored in the gin context under "prompt_tokens" when
// present), compute pricing, pre-consume quota, convert and send the request
// through the adaptor for relayInfo.ApiType, hand the upstream response to the
// adaptor, and finally post-consume quota based on the reported usage.
//
// The result is named so that the deferred function can see it: whenever the
// function returns a non-nil error after quota has been pre-consumed, the
// pre-consumed quota is handed back via returnPreConsumedQuota.
//
// It returns nil on success, or an error describing the failing step.
func TextHelper(c *gin.Context) (openaiErr *dto.OpenAIErrorWithStatusCode) {

	relayInfo := relaycommon.GenRelayInfo(c)

	// Decode and validate the incoming text request.
	textRequest, err := getAndValidateTextRequest(c, relayInfo)
	if err != nil {
		common.LogError(c, fmt.Sprintf("getAndValidateTextRequest failed: %s", err.Error()))
		return service.OpenAIErrorWrapperLocal(err, "invalid_text_request", http.StatusBadRequest)
	}

	if setting.ShouldCheckPromptSensitive() {
		words, err := checkRequestSensitive(textRequest, relayInfo)
		if err != nil {
			common.LogWarn(c, fmt.Sprintf("user sensitive words detected: %s", strings.Join(words, ", ")))
			return service.OpenAIErrorWrapperLocal(err, "sensitive_words_detected", http.StatusBadRequest)
		}
	}

	err = helper.ModelMappedHelper(c, relayInfo)
	if err != nil {
		return service.OpenAIErrorWrapperLocal(err, "model_mapped_error", http.StatusInternalServerError)
	}

	textRequest.Model = relayInfo.UpstreamModelName

	// Reuse the prompt token count stored in the context if there is one;
	// otherwise count it now and store it for later use.
	var promptTokens int
	if value, exists := c.Get("prompt_tokens"); exists {
		promptTokens = value.(int)
		relayInfo.PromptTokens = promptTokens
	} else {
		promptTokens, err = getPromptTokens(textRequest, relayInfo)
		// Counting the prompt tokens failed.
		if err != nil {
			return service.OpenAIErrorWrapper(err, "count_token_messages_failed", http.StatusInternalServerError)
		}
		c.Set("prompt_tokens", promptTokens)
	}

	priceData, err := helper.ModelPriceHelper(c, relayInfo, promptTokens, int(textRequest.MaxTokens))
	if err != nil {
		return service.OpenAIErrorWrapperLocal(err, "model_price_error", http.StatusInternalServerError)
	}

	// Pre-consume quota before contacting the upstream.
	preConsumedQuota, userQuota, openaiErr := preConsumeQuota(c, priceData.ShouldPreConsumedQuota, relayInfo)
	if openaiErr != nil {
		return openaiErr
	}
	// From here on, any error return hands the pre-consumed quota back.
	defer func() {
		if openaiErr != nil {
			returnPreConsumedQuota(c, relayInfo, userQuota, preConsumedQuota)
		}
	}()

	// Remember whether the caller asked for usage in the stream before the
	// request's StreamOptions are rewritten below.
	if textRequest.StreamOptions != nil && textRequest.StreamOptions.IncludeUsage {
		relayInfo.ShouldIncludeUsage = true
	}

	switch {
	case !relayInfo.SupportStreamOptions || !textRequest.Stream:
		// Stream options are not supported, or the request is not streaming:
		// do not forward them.
		textRequest.StreamOptions = nil
	case constant.ForceStreamOption:
		// Stream options are supported and forced by configuration: always
		// request usage from the upstream, replacing whatever the caller sent.
		textRequest.StreamOptions = &dto.StreamOptions{
			IncludeUsage: true,
		}
	}

	adaptor := GetAdaptor(relayInfo.ApiType)
	if adaptor == nil {
		return service.OpenAIErrorWrapperLocal(fmt.Errorf("invalid api type: %d", relayInfo.ApiType), "invalid_api_type", http.StatusBadRequest)
	}
	adaptor.Init(relayInfo)

	// Raw body pass-through is currently disabled; the previous code is kept
	// here for reference.
	//if relayInfo.ChannelType == common.ChannelTypeOpenAI && !isModelMapped {
	//	body, err := common.GetRequestBody(c)
	//	if err != nil {
	//		return service.OpenAIErrorWrapperLocal(err, "get_request_body_failed", http.StatusInternalServerError)
	//	}
	//	requestBody = bytes.NewBuffer(body)
	//} else {
	//
	//}

	convertedRequest, err := adaptor.ConvertRequest(c, relayInfo, textRequest)
	if err != nil {
		return service.OpenAIErrorWrapperLocal(err, "convert_request_failed", http.StatusInternalServerError)
	}
	jsonData, err := json.Marshal(convertedRequest)
	if err != nil {
		return service.OpenAIErrorWrapperLocal(err, "json_marshal_failed", http.StatusInternalServerError)
	}
	var requestBody io.Reader = bytes.NewBuffer(jsonData)

	statusCodeMappingStr := c.GetString("status_code_mapping")
	var httpResp *http.Response
	resp, err := adaptor.DoRequest(c, relayInfo, requestBody)
	if err != nil {
		return service.OpenAIErrorWrapper(err, "do_request_failed", http.StatusInternalServerError)
	}

	// DoRequest may return no response at all; httpResp then stays nil and is
	// passed to DoResponse as such.
	if resp != nil {
		httpResp = resp.(*http.Response)
		// Treat the exchange as streaming if the upstream answers with SSE,
		// even when the request did not ask for it.
		relayInfo.IsStream = relayInfo.IsStream || strings.HasPrefix(httpResp.Header.Get("Content-Type"), "text/event-stream")
		if httpResp.StatusCode != http.StatusOK {
			openaiErr = service.RelayErrorHandler(httpResp)
			// Apply the configured status code mapping.
			service.ResetStatusCode(openaiErr, statusCodeMappingStr)
			return openaiErr
		}
	}

	usage, openaiErr := adaptor.DoResponse(c, httpResp, relayInfo)
	if openaiErr != nil {
		// Apply the configured status code mapping.
		service.ResetStatusCode(openaiErr, statusCodeMappingStr)
		return openaiErr
	}

	// usage is an interface value. A single-value type assertion would panic
	// when it is nil or holds another type, skipping quota settlement after the
	// response has already been handled. The two-value form yields a nil
	// *dto.Usage instead, which postConsumeQuota replaces with a prompt-only
	// usage record.
	textUsage, _ := usage.(*dto.Usage)

	if strings.HasPrefix(relayInfo.OriginModelName, "gpt-4o-audio") {
		service.PostAudioConsumeQuota(c, relayInfo, textUsage, preConsumedQuota, userQuota, priceData, "")
	} else {
		postConsumeQuota(c, relayInfo, textUsage, preConsumedQuota, userQuota, priceData, "")
	}
	return nil
}

// getPromptTokens counts the prompt tokens of textRequest according to the
// relay mode in info and records the result in info.PromptTokens.
//
// Chat completions are counted from the whole request, completions from the
// Prompt field, and moderations and embeddings from the Input field. Any other
// relay mode yields a count of 0 and an "unknown relay mode" error.
// info.PromptTokens is written in every case, including when an error is
// returned.
func getPromptTokens(textRequest *dto.GeneralOpenAIRequest, info *relaycommon.RelayInfo) (int, error) {
	var (
		count    int
		countErr error
	)

	switch info.RelayMode {
	case relayconstant.RelayModeChatCompletions:
		count, countErr = service.CountTokenChatRequest(info, *textRequest)
	case relayconstant.RelayModeCompletions:
		count, countErr = service.CountTokenInput(textRequest.Prompt, textRequest.Model)
	case relayconstant.RelayModeModerations, relayconstant.RelayModeEmbeddings:
		// Both modes carry their text in the Input field.
		count, countErr = service.CountTokenInput(textRequest.Input, textRequest.Model)
	default:
		count, countErr = 0, errors.New("unknown relay mode")
	}

	info.PromptTokens = count
	return count, countErr
}

// checkRequestSensitive runs the sensitive-word check on the part of
// textRequest that matters for the relay mode in info: the messages for chat
// completions, the prompt for completions, and the input for moderations and
// embeddings. It returns whatever the underlying check returns; for any other
// relay mode nothing is checked and it returns nil, nil.
func checkRequestSensitive(textRequest *dto.GeneralOpenAIRequest, info *relaycommon.RelayInfo) ([]string, error) {
	switch info.RelayMode {
	case relayconstant.RelayModeChatCompletions:
		return service.CheckSensitiveMessages(textRequest.Messages)
	case relayconstant.RelayModeCompletions:
		return service.CheckSensitiveInput(textRequest.Prompt)
	case relayconstant.RelayModeModerations, relayconstant.RelayModeEmbeddings:
		return service.CheckSensitiveInput(textRequest.Input)
	}
	return nil, nil
}

// preConsumeQuota reserves quota for a request up front and reports the user's
// quota as read at the start of the call.
//
// The request is rejected when the user's quota is not positive or is smaller
// than preConsumedQuota. When the user's quota exceeds 100 times the requested
// amount, and the token is either unlimited or its "token_quota" context value
// also exceeds 100 times the amount, the caller is trusted and nothing is
// reserved.
//
// It returns the amount actually reserved (0 when trusted), the user's quota,
// and a non-nil error if the request must be rejected; on error both integers
// are 0.
func preConsumeQuota(c *gin.Context, preConsumedQuota int, relayInfo *relaycommon.RelayInfo) (int, int, *dto.OpenAIErrorWithStatusCode) {
	userQuota, err := model.GetUserQuota(relayInfo.UserId, false)
	switch {
	case err != nil:
		return 0, 0, service.OpenAIErrorWrapperLocal(err, "get_user_quota_failed", http.StatusInternalServerError)
	case userQuota <= 0:
		return 0, 0, service.OpenAIErrorWrapperLocal(errors.New("user quota is not enough"), "insufficient_user_quota", http.StatusForbidden)
	case userQuota-preConsumedQuota < 0:
		return 0, 0, service.OpenAIErrorWrapperLocal(fmt.Errorf("chat pre-consumed quota failed, user quota: %s, need quota: %s", common.FormatQuota(userQuota), common.FormatQuota(preConsumedQuota)), "insufficient_user_quota", http.StatusForbidden)
	}
	relayInfo.UserQuota = userQuota

	// A balance above this threshold counts as "plenty" for this request.
	trustThreshold := 100 * preConsumedQuota
	if userQuota > trustThreshold {
		if relayInfo.TokenUnlimited {
			// Unlimited token and a well-funded user: skip the reservation.
			preConsumedQuota = 0
			common.LogInfo(c, fmt.Sprintf("user %d with unlimited token has enough quota %s, trusted and no need to pre-consume", relayInfo.UserId, common.FormatQuota(userQuota)))
		} else if tokenQuota := c.GetInt("token_quota"); tokenQuota > trustThreshold {
			// Limited token, but it is well funded too: skip the reservation.
			preConsumedQuota = 0
			common.LogInfo(c, fmt.Sprintf("user %d quota %s and token %d quota %d are enough, trusted and no need to pre-consume", relayInfo.UserId, common.FormatQuota(userQuota), relayInfo.TokenId, tokenQuota))
		}
	}

	if preConsumedQuota <= 0 {
		return preConsumedQuota, userQuota, nil
	}

	// Reserve on the token first, then on the user.
	if err := service.PreConsumeTokenQuota(relayInfo, preConsumedQuota); err != nil {
		return 0, 0, service.OpenAIErrorWrapperLocal(err, "pre_consume_token_quota_failed", http.StatusForbidden)
	}
	// NOTE(review): if this second step fails, nothing visible here hands the
	// token quota reserved above back — confirm whether that is handled
	// elsewhere.
	if err := model.DecreaseUserQuota(relayInfo.UserId, preConsumedQuota); err != nil {
		return 0, 0, service.OpenAIErrorWrapperLocal(err, "decrease_user_quota_failed", http.StatusInternalServerError)
	}
	return preConsumedQuota, userQuota, nil
}

// returnPreConsumedQuota hands a previously reserved quota back by posting a
// negative consumption of preConsumedQuota. The work is submitted to gopool
// and operates on a copy of relayInfo taken inside that task; a failure is
// only logged. Nothing happens when preConsumedQuota is 0. The c and userQuota
// parameters are not used.
func returnPreConsumedQuota(c *gin.Context, relayInfo *relaycommon.RelayInfo, userQuota int, preConsumedQuota int) {
	if preConsumedQuota == 0 {
		return
	}

	refund := func() {
		snapshot := *relayInfo

		if err := service.PostConsumeQuota(&snapshot, -preConsumedQuota, 0, false); err != nil {
			common.SysError("error return pre-consumed quota: " + err.Error())
		}
	}
	gopool.Go(refund)
}

// postConsumeQuota settles the quota for a finished text request and records
// a consume log entry.
//
// When usage is nil, a usage record containing only relayInfo.PromptTokens is
// substituted and a note is appended to the log content. The final quota is
// computed with decimal arithmetic:
//
//   - ratio pricing (priceData.UsePrice is false):
//     ((prompt - cached) + cached*cacheRatio + completion*completionRatio)
//     * modelRatio * groupRatio
//   - fixed pricing (priceData.UsePrice is true):
//     modelPrice * common.QuotaPerUnit * groupRatio
//
// The result is rounded to the nearest integer. If the request reports zero
// total tokens, nothing is charged and an error is logged; otherwise the
// difference between the final quota and preConsumedQuota is posted and the
// user and channel usage counters are updated. A consume log is written in
// every case.
//
// extraContent, when non-empty, is appended to the log content. userQuota is
// only forwarded to the consume log.
func postConsumeQuota(ctx *gin.Context, relayInfo *relaycommon.RelayInfo,
	usage *dto.Usage, preConsumedQuota int, userQuota int, priceData helper.PriceData, extraContent string) {
	if usage == nil {
		// No usage was reported: fall back to charging the prompt only.
		usage = &dto.Usage{
			PromptTokens:     relayInfo.PromptTokens,
			CompletionTokens: 0,
			TotalTokens:      relayInfo.PromptTokens,
		}
		extraContent += "（可能是请求出错）"
	}
	useTimeSeconds := time.Now().Unix() - relayInfo.StartTime.Unix()
	promptTokens := usage.PromptTokens
	cacheTokens := usage.PromptTokensDetails.CachedTokens
	completionTokens := usage.CompletionTokens
	modelName := relayInfo.OriginModelName

	tokenName := ctx.GetString("token_name")
	completionRatio := priceData.CompletionRatio
	cacheRatio := priceData.CacheRatio
	modelRatio := priceData.ModelRatio
	groupRatio := priceData.GroupRatio
	modelPrice := priceData.ModelPrice

	// Convert values to decimal for precise calculation.
	dPromptTokens := decimal.NewFromInt(int64(promptTokens))
	dCacheTokens := decimal.NewFromInt(int64(cacheTokens))
	dCompletionTokens := decimal.NewFromInt(int64(completionTokens))
	dCompletionRatio := decimal.NewFromFloat(completionRatio)
	dCacheRatio := decimal.NewFromFloat(cacheRatio)
	dModelRatio := decimal.NewFromFloat(modelRatio)
	dGroupRatio := decimal.NewFromFloat(groupRatio)
	dModelPrice := decimal.NewFromFloat(modelPrice)
	dQuotaPerUnit := decimal.NewFromFloat(common.QuotaPerUnit)

	ratio := dModelRatio.Mul(dGroupRatio)

	var quotaCalculateDecimal decimal.Decimal
	if !priceData.UsePrice {
		// Cached prompt tokens are billed at cacheRatio, the rest at full rate.
		nonCachedTokens := dPromptTokens.Sub(dCacheTokens)
		cachedTokensWithRatio := dCacheTokens.Mul(dCacheRatio)
		promptQuota := nonCachedTokens.Add(cachedTokensWithRatio)
		completionQuota := dCompletionTokens.Mul(dCompletionRatio)

		quotaCalculateDecimal = promptQuota.Add(completionQuota).Mul(ratio)

		// Charge at least 1 when the ratio is non-zero.
		// NOTE(review): this guard runs before rounding, so a value in (0, 0.5)
		// still rounds to 0 below — confirm whether that is intended.
		if !ratio.IsZero() && quotaCalculateDecimal.LessThanOrEqual(decimal.Zero) {
			quotaCalculateDecimal = decimal.NewFromInt(1)
		}
	} else {
		quotaCalculateDecimal = dModelPrice.Mul(dQuotaPerUnit).Mul(dGroupRatio)
	}

	quota := int(quotaCalculateDecimal.Round(0).IntPart())
	totalTokens := promptTokens + completionTokens

	var logContent string
	if !priceData.UsePrice {
		logContent = fmt.Sprintf("模型倍率 %.2f，补全倍率 %.2f，分组倍率 %.2f", modelRatio, completionRatio, groupRatio)
	} else {
		logContent = fmt.Sprintf("模型价格 %.2f，分组倍率 %.2f", modelPrice, groupRatio)
	}

	// Record the consume log even if the quota is 0.
	if totalTokens == 0 {
		// Zero tokens means something went wrong. Do not return here: the
		// consume log below still has to be written.
		quota = 0
		logContent += "（可能是上游超时）"
		common.LogError(ctx, fmt.Sprintf("total tokens is 0, cannot consume quota, userId %d, channelId %d, "+
			"tokenId %d, model %s， pre-consumed quota %d", relayInfo.UserId, relayInfo.ChannelId, relayInfo.TokenId, modelName, preConsumedQuota))
	} else {
		// Only the difference to what was already reserved is posted.
		quotaDelta := quota - preConsumedQuota
		if quotaDelta != 0 {
			err := service.PostConsumeQuota(relayInfo, quotaDelta, preConsumedQuota, true)
			if err != nil {
				common.LogError(ctx, "error consuming token remain quota: "+err.Error())
			}
		}
		model.UpdateUserUsedQuotaAndRequestCount(relayInfo.UserId, quota)
		model.UpdateChannelUsedQuota(relayInfo.ChannelId, quota)
	}

	// Gizmo models are logged under a wildcard name, with the concrete model
	// kept in the log content.
	logModel := modelName
	if strings.HasPrefix(logModel, "gpt-4-gizmo") {
		logModel = "gpt-4-gizmo-*"
		logContent += fmt.Sprintf("，模型 %s", modelName)
	}
	if strings.HasPrefix(logModel, "gpt-4o-gizmo") {
		logModel = "gpt-4o-gizmo-*"
		logContent += fmt.Sprintf("，模型 %s", modelName)
	}
	if extraContent != "" {
		logContent += ", " + extraContent
	}
	other := service.GenerateTextOtherInfo(ctx, relayInfo, modelRatio, groupRatio, completionRatio, cacheTokens, cacheRatio, modelPrice)
	model.RecordConsumeLog(ctx, relayInfo.UserId, relayInfo.ChannelId, promptTokens, completionTokens, logModel,
		tokenName, quota, logContent, relayInfo.TokenId, userQuota, int(useTimeSeconds), relayInfo.IsStream, relayInfo.Group, other)
}
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+								package relay
 								import (
 									"bytes"
 									"encoding/json"
 									"errors"
 									"fmt"
 									"io"
 									"math"
 									"net/http"
 									"one-api/common"
-												feat: 初步兼容敏感词过滤

											
										
										
											2024-03-20 17:07:42 +08:00
+									"one-api/constant"
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+									"one-api/dto"
 									"one-api/model"
 									relaycommon "one-api/relay/common"
 									relayconstant "one-api/relay/constant"
-												refactor: Simplify model mapping and pricing logic across relay modules

											
										
										
											2025-02-20 16:41:46 +08:00
+									"one-api/relay/helper"
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+									"one-api/service"
-												feat: Introduce settings package and refactor constants

- Added a new `setting` package to replace the `constant` package for configuration management, improving code organization and clarity.
- Moved various configuration variables such as `ServerAddress`, `PayAddress`, and `SensitiveWords` to the new `setting` package.
- Updated references throughout the codebase to use the new `setting` package, ensuring consistent access to configuration values.
- Introduced new files for managing chat settings and midjourney settings, enhancing modularity and maintainability of the code.

											
										
										
											2024-12-22 17:24:29 +08:00
+									"one-api/setting"
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+									"strings"
 									"time"
-												feat: Improve decimal precision for quota and payment calculations

- Added github.com/shopspring/decimal for precise floating-point calculations
- Refactored quota and payment calculations in multiple files to use decimal arithmetic
- Updated go.mod and go.sum to include decimal library
- Improved precision in topup, relay, and quota service calculations
- Added support for more OpenAI model variants in cache ratio settings

											
										
										
											2025-03-08 21:55:50 +08:00
+									"github.com/bytedance/gopkg/util/gopool"
 									"github.com/shopspring/decimal"
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+									"github.com/gin-gonic/gin"
 								)
 								func getAndValidateTextRequest(c *gin.Context, relayInfo *relaycommon.RelayInfo) (*dto.GeneralOpenAIRequest, error) {
 									textRequest := &dto.GeneralOpenAIRequest{}
 									err := common.UnmarshalBodyReusable(c, textRequest)
 									if err != nil {
 										return nil, err
 									}
 									if relayInfo.RelayMode == relayconstant.RelayModeModerations && textRequest.Model == "" {
 										textRequest.Model = "text-moderation-latest"
 									}
 									if relayInfo.RelayMode == relayconstant.RelayModeEmbeddings && textRequest.Model == "" {
 										textRequest.Model = c.Param("model")
 									}
-												refactor: improve validation logic and error handling in relay-text.go

- Simplified validation checks for MaxTokens and Messages fields.
- Enhanced error messages for better clarity.
- Updated goroutine to avoid passing context unnecessarily.

											
										
										
											2024-12-01 08:24:41 +08:00
+									if textRequest.MaxTokens > math.MaxInt32/2 {
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+										return nil, errors.New("max_tokens is invalid")
 									}
 									if textRequest.Model == "" {
 										return nil, errors.New("model is required")
 									}
 									switch relayInfo.RelayMode {
 									case relayconstant.RelayModeCompletions:
 										if textRequest.Prompt == "" {
 											return nil, errors.New("field prompt is required")
 										}
 									case relayconstant.RelayModeChatCompletions:
-												refactor: improve validation logic and error handling in relay-text.go

- Simplified validation checks for MaxTokens and Messages fields.
- Enhanced error messages for better clarity.
- Updated goroutine to avoid passing context unnecessarily.

											
										
										
											2024-12-01 08:24:41 +08:00
+										if len(textRequest.Messages) == 0 {
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+											return nil, errors.New("field messages is required")
 										}
 									case relayconstant.RelayModeEmbeddings:
 									case relayconstant.RelayModeModerations:
-												refactor: improve validation logic and error handling in relay-text.go

- Simplified validation checks for MaxTokens and Messages fields.
- Enhanced error messages for better clarity.
- Updated goroutine to avoid passing context unnecessarily.

											
										
										
											2024-12-01 08:24:41 +08:00
+										if textRequest.Input == nil || textRequest.Input == "" {
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+											return nil, errors.New("field input is required")
 										}
 									case relayconstant.RelayModeEdits:
 										if textRequest.Instruction == "" {
 											return nil, errors.New("field instruction is required")
 										}
 									}
 									relayInfo.IsStream = textRequest.Stream
 									return textRequest, nil
 								}
-												fix: 部分情况缺少返回预扣

(cherry picked from commit 96373455521a38095706bd81c57f9a18557d9c2e)

											
										
										
											2024-10-07 20:35:33 +08:00
+								func TextHelper(c *gin.Context) (openaiErr *dto.OpenAIErrorWithStatusCode) {
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
 									relayInfo := relaycommon.GenRelayInfo(c)
 									// get & validate textRequest 获取并验证文本请求
 									textRequest, err := getAndValidateTextRequest(c, relayInfo)
 									if err != nil {
 										common.LogError(c, fmt.Sprintf("getAndValidateTextRequest failed: %s", err.Error()))
-												feat: 本地重试

											
										
										
											2024-04-04 16:35:44 +08:00
+										return service.OpenAIErrorWrapperLocal(err, "invalid_text_request", http.StatusBadRequest)
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+									}
-												feat: Introduce settings package and refactor constants

- Added a new `setting` package to replace the `constant` package for configuration management, improving code organization and clarity.
- Moved various configuration variables such as `ServerAddress`, `PayAddress`, and `SensitiveWords` to the new `setting` package.
- Updated references throughout the codebase to use the new `setting` package, ensuring consistent access to configuration values.
- Introduced new files for managing chat settings and midjourney settings, enhancing modularity and maintainability of the code.

											
										
										
											2024-12-22 17:24:29 +08:00
+									if setting.ShouldCheckPromptSensitive() {
-												feat: Enhance sensitive word detection with detailed logging

											
										
										
											2025-02-21 16:57:30 +08:00
+										words, err := checkRequestSensitive(textRequest, relayInfo)
-												refactor: 重构敏感词

											
										
										
											2024-05-23 23:59:55 +08:00
+										if err != nil {
-												feat: Enhance sensitive word detection with detailed logging

											
										
										
											2025-02-21 16:57:30 +08:00
+											common.LogWarn(c, fmt.Sprintf("user sensitive words detected: %s", strings.Join(words, ", ")))
-												feat: 本地重试

											
										
										
											2024-04-04 16:35:44 +08:00
+											return service.OpenAIErrorWrapperLocal(err, "sensitive_words_detected", http.StatusBadRequest)
-												feat: 统一错误提示

											
										
										
											2024-03-20 20:36:55 +08:00
+										}
-												refactor: 重构敏感词

											
										
										
											2024-05-23 23:59:55 +08:00
+									}
-												refactor: Simplify model mapping and pricing logic across relay modules

											
										
										
											2025-02-20 16:41:46 +08:00
+									err = helper.ModelMappedHelper(c, relayInfo)
 									if err != nil {
 										return service.OpenAIErrorWrapperLocal(err, "model_mapped_error", http.StatusInternalServerError)
 									}
 									textRequest.Model = relayInfo.UpstreamModelName
-												Update relay-text.go

在上下文中存入promptTokens,避免重试过程重复计算
											
										
										
											2024-12-26 02:00:04 +08:00
+									// 获取 promptTokens，如果上下文中已经存在，则直接使用
 									var promptTokens int
 									if value, exists := c.Get("prompt_tokens"); exists {
 										promptTokens = value.(int)
-												fix: retry prompt tokens

											
										
										
											2025-01-02 16:33:00 +08:00
+										relayInfo.PromptTokens = promptTokens
-												Update relay-text.go

在上下文中存入promptTokens,避免重试过程重复计算
											
										
										
											2024-12-26 02:00:04 +08:00
+									} else {
 										promptTokens, err = getPromptTokens(textRequest, relayInfo)
 										// count messages token error 计算promptTokens错误
 										if err != nil {
 											return service.OpenAIErrorWrapper(err, "count_token_messages_failed", http.StatusInternalServerError)
 										}
 										c.Set("prompt_tokens", promptTokens)
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+									}
-												feat: add new GPT-4.5 preview model ratios

											
										
										
											2025-02-28 19:17:15 +08:00
+									priceData, err := helper.ModelPriceHelper(c, relayInfo, promptTokens, int(textRequest.MaxTokens))
 									if err != nil {
 										return service.OpenAIErrorWrapperLocal(err, "model_price_error", http.StatusInternalServerError)
 									}
-												feat: Implement cache token ratio for more precise token pricing

											
										
										
											2025-03-08 01:30:50 +08:00
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+									// pre-consume quota 预消耗配额
-												refactor: Simplify model mapping and pricing logic across relay modules

											
										
										
											2025-02-20 16:41:46 +08:00
+									preConsumedQuota, userQuota, openaiErr := preConsumeQuota(c, priceData.ShouldPreConsumedQuota, relayInfo)
-												fix: 修复预扣费判定无效导致用户可无限欠费问题

											
										
										
											2024-03-03 22:05:00 +08:00
+									if openaiErr != nil {
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+										return openaiErr
 									}
-												fix: 部分情况缺少返回预扣

(cherry picked from commit 96373455521a38095706bd81c57f9a18557d9c2e)

											
										
										
											2024-10-07 20:35:33 +08:00
+									defer func() {
 										if openaiErr != nil {
 											returnPreConsumedQuota(c, relayInfo, userQuota, preConsumedQuota)
 										}
 									}()
-												feat: update stream_options

											
										
										
											2024-07-19 14:06:10 +08:00
+									includeUsage := false
 									// 判断用户是否需要返回使用情况
 									if textRequest.StreamOptions != nil && textRequest.StreamOptions.IncludeUsage {
 										includeUsage = true
 									}
-												feat: 完善stream_options

											
										
										
											2024-07-08 02:00:39 +08:00
+									// 如果不支持StreamOptions，将StreamOptions设置为nil
 									if !relayInfo.SupportStreamOptions || !textRequest.Stream {
 										textRequest.StreamOptions = nil
 									} else {
 										// 如果支持StreamOptions，且请求中没有设置StreamOptions，根据配置文件设置StreamOptions
 										if constant.ForceStreamOption {
 											textRequest.StreamOptions = &dto.StreamOptions{
 												IncludeUsage: true,
 											}
 										}
 									}
-												feat: update stream_options

											
										
										
											2024-07-19 14:06:10 +08:00
+									if includeUsage {
 										relayInfo.ShouldIncludeUsage = true
-												feat: 完善stream_options

											
										
										
											2024-07-08 02:00:39 +08:00
+									}
-												feat: 初步重构完成

											
										
										
											2024-02-29 16:21:25 +08:00
+									adaptor := GetAdaptor(relayInfo.ApiType)
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+									if adaptor == nil {
-												refactor: 重构敏感词

											
										
										
											2024-05-23 23:59:55 +08:00
+										return service.OpenAIErrorWrapperLocal(fmt.Errorf("invalid api type: %d", relayInfo.ApiType), "invalid_api_type", http.StatusBadRequest)
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+									}
-												refactor: audio relay

											
										
										
											2024-07-16 22:07:10 +08:00
+									adaptor.Init(relayInfo)
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+									var requestBody io.Reader
-												feat: support stream_options

											
										
										
											2024-07-08 01:27:57 +08:00
-												feat: 暂时禁用透传功能

											
										
										
											2024-11-19 15:04:19 +08:00
+									//if relayInfo.ChannelType == common.ChannelTypeOpenAI && !isModelMapped {
 									//	body, err := common.GetRequestBody(c)
 									//	if err != nil {
 									//		return service.OpenAIErrorWrapperLocal(err, "get_request_body_failed", http.StatusInternalServerError)
 									//	}
 									//	requestBody = bytes.NewBuffer(body)
 									//} else {
 									//
 									//}
 									convertedRequest, err := adaptor.ConvertRequest(c, relayInfo, textRequest)
 									if err != nil {
 										return service.OpenAIErrorWrapperLocal(err, "convert_request_failed", http.StatusInternalServerError)
 									}
-												chore: Update dependencies and refactor JSON handling #614

- Removed the `bytedance/sonic` dependency and replaced its usage with the standard `encoding/json` package for JSON marshalling in `relay-text.go`.
- Updated `go.mod` to reflect the removal of `sonic` and adjusted the version of `sonic/loader`.
- Cleaned up `go.sum` to ensure consistency with the updated dependencies.

											
										
										
											2024-12-12 14:14:24 +08:00
+									jsonData, err := json.Marshal(convertedRequest)
-												feat: 暂时禁用透传功能

											
										
										
											2024-11-19 15:04:19 +08:00
+									if err != nil {
 										return service.OpenAIErrorWrapperLocal(err, "json_marshal_failed", http.StatusInternalServerError)
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+									}
-												feat: 暂时禁用透传功能

											
										
										
											2024-11-19 15:04:19 +08:00
+									requestBody = bytes.NewBuffer(jsonData)
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
-												feat: 状态码复写

											
										
										
											2024-04-20 21:05:23 +08:00
+									statusCodeMappingStr := c.GetString("status_code_mapping")
-												feat: realtime

(cherry picked from commit a5529df3e1a4c08a120e8c05203a7d885b0fe8d8)

											
										
										
											2024-10-04 16:08:18 +08:00
+									var httpResp *http.Response
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+									resp, err := adaptor.DoRequest(c, relayInfo, requestBody)
-												fix: 修复流模式错误扣费的问题 (close #95)

											
										
										
											2024-03-06 17:41:55 +08:00
+									if err != nil {
 										return service.OpenAIErrorWrapper(err, "do_request_failed", http.StatusInternalServerError)
 									}
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
-												feat: support aws claude

											
										
										
											2024-04-23 11:44:40 +08:00
+									if resp != nil {
-												feat: realtime

(cherry picked from commit a5529df3e1a4c08a120e8c05203a7d885b0fe8d8)

											
										
										
											2024-10-04 16:08:18 +08:00
+										httpResp = resp.(*http.Response)
 										relayInfo.IsStream = relayInfo.IsStream || strings.HasPrefix(httpResp.Header.Get("Content-Type"), "text/event-stream")
 										if httpResp.StatusCode != http.StatusOK {
-												fix: 部分情况缺少返回预扣

(cherry picked from commit 96373455521a38095706bd81c57f9a18557d9c2e)

											
										
										
											2024-10-07 20:35:33 +08:00
+											openaiErr = service.RelayErrorHandler(httpResp)
-												feat: support aws claude

											
										
										
											2024-04-23 11:44:40 +08:00
+											// reset status code 重置状态码
 											service.ResetStatusCode(openaiErr, statusCodeMappingStr)
 											return openaiErr
 										}
-												fix: 修复流模式错误扣费的问题 (close #95)

											
										
										
											2024-03-06 17:41:55 +08:00
+									}
-												feat: realtime

(cherry picked from commit a5529df3e1a4c08a120e8c05203a7d885b0fe8d8)

											
										
										
											2024-10-04 16:08:18 +08:00
+									usage, openaiErr := adaptor.DoResponse(c, httpResp, relayInfo)
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+									if openaiErr != nil {
-												feat: 状态码复写

											
										
										
											2024-04-20 21:05:23 +08:00
+										// reset status code 重置状态码
 										service.ResetStatusCode(openaiErr, statusCodeMappingStr)
-												fix: remove sensitive check on completion (close #157)

											
										
										
											2024-03-29 22:20:14 +08:00
+										return openaiErr
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+									}
-												feat: 完善audio计费

											
										
										
											2024-11-07 16:12:09 +08:00
-												refactor: Simplify model mapping and pricing logic across relay modules

											
										
										
											2025-02-20 16:41:46 +08:00
+									if strings.HasPrefix(relayInfo.OriginModelName, "gpt-4o-audio") {
 										service.PostAudioConsumeQuota(c, relayInfo, usage.(*dto.Usage), preConsumedQuota, userQuota, priceData, "")
-												feat: 完善audio计费

											
										
										
											2024-11-07 16:12:09 +08:00
+									} else {
-												refactor: Simplify model mapping and pricing logic across relay modules

											
										
										
											2025-02-20 16:41:46 +08:00
+										postConsumeQuota(c, relayInfo, usage.(*dto.Usage), preConsumedQuota, userQuota, priceData, "")
-												feat: 完善audio计费

											
										
										
											2024-11-07 16:12:09 +08:00
+									}
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+									return nil
 								}
-												refactor: 重构敏感词

											
										
										
											2024-05-23 23:59:55 +08:00
+								func getPromptTokens(textRequest *dto.GeneralOpenAIRequest, info *relaycommon.RelayInfo) (int, error) {
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+									var promptTokens int
 									var err error
 									switch info.RelayMode {
 									case relayconstant.RelayModeChatCompletions:
-												feat: add multi-file type support for Gemini and Claude

- Add file data DTO for structured file handling
- Implement file decoder service
- Update Claude and Gemini relay channels to handle various file types
- Reorganize worker service to cf_worker for clarity
- Update token counter and image service for new file types

											
										
										
											2024-12-29 00:00:24 +08:00
+										promptTokens, err = service.CountTokenChatRequest(info, *textRequest)
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+									case relayconstant.RelayModeCompletions:
-												refactor: 重构敏感词

											
										
										
											2024-05-23 23:59:55 +08:00
+										promptTokens, err = service.CountTokenInput(textRequest.Prompt, textRequest.Model)
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+									case relayconstant.RelayModeModerations:
-												refactor: 重构敏感词

											
										
										
											2024-05-23 23:59:55 +08:00
+										promptTokens, err = service.CountTokenInput(textRequest.Input, textRequest.Model)
-												fix: Fix the issue of 'unknown relay mode' when making an embedding request (close #93)

											
										
										
											2024-03-05 23:04:57 +08:00
+									case relayconstant.RelayModeEmbeddings:
-												refactor: 重构敏感词

											
										
										
											2024-05-23 23:59:55 +08:00
+										promptTokens, err = service.CountTokenInput(textRequest.Input, textRequest.Model)
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+									default:
 										err = errors.New("unknown relay mode")
 										promptTokens = 0
 									}
 									info.PromptTokens = promptTokens
-												refactor: 重构敏感词

											
										
										
											2024-05-23 23:59:55 +08:00
+									return promptTokens, err
 								}
-												feat: Enhance sensitive word detection with detailed logging

											
										
										
											2025-02-21 16:57:30 +08:00
+								func checkRequestSensitive(textRequest *dto.GeneralOpenAIRequest, info *relaycommon.RelayInfo) ([]string, error) {
-												refactor: 重构敏感词

											
										
										
											2024-05-23 23:59:55 +08:00
+									var err error
-												feat: Enhance sensitive word detection with detailed logging

											
										
										
											2025-02-21 16:57:30 +08:00
+									var words []string
-												refactor: 重构敏感词

											
										
										
											2024-05-23 23:59:55 +08:00
+									switch info.RelayMode {
 									case relayconstant.RelayModeChatCompletions:
-												feat: Enhance sensitive word detection with detailed logging

											
										
										
											2025-02-21 16:57:30 +08:00
+										words, err = service.CheckSensitiveMessages(textRequest.Messages)
-												refactor: 重构敏感词

											
										
										
											2024-05-23 23:59:55 +08:00
+									case relayconstant.RelayModeCompletions:
-												feat: Enhance sensitive word detection with detailed logging

											
										
										
											2025-02-21 16:57:30 +08:00
+										words, err = service.CheckSensitiveInput(textRequest.Prompt)
-												refactor: 重构敏感词

											
										
										
											2024-05-23 23:59:55 +08:00
+									case relayconstant.RelayModeModerations:
-												feat: Enhance sensitive word detection with detailed logging

											
										
										
											2025-02-21 16:57:30 +08:00
+										words, err = service.CheckSensitiveInput(textRequest.Input)
-												refactor: 重构敏感词

											
										
										
											2024-05-23 23:59:55 +08:00
+									case relayconstant.RelayModeEmbeddings:
-												feat: Enhance sensitive word detection with detailed logging

											
										
										
											2025-02-21 16:57:30 +08:00
+										words, err = service.CheckSensitiveInput(textRequest.Input)
-												refactor: 重构敏感词

											
										
										
											2024-05-23 23:59:55 +08:00
+									}
-												feat: Enhance sensitive word detection with detailed logging

											
										
										
											2025-02-21 16:57:30 +08:00
+									return words, err
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+								}
 								// 预扣费并返回用户剩余配额
-												fix: fix preConsumeQuota error

											
										
										
											2024-02-29 16:39:52 +08:00
+								func preConsumeQuota(c *gin.Context, preConsumedQuota int, relayInfo *relaycommon.RelayInfo) (int, int, *dto.OpenAIErrorWithStatusCode) {
-												refactor: user cache logic

											
										
										
											2024-12-29 16:50:26 +08:00
+									userQuota, err := model.GetUserQuota(relayInfo.UserId, false)
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+									if err != nil {
-												feat: 本地重试

											
										
										
											2024-04-04 16:35:44 +08:00
+										return 0, 0, service.OpenAIErrorWrapperLocal(err, "get_user_quota_failed", http.StatusInternalServerError)
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+									}
-												feat: 区分额度不足和预扣费失败提示

											
										
										
											2024-08-09 18:34:51 +08:00
+									if userQuota <= 0 {
-												feat: 本地重试

											
										
										
											2024-04-04 16:35:44 +08:00
+										return 0, 0, service.OpenAIErrorWrapperLocal(errors.New("user quota is not enough"), "insufficient_user_quota", http.StatusForbidden)
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+									}
-												feat: 区分额度不足和预扣费失败提示

											
										
										
											2024-08-09 18:34:51 +08:00
+									if userQuota-preConsumedQuota < 0 {
-												refactor: Improve message content handling and quota error responses

											
										
										
											2025-02-21 18:18:21 +08:00
+										return 0, 0, service.OpenAIErrorWrapperLocal(fmt.Errorf("chat pre-consumed quota failed, user quota: %s, need quota: %s", common.FormatQuota(userQuota), common.FormatQuota(preConsumedQuota)), "insufficient_user_quota", http.StatusForbidden)
-												feat: 区分额度不足和预扣费失败提示

											
										
										
											2024-08-09 18:34:51 +08:00
+									}
-												refactor: Enhance user context and quota management

- Add new context keys for user-related information
- Modify user cache and authentication middleware to populate context
- Refactor quota and notification services to use context-based user data
- Remove redundant database queries by leveraging context information
- Update various components to use new context-based user retrieval methods

											
										
										
											2025-02-25 20:56:16 +08:00
+									relayInfo.UserQuota = userQuota
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+									if userQuota > 100*preConsumedQuota {
 										// 用户额度充足，判断令牌额度是否充足
 										if !relayInfo.TokenUnlimited {
 											// 非无限令牌，判断令牌额度是否充足
 											tokenQuota := c.GetInt("token_quota")
 											if tokenQuota > 100*preConsumedQuota {
 												// 令牌额度充足，信任令牌
 												preConsumedQuota = 0
-												feat: Add user notification settings with quota warning and multiple notification methods

- Implement user notification settings with email and webhook options
- Add new user settings for quota warning threshold and notification preferences
- Create backend API and database support for user notification configuration
- Enhance frontend personal settings with notification configuration UI
- Support custom notification email and webhook URL
- Add service layer for sending user notifications

											
										
										
											2025-02-18 14:54:21 +08:00
+												common.LogInfo(c, fmt.Sprintf("user %d quota %s and token %d quota %d are enough, trusted and no need to pre-consume", relayInfo.UserId, common.FormatQuota(userQuota), relayInfo.TokenId, tokenQuota))
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+											}
 										} else {
 											// in this case, we do not pre-consume quota
 											// because the user has enough quota
 											preConsumedQuota = 0
-												feat: Add user notification settings with quota warning and multiple notification methods

- Implement user notification settings with email and webhook options
- Add new user settings for quota warning threshold and notification preferences
- Create backend API and database support for user notification configuration
- Enhance frontend personal settings with notification configuration UI
- Support custom notification email and webhook URL
- Add service layer for sending user notifications

											
										
										
											2025-02-18 14:54:21 +08:00
+											common.LogInfo(c, fmt.Sprintf("user %d with unlimited token has enough quota %s, trusted and no need to pre-consume", relayInfo.UserId, common.FormatQuota(userQuota)))
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+										}
 									}
-												refactor: user cache logic

											
										
										
											2024-12-29 16:50:26 +08:00
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+									if preConsumedQuota > 0 {
-												refactor: Enhance user context and quota management

- Add new context keys for user-related information
- Modify user cache and authentication middleware to populate context
- Refactor quota and notification services to use context-based user data
- Remove redundant database queries by leveraging context information
- Update various components to use new context-based user retrieval methods

											
										
										
											2025-02-25 20:56:16 +08:00
+										err := service.PreConsumeTokenQuota(relayInfo, preConsumedQuota)
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+										if err != nil {
-												feat: 本地重试

											
										
										
											2024-04-04 16:35:44 +08:00
+											return 0, 0, service.OpenAIErrorWrapperLocal(err, "pre_consume_token_quota_failed", http.StatusForbidden)
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+										}
-												refactor: token cache logic

											
										
										
											2024-12-30 17:10:48 +08:00
+										err = model.DecreaseUserQuota(relayInfo.UserId, preConsumedQuota)
 										if err != nil {
 											return 0, 0, service.OpenAIErrorWrapperLocal(err, "decrease_user_quota_failed", http.StatusInternalServerError)
 										}
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+									}
-												fix: fix preConsumeQuota error

											
										
										
											2024-02-29 16:39:52 +08:00
+									return preConsumedQuota, userQuota, nil
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+								}
-												feat: playground

											
										
										
											2024-09-26 00:59:09 +08:00
+								func returnPreConsumedQuota(c *gin.Context, relayInfo *relaycommon.RelayInfo, userQuota int, preConsumedQuota int) {
-												fix: 修复流模式错误扣费的问题 (close #95)

											
										
										
											2024-03-06 17:41:55 +08:00
+									if preConsumedQuota != 0 {
-												refactor: Replace manual goroutine creation with gopool.Go

											
										
										
											2025-02-19 18:38:29 +08:00
+										gopool.Go(func() {
-												refactor: improve validation logic and error handling in relay-text.go

- Simplified validation checks for MaxTokens and Messages fields.
- Enhanced error messages for better clarity.
- Updated goroutine to avoid passing context unnecessarily.

											
										
										
											2024-12-01 08:24:41 +08:00
+											relayInfoCopy := *relayInfo
-												feat: Add user notification settings with quota warning and multiple notification methods

- Implement user notification settings with email and webhook options
- Add new user settings for quota warning threshold and notification preferences
- Create backend API and database support for user notification configuration
- Enhance frontend personal settings with notification configuration UI
- Support custom notification email and webhook URL
- Add service layer for sending user notifications

											
										
										
											2025-02-18 14:54:21 +08:00
+											err := service.PostConsumeQuota(&relayInfoCopy, -preConsumedQuota, 0, false)
-												fix: 修复流模式错误扣费的问题 (close #95)

											
										
										
											2024-03-06 17:41:55 +08:00
+											if err != nil {
 												common.SysError("error return pre-consumed quota: " + err.Error())
 											}
-												refactor: Replace manual goroutine creation with gopool.Go

											
										
										
											2025-02-19 18:38:29 +08:00
+										})
-												fix: 修复流模式错误扣费的问题 (close #95)

											
										
										
											2024-03-06 17:41:55 +08:00
+									}
 								}
-												refactor: Simplify model mapping and pricing logic across relay modules

											
										
										
											2025-02-20 16:41:46 +08:00
+								func postConsumeQuota(ctx *gin.Context, relayInfo *relaycommon.RelayInfo,
 									usage *dto.Usage, preConsumedQuota int, userQuota int, priceData helper.PriceData, extraContent string) {
-												feat: 日志新增rpm和tpm数据。(close #384)

											
										
										
											2024-08-01 16:13:08 +08:00
+									if usage == nil {
 										usage = &dto.Usage{
 											PromptTokens:     relayInfo.PromptTokens,
 											CompletionTokens: 0,
 											TotalTokens:      relayInfo.PromptTokens,
 										}
-												feat: Implement cache token ratio for more precise token pricing

											
										
										
											2025-03-08 01:30:50 +08:00
+										extraContent += "（可能是请求出错）"
-												feat: 日志新增rpm和tpm数据。(close #384)

											
										
										
											2024-08-01 16:13:08 +08:00
+									}
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+									useTimeSeconds := time.Now().Unix() - relayInfo.StartTime.Unix()
 									promptTokens := usage.PromptTokens
-												feat: Implement cache token ratio for more precise token pricing

											
										
										
											2025-03-08 01:30:50 +08:00
+									cacheTokens := usage.PromptTokensDetails.CachedTokens
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+									completionTokens := usage.CompletionTokens
-												refactor: Simplify model mapping and pricing logic across relay modules

											
										
										
											2025-02-20 16:41:46 +08:00
+									modelName := relayInfo.OriginModelName
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
 									tokenName := ctx.GetString("token_name")
-												feat: Implement cache token ratio for more precise token pricing

											
										
										
											2025-03-08 01:30:50 +08:00
+									completionRatio := priceData.CompletionRatio
 									cacheRatio := priceData.CacheRatio
-												refactor: Simplify model mapping and pricing logic across relay modules

											
										
										
											2025-02-20 16:41:46 +08:00
+									modelRatio := priceData.ModelRatio
 									groupRatio := priceData.GroupRatio
 									modelPrice := priceData.ModelPrice
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
-												feat: Improve decimal precision for quota and payment calculations

- Added github.com/shopspring/decimal for precise floating-point calculations
- Refactored quota and payment calculations in multiple files to use decimal arithmetic
- Updated go.mod and go.sum to include decimal library
- Improved precision in topup, relay, and quota service calculations
- Added support for more OpenAI model variants in cache ratio settings

											
										
										
											2025-03-08 21:55:50 +08:00
+									// Convert values to decimal for precise calculation
 									dPromptTokens := decimal.NewFromInt(int64(promptTokens))
 									dCacheTokens := decimal.NewFromInt(int64(cacheTokens))
 									dCompletionTokens := decimal.NewFromInt(int64(completionTokens))
 									dCompletionRatio := decimal.NewFromFloat(completionRatio)
 									dCacheRatio := decimal.NewFromFloat(cacheRatio)
 									dModelRatio := decimal.NewFromFloat(modelRatio)
 									dGroupRatio := decimal.NewFromFloat(groupRatio)
 									dModelPrice := decimal.NewFromFloat(modelPrice)
 									dQuotaPerUnit := decimal.NewFromFloat(common.QuotaPerUnit)
 									ratio := dModelRatio.Mul(dGroupRatio)
 									var quotaCalculateDecimal decimal.Decimal
-												refactor: Simplify model mapping and pricing logic across relay modules

											
										
										
											2025-02-20 16:41:46 +08:00
+									if !priceData.UsePrice {
-												feat: Improve decimal precision for quota and payment calculations

- Added github.com/shopspring/decimal for precise floating-point calculations
- Refactored quota and payment calculations in multiple files to use decimal arithmetic
- Updated go.mod and go.sum to include decimal library
- Improved precision in topup, relay, and quota service calculations
- Added support for more OpenAI model variants in cache ratio settings

											
										
										
											2025-03-08 21:55:50 +08:00
+										nonCachedTokens := dPromptTokens.Sub(dCacheTokens)
 										cachedTokensWithRatio := dCacheTokens.Mul(dCacheRatio)
 										promptQuota := nonCachedTokens.Add(cachedTokensWithRatio)
 										completionQuota := dCompletionTokens.Mul(dCompletionRatio)
 										quotaCalculateDecimal = promptQuota.Add(completionQuota).Mul(ratio)
 										if !ratio.IsZero() && quotaCalculateDecimal.LessThanOrEqual(decimal.Zero) {
 											quotaCalculateDecimal = decimal.NewFromInt(1)
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+										}
 									} else {
-												feat: Improve decimal precision for quota and payment calculations

- Added github.com/shopspring/decimal for precise floating-point calculations
- Refactored quota and payment calculations in multiple files to use decimal arithmetic
- Updated go.mod and go.sum to include decimal library
- Improved precision in topup, relay, and quota service calculations
- Added support for more OpenAI model variants in cache ratio settings

											
										
										
											2025-03-08 21:55:50 +08:00
+										quotaCalculateDecimal = dModelPrice.Mul(dQuotaPerUnit).Mul(dGroupRatio)
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+									}
-												feat: Improve decimal precision for quota and payment calculations

- Added github.com/shopspring/decimal for precise floating-point calculations
- Refactored quota and payment calculations in multiple files to use decimal arithmetic
- Updated go.mod and go.sum to include decimal library
- Improved precision in topup, relay, and quota service calculations
- Added support for more OpenAI model variants in cache ratio settings

											
										
										
											2025-03-08 21:55:50 +08:00
 									quota := int(quotaCalculateDecimal.Round(0).IntPart())
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+									totalTokens := promptTokens + completionTokens
-												refactor: Improve quota calculation precision using floating-point arithmetic

											
										
										
											2025-03-08 16:44:08 +08:00
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+									var logContent string
-												feat: Implement cache token ratio for more precise token pricing

											
										
										
											2025-03-08 01:30:50 +08:00
+									if !priceData.UsePrice {
-												feat: support SiliconFlow (close #437, close #403)

											
										
										
											2024-08-16 18:27:26 +08:00
+										logContent = fmt.Sprintf("模型倍率 %.2f，补全倍率 %.2f，分组倍率 %.2f", modelRatio, completionRatio, groupRatio)
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+									} else {
 										logContent = fmt.Sprintf("模型价格 %.2f，分组倍率 %.2f", modelPrice, groupRatio)
 									}
 									// record all the consume log even if quota is 0
 									if totalTokens == 0 {
 										// in this case, must be some error happened
 										// we cannot just return, because we may have to return the pre-consumed quota
 										quota = 0
 										logContent += fmt.Sprintf("（可能是上游超时）")
-												feat: support cohere rerank

											
										
										
											2024-07-06 17:09:22 +08:00
+										common.LogError(ctx, fmt.Sprintf("total tokens is 0, cannot consume quota, userId %d, channelId %d, "+
 											"tokenId %d, model %s， pre-consumed quota %d", relayInfo.UserId, relayInfo.ChannelId, relayInfo.TokenId, modelName, preConsumedQuota))
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+									} else {
 										quotaDelta := quota - preConsumedQuota
-												chore: 优化按次计费的数据库查询次数

											
										
										
											2024-04-04 20:10:30 +08:00
+										if quotaDelta != 0 {
-												feat: Add user notification settings with quota warning and multiple notification methods

- Implement user notification settings with email and webhook options
- Add new user settings for quota warning threshold and notification preferences
- Create backend API and database support for user notification configuration
- Enhance frontend personal settings with notification configuration UI
- Support custom notification email and webhook URL
- Add service layer for sending user notifications

											
										
										
											2025-02-18 14:54:21 +08:00
+											err := service.PostConsumeQuota(relayInfo, quotaDelta, preConsumedQuota, true)
-												chore: 优化按次计费的数据库查询次数

											
										
										
											2024-04-04 20:10:30 +08:00
+											if err != nil {
 												common.LogError(ctx, "error consuming token remain quota: "+err.Error())
 											}
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+										}
 										model.UpdateUserUsedQuotaAndRequestCount(relayInfo.UserId, quota)
 										model.UpdateChannelUsedQuota(relayInfo.ChannelId, quota)
 									}
-												feat: support cohere rerank

											
										
										
											2024-07-06 17:09:22 +08:00
+									logModel := modelName
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+									if strings.HasPrefix(logModel, "gpt-4-gizmo") {
 										logModel = "gpt-4-gizmo-*"
-												feat: support cohere rerank

											
										
										
											2024-07-06 17:09:22 +08:00
+										logContent += fmt.Sprintf("，模型 %s", modelName)
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+									}
-												feat: support gpt-4o-gizmo-* (close #436)

											
										
										
											2024-08-16 17:25:03 +08:00
+									if strings.HasPrefix(logModel, "gpt-4o-gizmo") {
 										logModel = "gpt-4o-gizmo-*"
 										logContent += fmt.Sprintf("，模型 %s", modelName)
 									}
-												refactor: image relay

											
										
										
											2024-07-17 23:50:37 +08:00
+									if extraContent != "" {
-												chore: log format

											
										
										
											2024-07-18 00:41:31 +08:00
+										logContent += ", " + extraContent
-												refactor: image relay

											
										
										
											2024-07-17 23:50:37 +08:00
+									}
-												feat: Implement cache token ratio for more precise token pricing

											
										
										
											2025-03-08 01:30:50 +08:00
+									other := service.GenerateTextOtherInfo(ctx, relayInfo, modelRatio, groupRatio, completionRatio, cacheTokens, cacheRatio, modelPrice)
-												feat: support cohere rerank

											
										
										
											2024-07-06 17:09:22 +08:00
+									model.RecordConsumeLog(ctx, relayInfo.UserId, relayInfo.ChannelId, promptTokens, completionTokens, logModel,
-												feat: Enhance logging functionality with group support

- Added a new 'group' parameter to various logging functions, including RecordConsumeLog, GetAllLogs, and GetUserLogs, to allow for more granular log tracking.
- Updated the logs table component to display group information, improving the visibility of log data.
- Refactored related functions to accommodate the new group parameter, ensuring consistent handling across the application.
- Improved the initialization of the group column for PostgreSQL compatibility.

											
										
										
											2024-12-24 14:48:11 +08:00
+										tokenName, quota, logContent, relayInfo.TokenId, userQuota, int(useTimeSeconds), relayInfo.IsStream, relayInfo.Group, other)
-												feat: 初步重构

											
										
										
											2024-02-29 01:08:18 +08:00
+								}