ai-gateway/controller/relay-utils.go

package controller

import (
	"context"
	"encoding/json"
	"fmt"
	"io"
	"net/http"
	"one-api/common"
	"one-api/model"
	"strconv"
	"strings"

	"github.com/gin-gonic/gin"
	"github.com/pkoukk/tiktoken-go"
)

// stopFinishReason holds the finish reason value "stop".
// NOTE(review): it is not referenced in this part of the file; presumably it
// is shared by response handling code elsewhere in the package — confirm.
var stopFinishReason = "stop"

// tokenEncoderMap maps a model name to its tiktoken encoder.
// InitTokenEncoders registers one key per entry of common.ModelRatio; a nil
// value marks a model whose encoder is resolved on first use by
// getTokenEncoder. Only registered keys are ever written afterwards, so
// tokenEncoderMap won't grow after initialization.
var tokenEncoderMap = map[string]*tiktoken.Tiktoken{}
// defaultTokenEncoder is the gpt-3.5-turbo encoder assigned by
// InitTokenEncoders. getTokenEncoder falls back to it for unregistered models
// and for models whose own encoder cannot be loaded.
var defaultTokenEncoder *tiktoken.Tiktoken

// InitTokenEncoders loads the gpt-3.5-turbo and gpt-4 encoders and registers
// every model named in common.ModelRatio in tokenEncoderMap.
//
// Models whose name starts with "gpt-3.5" or "gpt-4" share the corresponding
// preloaded encoder. Every other model is registered with a nil placeholder so
// that getTokenEncoder can resolve its encoder on first use. The gpt-3.5-turbo
// encoder also becomes defaultTokenEncoder. A failure to load either encoder is
// reported through common.FatalLog.
func InitTokenEncoders() {
	common.SysLog("initializing token encoders")

	gpt35Enc, err := tiktoken.EncodingForModel("gpt-3.5-turbo")
	if err != nil {
		common.FatalLog(fmt.Sprintf("failed to get gpt-3.5-turbo token encoder: %s", err.Error()))
	}
	defaultTokenEncoder = gpt35Enc

	gpt4Enc, err := tiktoken.EncodingForModel("gpt-4")
	if err != nil {
		common.FatalLog(fmt.Sprintf("failed to get gpt-4 token encoder: %s", err.Error()))
	}

	for name := range common.ModelRatio {
		// A nil entry means "registered, encoder not loaded yet".
		var enc *tiktoken.Tiktoken
		switch {
		case strings.HasPrefix(name, "gpt-3.5"):
			enc = gpt35Enc
		case strings.HasPrefix(name, "gpt-4"):
			enc = gpt4Enc
		}
		tokenEncoderMap[name] = enc
	}

	common.SysLog("token encoders initialized")
}

// getTokenEncoder returns the encoder to use for model.
//
// Models that are not registered in tokenEncoderMap get defaultTokenEncoder.
// A registered model with a nil placeholder has its encoder looked up via
// tiktoken.EncodingForModel; if that lookup fails the error is logged and
// defaultTokenEncoder is used instead. Either way the result is stored back in
// tokenEncoderMap so the lookup happens at most once per model.
//
// NOTE(review): the write to tokenEncoderMap below is not guarded by any lock
// in this function — confirm that callers cannot run it concurrently.
func getTokenEncoder(model string) *tiktoken.Tiktoken {
	cached, registered := tokenEncoderMap[model]
	if !registered {
		return defaultTokenEncoder
	}
	if cached != nil {
		return cached
	}

	resolved, err := tiktoken.EncodingForModel(model)
	if err != nil {
		common.SysError(fmt.Sprintf("failed to get token encoder for model %s: %s, using encoder for gpt-3.5-turbo", model, err.Error()))
		resolved = defaultTokenEncoder
	}
	tokenEncoderMap[model] = resolved
	return resolved
}

// getTokenNum returns the number of tokens in text.
//
// When common.ApproximateTokenEnabled is set, the encoder is not used and the
// count is estimated as 0.38 tokens per byte of text (len on a string is its
// byte length), truncated to an int. Otherwise text is encoded with
// tokenEncoder and the number of resulting tokens is returned.
func getTokenNum(tokenEncoder *tiktoken.Tiktoken, text string) int {
	if !common.ApproximateTokenEnabled {
		tokens := tokenEncoder.Encode(text, nil, nil)
		return len(tokens)
	}
	byteLen := float64(len(text))
	return int(byteLen * 0.38)
}

// countTokenMessages returns the token count of a chat message list for model.
//
// Reference:
// https://github.com/openai/openai-cookbook/blob/main/examples/How_to_count_tokens_with_tiktoken.ipynb
// https://github.com/pkoukk/tiktoken-go/issues/6
//
// Every message follows <|start|>{role/name}\n{content}<|end|>\n, so each
// message costs a fixed overhead plus the tokens of its content, role and
// optional name. Three more tokens are added once because every reply is
// primed with <|start|>assistant<|message|>.
func countTokenMessages(messages []Message, model string) int {
	encoder := getTokenEncoder(model)

	// Per-message and per-name overhead; gpt-3.5-turbo-0301 differs from the
	// rest: if there's a name, the role is omitted, hence the -1.
	perMessage, perName := 3, 1
	if model == "gpt-3.5-turbo-0301" {
		perMessage, perName = 4, -1
	}

	total := 0
	for _, msg := range messages {
		total += perMessage
		total += getTokenNum(encoder, msg.StringContent())
		total += getTokenNum(encoder, msg.Role)
		if msg.Name == nil {
			continue
		}
		total += perName
		total += getTokenNum(encoder, *msg.Name)
	}
	return total + 3
}

// countTokenInput counts the tokens of a request input value for model.
//
// Supported shapes:
//   - string: counted as is.
//   - []string: the elements are concatenated without a separator and counted
//     as one text.
//   - []any: treated like []string using only its string elements.
//     encoding/json decodes a JSON array into []any when the destination is an
//     interface value, so a decoded array of strings arrives in this form
//     rather than as []string. Non-string elements are ignored.
//
// Any other type, including nil, yields 0.
func countTokenInput(input any, model string) int {
	switch v := input.(type) {
	case string:
		return countTokenText(v, model)
	case []string:
		return countTokenText(strings.Join(v, ""), model)
	case []any:
		var sb strings.Builder
		for _, item := range v {
			if s, ok := item.(string); ok {
				sb.WriteString(s)
			}
		}
		return countTokenText(sb.String(), model)
	}
	return 0
}

func countTokenText(text string, model string) int {
	tokenEncoder := getTokenEncoder(model)
	return getTokenNum(tokenEncoder, text)
}

// errorWrapper packages a local error as an OpenAIErrorWithStatusCode.
//
// The message is taken from err.Error(), the type is always "one_api_error",
// and code and statusCode are passed through unchanged. err must be non-nil
// because its Error method is called.
func errorWrapper(err error, code string, statusCode int) *OpenAIErrorWithStatusCode {
	return &OpenAIErrorWithStatusCode{
		StatusCode: statusCode,
		OpenAIError: OpenAIError{
			Type:    "one_api_error",
			Code:    code,
			Message: err.Error(),
		},
	}
}

// shouldDisableChannel reports whether an upstream error warrants disabling
// the channel that produced it.
//
// It always returns false when common.AutomaticDisableChannelEnabled is off or
// err is nil. Otherwise it returns true for an HTTP 401 status, for error type
// "insufficient_quota", and for error codes "invalid_api_key" and
// "account_deactivated"; everything else returns false.
func shouldDisableChannel(err *OpenAIError, statusCode int) bool {
	if !common.AutomaticDisableChannelEnabled || err == nil {
		return false
	}
	switch {
	case statusCode == http.StatusUnauthorized:
		return true
	case err.Type == "insufficient_quota":
		return true
	case err.Code == "invalid_api_key", err.Code == "account_deactivated":
		return true
	default:
		return false
	}
}

// setEventStreamHeaders sets the response headers used for a streamed
// text/event-stream reply on c: the event-stream content type, no caching,
// keep-alive, chunked transfer encoding, and "X-Accel-Buffering: no".
func setEventStreamHeaders(c *gin.Context) {
	streamHeaders := [...][2]string{
		{"Content-Type", "text/event-stream"},
		{"Cache-Control", "no-cache"},
		{"Connection", "keep-alive"},
		{"Transfer-Encoding", "chunked"},
		{"X-Accel-Buffering", "no"},
	}
	header := c.Writer.Header()
	for _, kv := range streamHeaders {
		header.Set(kv[0], kv[1])
	}
}

// relayErrorHandler converts an unsuccessful upstream response into an
// OpenAIErrorWithStatusCode carrying resp.StatusCode.
//
// The result starts out as a generic "upstream_error" describing the status
// code. If the body can be read and decoded as a TextResponse whose error has
// a message or a type, that upstream error replaces the generic one. A body
// that cannot be read or decoded, or that carries no error details, leaves the
// generic error in place so the caller never receives an empty error.
//
// resp and resp.Body must be non-nil. The body is always closed before the
// function returns.
func relayErrorHandler(resp *http.Response) (openAIErrorWithStatusCode *OpenAIErrorWithStatusCode) {
	openAIErrorWithStatusCode = &OpenAIErrorWithStatusCode{
		StatusCode: resp.StatusCode,
		OpenAIError: OpenAIError{
			Message: fmt.Sprintf("bad response status code %d", resp.StatusCode),
			Type:    "upstream_error",
			Code:    "bad_response_status_code",
			Param:   strconv.Itoa(resp.StatusCode),
		},
	}

	// Close on every path, including a failed read. A Close error is ignored
	// on purpose: by then the body has either been read in full or is being
	// abandoned, and it must not hide an error that was already parsed.
	defer func() { _ = resp.Body.Close() }()

	responseBody, err := io.ReadAll(resp.Body)
	if err != nil {
		return openAIErrorWithStatusCode
	}

	var textResponse TextResponse
	if err := json.Unmarshal(responseBody, &textResponse); err != nil {
		return openAIErrorWithStatusCode
	}

	// Valid JSON without error details decodes to a zero-value error; keep the
	// descriptive default instead of overwriting it with empty fields.
	if textResponse.Error.Message != "" || textResponse.Error.Type != "" {
		openAIErrorWithStatusCode.OpenAIError = textResponse.Error
	}
	return openAIErrorWithStatusCode
}

// getFullRequestURL joins baseURL and requestURL into the URL to call.
//
// When baseURL starts with "https://gateway.ai.cloudflare.com", a leading
// prefix is stripped from requestURL before joining: "/v1" for
// common.ChannelTypeOpenAI and "/openai/deployments" for
// common.ChannelTypeAzure. For every other base URL or channel type the two
// strings are concatenated unchanged.
func getFullRequestURL(baseURL string, requestURL string, channelType int) string {
	const cloudflareGateway = "https://gateway.ai.cloudflare.com"

	path := requestURL
	if strings.HasPrefix(baseURL, cloudflareGateway) {
		switch channelType {
		case common.ChannelTypeOpenAI:
			path = strings.TrimPrefix(requestURL, "/v1")
		case common.ChannelTypeAzure:
			path = strings.TrimPrefix(requestURL, "/openai/deployments")
		}
	}
	return fmt.Sprintf("%s%s", baseURL, path)
}

// postConsumeQuota books quota against a token and records the usage.
//
// It first applies quota to the token via model.PostConsumeTokenQuota and then
// refreshes the user's cached quota via model.CacheUpdateUserQuota; a failure
// of either step is logged with common.SysError and does not stop the
// function. When quota is non-zero it additionally writes a consume log whose
// text states the model ratio and the group ratio, and updates the used-quota
// counters of the user and the channel.
func postConsumeQuota(ctx context.Context, tokenId int, quota int, userId int, channelId int, modelRatio float64, groupRatio float64, modelName string, tokenName string) {
	if err := model.PostConsumeTokenQuota(tokenId, quota); err != nil {
		common.SysError("error consuming token remain quota: " + err.Error())
	}
	if err := model.CacheUpdateUserQuota(userId); err != nil {
		common.SysError("error update user quota cache: " + err.Error())
	}

	// Nothing was consumed, so there is nothing to log or account for.
	if quota == 0 {
		return
	}

	// Log text: "model ratio %.2f, group ratio %.2f".
	ratioNote := fmt.Sprintf("模型倍率 %.2f，分组倍率 %.2f", modelRatio, groupRatio)
	model.RecordConsumeLog(ctx, userId, channelId, 0, 0, modelName, tokenName, quota, ratioNote)
	model.UpdateUserUsedQuotaAndRequestCount(userId, quota)
	model.UpdateChannelUsedQuota(channelId, quota)
}
fix: make the token number calculation more accurate (#101) * Make token calculation more accurate. * fix: make the token number calculation more accurate --------- Co-authored-by: JustSong <songquanpeng@foxmail.com> 2023-05-19 01:41:26 +00:00			`package controller`

			`import (`
feat: support tts model (#713) * Added support for Text-to-Speech models and endpoints * chore: update impl --------- Co-authored-by: JustSong <songquanpeng@foxmail.com> 2023-11-17 13:18:51 +00:00			`"context"`
fix: fix error response (close #468) 2023-08-26 04:37:45 +00:00			`"encoding/json"`
fix: make the token number calculation more accurate (#101) * Make token calculation more accurate. * fix: make the token number calculation more accurate --------- Co-authored-by: JustSong <songquanpeng@foxmail.com> 2023-05-19 01:41:26 +00:00			`"fmt"`
fix: fix error response (close #468) 2023-08-26 04:37:45 +00:00			`"io"`
fix: disable channel when 401 received (close #467) 2023-08-26 04:05:18 +00:00			`"net/http"`
fix: make the token number calculation more accurate (#101) * Make token calculation more accurate. * fix: make the token number calculation more accurate --------- Co-authored-by: JustSong <songquanpeng@foxmail.com> 2023-05-19 01:41:26 +00:00			`"one-api/common"`
feat: support tts model (#713) * Added support for Text-to-Speech models and endpoints * chore: update impl --------- Co-authored-by: JustSong <songquanpeng@foxmail.com> 2023-11-17 13:18:51 +00:00			`"one-api/model"`
fix: fix error response (close #468) 2023-08-26 04:37:45 +00:00			`"strconv"`
perf: lazy initialization for token encoders (close #566) 2023-09-29 09:56:11 +00:00			`"strings"`
feat: support cloudflare gateway for azure (#666) * 🐛 Fix cloudflare gateway request failure * 🐛 fix channel test url error 2023-11-19 07:52:35 +00:00
			`"github.com/gin-gonic/gin"`
			`"github.com/pkoukk/tiktoken-go"`
fix: make the token number calculation more accurate (#101) * Make token calculation more accurate. * fix: make the token number calculation more accurate --------- Co-authored-by: JustSong <songquanpeng@foxmail.com> 2023-05-19 01:41:26 +00:00			`)`

fix: fix finish_reason fileld not fully compatible with OpenAI (close #372, #373) * optimize:unify finish_reason field * refactor: use a global stop finish reason --------- Co-authored-by: JustSong <songquanpeng@foxmail.com> 2023-08-12 03:04:53 +00:00			`var stopFinishReason = "stop"`

perf: lazy initialization for token encoders (close #566) 2023-09-29 09:56:11 +00:00			`// tokenEncoderMap won't grow after initialization`
fix: make the token number calculation more accurate (#101) * Make token calculation more accurate. * fix: make the token number calculation more accurate --------- Co-authored-by: JustSong <songquanpeng@foxmail.com> 2023-05-19 01:41:26 +00:00			`var tokenEncoderMap = map[string]*tiktoken.Tiktoken{}`
perf: lazy initialization for token encoders (close #566) 2023-09-29 09:56:11 +00:00			`var defaultTokenEncoder *tiktoken.Tiktoken`
fix: make the token number calculation more accurate (#101) * Make token calculation more accurate. * fix: make the token number calculation more accurate --------- Co-authored-by: JustSong <songquanpeng@foxmail.com> 2023-05-19 01:41:26 +00:00
perf: initialize all token encoder when starting (close #459, close $460) 2023-08-26 05:02:02 +00:00			`func InitTokenEncoders() {`
			`common.SysLog("initializing token encoders")`
perf: lazy initialization for token encoders (close #566) 2023-09-29 09:56:11 +00:00			`gpt35TokenEncoder, err := tiktoken.EncodingForModel("gpt-3.5-turbo")`
perf: initialize all token encoder when starting (close #459, close $460) 2023-08-26 05:02:02 +00:00			`if err != nil {`
perf: lazy initialization for token encoders (close #566) 2023-09-29 09:56:11 +00:00			`common.FatalLog(fmt.Sprintf("failed to get gpt-3.5-turbo token encoder: %s", err.Error()))`
			`}`
			`defaultTokenEncoder = gpt35TokenEncoder`
			`gpt4TokenEncoder, err := tiktoken.EncodingForModel("gpt-4")`
			`if err != nil {`
			`common.FatalLog(fmt.Sprintf("failed to get gpt-4 token encoder: %s", err.Error()))`
perf: initialize all token encoder when starting (close #459, close $460) 2023-08-26 05:02:02 +00:00			`}`
			`for model, _ := range common.ModelRatio {`
perf: lazy initialization for token encoders (close #566) 2023-09-29 09:56:11 +00:00			`if strings.HasPrefix(model, "gpt-3.5") {`
			`tokenEncoderMap[model] = gpt35TokenEncoder`
			`} else if strings.HasPrefix(model, "gpt-4") {`
			`tokenEncoderMap[model] = gpt4TokenEncoder`
			`} else {`
			`tokenEncoderMap[model] = nil`
perf: initialize all token encoder when starting (close #459, close $460) 2023-08-26 05:02:02 +00:00			`}`
			`}`
			`common.SysLog("token encoders initialized")`
			`}`

fix: make the token number calculation more accurate (#101) * Make token calculation more accurate. * fix: make the token number calculation more accurate --------- Co-authored-by: JustSong <songquanpeng@foxmail.com> 2023-05-19 01:41:26 +00:00			`func getTokenEncoder(model string) *tiktoken.Tiktoken {`
perf: lazy initialization for token encoders (close #566) 2023-09-29 09:56:11 +00:00			`tokenEncoder, ok := tokenEncoderMap[model]`
			`if ok && tokenEncoder != nil {`
fix: make the token number calculation more accurate (#101) * Make token calculation more accurate. * fix: make the token number calculation more accurate --------- Co-authored-by: JustSong <songquanpeng@foxmail.com> 2023-05-19 01:41:26 +00:00			`return tokenEncoder`
			`}`
perf: lazy initialization for token encoders (close #566) 2023-09-29 09:56:11 +00:00			`if ok {`
			`tokenEncoder, err := tiktoken.EncodingForModel(model)`
fix: use gpt-3.5's encoder if not found (close #110) 2023-05-21 03:11:19 +00:00			`if err != nil {`
perf: lazy initialization for token encoders (close #566) 2023-09-29 09:56:11 +00:00			`common.SysError(fmt.Sprintf("failed to get token encoder for model %s: %s, using encoder for gpt-3.5-turbo", model, err.Error()))`
			`tokenEncoder = defaultTokenEncoder`
fix: use gpt-3.5's encoder if not found (close #110) 2023-05-21 03:11:19 +00:00			`}`
perf: lazy initialization for token encoders (close #566) 2023-09-29 09:56:11 +00:00			`tokenEncoderMap[model] = tokenEncoder`
			`return tokenEncoder`
fix: make the token number calculation more accurate (#101) * Make token calculation more accurate. * fix: make the token number calculation more accurate --------- Co-authored-by: JustSong <songquanpeng@foxmail.com> 2023-05-19 01:41:26 +00:00			`}`
perf: lazy initialization for token encoders (close #566) 2023-09-29 09:56:11 +00:00			`return defaultTokenEncoder`
fix: make the token number calculation more accurate (#101) * Make token calculation more accurate. * fix: make the token number calculation more accurate --------- Co-authored-by: JustSong <songquanpeng@foxmail.com> 2023-05-19 01:41:26 +00:00			`}`

feat: able to approximate token (close #207) 2023-07-04 11:54:13 +00:00			`func getTokenNum(tokenEncoder *tiktoken.Tiktoken, text string) int {`
			`if common.ApproximateTokenEnabled {`
			`return int(float64(len(text)) * 0.38)`
			`}`
			`return len(tokenEncoder.Encode(text, nil, nil))`
			`}`

fix: make the token number calculation more accurate (#101) * Make token calculation more accurate. * fix: make the token number calculation more accurate --------- Co-authored-by: JustSong <songquanpeng@foxmail.com> 2023-05-19 01:41:26 +00:00			`func countTokenMessages(messages []Message, model string) int {`
			`tokenEncoder := getTokenEncoder(model)`
			`// Reference:`
			`// https://github.com/openai/openai-cookbook/blob/main/examples/How_to_count_tokens_with_tiktoken.ipynb`
			`// https://github.com/pkoukk/tiktoken-go/issues/6`
			`//`
			`// Every message follows <|start|>{role/name}\n{content}<|end|>\n`
			`var tokensPerMessage int`
			`var tokensPerName int`
chore: update countTokenMessages (#238) 2023-07-03 01:42:34 +00:00			`if model == "gpt-3.5-turbo-0301" {`
fix: make the token number calculation more accurate (#101) * Make token calculation more accurate. * fix: make the token number calculation more accurate --------- Co-authored-by: JustSong <songquanpeng@foxmail.com> 2023-05-19 01:41:26 +00:00			`tokensPerMessage = 4`
			`tokensPerName = -1 // If there's a name, the role is omitted`
			`} else {`
			`tokensPerMessage = 3`
			`tokensPerName = 1`
			`}`
			`tokenNum := 0`
			`for _, message := range messages {`
			`tokenNum += tokensPerMessage`
feat: support gpt-4 with vision (#683, #714) 2023-11-19 10:38:54 +00:00			`tokenNum += getTokenNum(tokenEncoder, message.StringContent())`
feat: able to approximate token (close #207) 2023-07-04 11:54:13 +00:00			`tokenNum += getTokenNum(tokenEncoder, message.Role)`
feat: support channel ai.ls now (close #99) 2023-05-19 03:07:17 +00:00			`if message.Name != nil {`
fix: make the token number calculation more accurate (#101) * Make token calculation more accurate. * fix: make the token number calculation more accurate --------- Co-authored-by: JustSong <songquanpeng@foxmail.com> 2023-05-19 01:41:26 +00:00			`tokenNum += tokensPerName`
feat: able to approximate token (close #207) 2023-07-04 11:54:13 +00:00			`tokenNum += getTokenNum(tokenEncoder, *message.Name)`
fix: make the token number calculation more accurate (#101) * Make token calculation more accurate. * fix: make the token number calculation more accurate --------- Co-authored-by: JustSong <songquanpeng@foxmail.com> 2023-05-19 01:41:26 +00:00			`}`
			`}`
			`tokenNum += 3 // Every reply is primed with <|start|>assistant<|message|>`
			`return tokenNum`
			`}`

fix: now the input field can be array type now (close #149) 2023-06-12 08:11:57 +00:00			`func countTokenInput(input any, model string) int {`
			`switch input.(type) {`
			`case string:`
			`return countTokenText(input.(string), model)`
			`case []string:`
			`text := ""`
			`for _, s := range input.([]string) {`
			`text += s`
			`}`
			`return countTokenText(text, model)`
			`}`
			`return 0`
			`}`

fix: make the token number calculation more accurate (#101) * Make token calculation more accurate. * fix: make the token number calculation more accurate --------- Co-authored-by: JustSong <songquanpeng@foxmail.com> 2023-05-19 01:41:26 +00:00			`func countTokenText(text string, model string) int {`
			`tokenEncoder := getTokenEncoder(model)`
feat: able to approximate token (close #207) 2023-07-04 11:54:13 +00:00			`return getTokenNum(tokenEncoder, text)`
fix: make the token number calculation more accurate (#101) * Make token calculation more accurate. * fix: make the token number calculation more accurate --------- Co-authored-by: JustSong <songquanpeng@foxmail.com> 2023-05-19 01:41:26 +00:00			`}`
refactor: split the relay controller 2023-06-19 02:28:55 +00:00
			`func errorWrapper(err error, code string, statusCode int) *OpenAIErrorWithStatusCode {`
			`openAIError := OpenAIError{`
			`Message: err.Error(),`
			`Type: "one_api_error",`
			`Code: code,`
			`}`
			`return &OpenAIErrorWithStatusCode{`
			`OpenAIError: openAIError,`
			`StatusCode: statusCode,`
			`}`
			`}`
fix: using whitelist when disabling channels (close #292) 2023-07-22 10:15:30 +00:00
fix: disable channel when 401 received (close #467) 2023-08-26 04:05:18 +00:00			`func shouldDisableChannel(err *OpenAIError, statusCode int) bool {`
fix: using whitelist when disabling channels (close #292) 2023-07-22 10:15:30 +00:00			`if !common.AutomaticDisableChannelEnabled {`
			`return false`
			`}`
			`if err == nil {`
			`return false`
			`}`
fix: disable channel when 401 received (close #467) 2023-08-26 04:05:18 +00:00			`if statusCode == http.StatusUnauthorized {`
			`return true`
			`}`
fix: using whitelist when disabling channels (close #292) 2023-07-22 10:15:30 +00:00			`if err.Type == "insufficient_quota" || err.Code == "invalid_api_key" || err.Code == "account_deactivated" {`
			`return true`
			`}`
			`return false`
			`}`
refactor: add set event stream headers func (#402) 封装流式传输响应头的设置 2023-08-12 13:55:18 +00:00
			`func setEventStreamHeaders(c *gin.Context) {`
			`c.Writer.Header().Set("Content-Type", "text/event-stream")`
			`c.Writer.Header().Set("Cache-Control", "no-cache")`
			`c.Writer.Header().Set("Connection", "keep-alive")`
			`c.Writer.Header().Set("Transfer-Encoding", "chunked")`
			`c.Writer.Header().Set("X-Accel-Buffering", "no")`
			`}`
fix: fix error response (close #468) 2023-08-26 04:37:45 +00:00
			`func relayErrorHandler(resp *http.Response) (openAIErrorWithStatusCode *OpenAIErrorWithStatusCode) {`
			`openAIErrorWithStatusCode = &OpenAIErrorWithStatusCode{`
			`StatusCode: resp.StatusCode,`
			`OpenAIError: OpenAIError{`
			`Message: fmt.Sprintf("bad response status code %d", resp.StatusCode),`
chore: update error code 2023-09-17 03:30:20 +00:00			`Type: "upstream_error",`
fix: fix error response (close #468) 2023-08-26 04:37:45 +00:00			`Code: "bad_response_status_code",`
			`Param: strconv.Itoa(resp.StatusCode),`
			`},`
			`}`
			`responseBody, err := io.ReadAll(resp.Body)`
			`if err != nil {`
			`return`
			`}`
			`err = resp.Body.Close()`
			`if err != nil {`
			`return`
			`}`
			`var textResponse TextResponse`
			`err = json.Unmarshal(responseBody, &textResponse)`
			`if err != nil {`
			`return`
			`}`
			`openAIErrorWithStatusCode.OpenAIError = textResponse.Error`
			`return`
			`}`
feat: add cloudflare ai gateway support for image & audio (#607) * Update channel-test.go * Update relay-audio.go * Update relay-image.go * chore: using a util function --------- Co-authored-by: JustSong <songquanpeng@foxmail.com> 2023-10-22 09:50:52 +00:00
			`func getFullRequestURL(baseURL string, requestURL string, channelType int) string {`
			`fullRequestURL := fmt.Sprintf("%s%s", baseURL, requestURL)`
feat: support cloudflare gateway for azure (#666) * 🐛 Fix cloudflare gateway request failure * 🐛 fix channel test url error 2023-11-19 07:52:35 +00:00
			`if strings.HasPrefix(baseURL, "https://gateway.ai.cloudflare.com") {`
			`switch channelType {`
			`case common.ChannelTypeOpenAI:`
feat: add cloudflare ai gateway support for image & audio (#607) * Update channel-test.go * Update relay-audio.go * Update relay-image.go * chore: using a util function --------- Co-authored-by: JustSong <songquanpeng@foxmail.com> 2023-10-22 09:50:52 +00:00			`fullRequestURL = fmt.Sprintf("%s%s", baseURL, strings.TrimPrefix(requestURL, "/v1"))`
feat: support cloudflare gateway for azure (#666) * 🐛 Fix cloudflare gateway request failure * 🐛 fix channel test url error 2023-11-19 07:52:35 +00:00			`case common.ChannelTypeAzure:`
			`fullRequestURL = fmt.Sprintf("%s%s", baseURL, strings.TrimPrefix(requestURL, "/openai/deployments"))`
feat: add cloudflare ai gateway support for image & audio (#607) * Update channel-test.go * Update relay-audio.go * Update relay-image.go * chore: using a util function --------- Co-authored-by: JustSong <songquanpeng@foxmail.com> 2023-10-22 09:50:52 +00:00			`}`
			`}`
feat: support cloudflare gateway for azure (#666) * 🐛 Fix cloudflare gateway request failure * 🐛 fix channel test url error 2023-11-19 07:52:35 +00:00
feat: add cloudflare ai gateway support for image & audio (#607) * Update channel-test.go * Update relay-audio.go * Update relay-image.go * chore: using a util function --------- Co-authored-by: JustSong <songquanpeng@foxmail.com> 2023-10-22 09:50:52 +00:00			`return fullRequestURL`
			`}`
feat: support tts model (#713) * Added support for Text-to-Speech models and endpoints * chore: update impl --------- Co-authored-by: JustSong <songquanpeng@foxmail.com> 2023-11-17 13:18:51 +00:00
			`func postConsumeQuota(ctx context.Context, tokenId int, quota int, userId int, channelId int, modelRatio float64, groupRatio float64, modelName string, tokenName string) {`
			`err := model.PostConsumeTokenQuota(tokenId, quota)`
			`if err != nil {`
			`common.SysError("error consuming token remain quota: " + err.Error())`
			`}`
			`err = model.CacheUpdateUserQuota(userId)`
			`if err != nil {`
			`common.SysError("error update user quota cache: " + err.Error())`
			`}`
			`if quota != 0 {`
			`logContent := fmt.Sprintf("模型倍率 %.2f，分组倍率 %.2f", modelRatio, groupRatio)`
			`model.RecordConsumeLog(ctx, userId, channelId, 0, 0, modelName, tokenName, quota, logContent)`
			`model.UpdateUserUsedQuotaAndRequestCount(userId, quota)`
			`model.UpdateChannelUsedQuota(channelId, quota)`
			`}`
			`}`