ai-gateway/relay/controller/text.go

77 lines
2.7 KiB
Go
Raw Normal View History

2023-06-19 02:28:55 +00:00
package controller
import (
"fmt"
2024-01-14 11:21:03 +00:00
"github.com/gin-gonic/gin"
2023-06-19 02:28:55 +00:00
"net/http"
"one-api/common"
"one-api/common/logger"
2024-01-14 11:21:03 +00:00
"one-api/relay/channel/openai"
"one-api/relay/constant"
"one-api/relay/util"
2023-06-19 02:28:55 +00:00
"strings"
)
func RelayTextHelper(c *gin.Context) *openai.ErrorWithStatusCode {
ctx := c.Request.Context()
meta := util.GetRelayMeta(c)
// get & validate textRequest
textRequest, err := getAndValidateTextRequest(c, meta.Mode)
if err != nil {
logger.Errorf(ctx, "getAndValidateTextRequest failed: %s", err.Error())
return openai.ErrorWrapper(err, "invalid_text_request", http.StatusBadRequest)
2023-06-19 02:28:55 +00:00
}
// map model name
var isModelMapped bool
textRequest.Model, isModelMapped = util.GetMappedModelName(textRequest.Model, meta.ModelMapping)
// get model ratio & group ratio
2023-06-19 02:28:55 +00:00
modelRatio := common.GetModelRatio(textRequest.Model)
groupRatio := common.GetGroupRatio(meta.Group)
2023-06-19 02:28:55 +00:00
ratio := modelRatio * groupRatio
// pre-consume quota
promptTokens := getPromptTokens(textRequest, meta.Mode)
preConsumedQuota, bizErr := preConsumeQuota(ctx, textRequest, promptTokens, ratio, meta)
if bizErr != nil {
logger.Warnf(ctx, "preConsumeQuota failed: %+v", *bizErr)
return bizErr
}
// get request body
requestBody, err := GetRequestBody(c, *textRequest, isModelMapped, meta.APIType, meta.Mode)
if err != nil {
return openai.ErrorWrapper(err, "get_request_body_failed", http.StatusInternalServerError)
2023-07-22 08:18:03 +00:00
}
// do request
var resp *http.Response
isStream := textRequest.Stream
if meta.APIType != constant.APITypeXunfei { // cause xunfei use websocket
fullRequestURL, err := GetRequestURL(c.Request.URL.String(), meta, textRequest)
if err != nil {
logger.Error(ctx, fmt.Sprintf("util.GetRequestURL failed: %s", err.Error()))
return openai.ErrorWrapper(fmt.Errorf("util.GetRequestURL failed"), "get_request_url_failed", http.StatusInternalServerError)
2023-07-22 08:18:03 +00:00
}
resp, err = doRequest(ctx, c, meta, isStream, fullRequestURL, requestBody)
if err != nil {
logger.Errorf(ctx, "doRequest failed: %s", err.Error())
2024-01-14 11:21:03 +00:00
return openai.ErrorWrapper(err, "do_request_failed", http.StatusInternalServerError)
2023-07-28 15:45:08 +00:00
}
isStream = isStream || strings.HasPrefix(resp.Header.Get("Content-Type"), "text/event-stream")
2023-08-20 14:07:50 +00:00
if resp.StatusCode != http.StatusOK {
util.ReturnPreConsumedQuota(ctx, preConsumedQuota, meta.TokenId)
2024-01-14 11:21:03 +00:00
return util.RelayErrorHandler(resp)
2023-08-20 14:07:50 +00:00
}
}
// do response
usage, respErr := DoResponse(c, textRequest, resp, meta.Mode, meta.APIType, isStream, promptTokens)
if respErr != nil {
logger.Errorf(ctx, "respErr is not nil: %+v", respErr)
util.ReturnPreConsumedQuota(ctx, preConsumedQuota, meta.TokenId)
return respErr
2023-06-19 02:28:55 +00:00
}
// post-consume quota
go postConsumeQuota(ctx, usage, meta, textRequest, ratio, preConsumedQuota, modelRatio, groupRatio)
return nil
2023-06-19 02:28:55 +00:00
}