refactor: refactor image relay (close #1068)

JustSong 2024-03-03 19:30:11 +08:00
parent 1d0b7fb5ae
commit de18d6fe16
4 changed files with 122 additions and 116 deletions

View File

@@ -7,29 +7,6 @@ import (
 	"time"
 )
 
-var DalleSizeRatios = map[string]map[string]float64{
-	"dall-e-2": {
-		"256x256":   1,
-		"512x512":   1.125,
-		"1024x1024": 1.25,
-	},
-	"dall-e-3": {
-		"1024x1024": 1,
-		"1024x1792": 2,
-		"1792x1024": 2,
-	},
-}
-
-var DalleGenerationImageAmounts = map[string][2]int{
-	"dall-e-2": {1, 10},
-	"dall-e-3": {1, 1}, // OpenAI allows n=1 currently.
-}
-
-var DalleImagePromptLengthLimitations = map[string]int{
-	"dall-e-2": 1000,
-	"dall-e-3": 4000,
-}
-
 const (
 	USD2RMB = 7
 	USD     = 500 // $0.002 = 1 -> $1 = 500

relay/constant/image.go (new file, 24 additions)
View File

@@ -0,0 +1,24 @@
+package constant
+
+var DalleSizeRatios = map[string]map[string]float64{
+	"dall-e-2": {
+		"256x256":   1,
+		"512x512":   1.125,
+		"1024x1024": 1.25,
+	},
+	"dall-e-3": {
+		"1024x1024": 1,
+		"1024x1792": 2,
+		"1792x1024": 2,
+	},
+}
+
+var DalleGenerationImageAmounts = map[string][2]int{
+	"dall-e-2": {1, 10},
+	"dall-e-3": {1, 1}, // OpenAI allows n=1 currently.
+}
+
+var DalleImagePromptLengthLimitations = map[string]int{
+	"dall-e-2": 1000,
+	"dall-e-3": 4000,
+}

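The tables above drive image pricing downstream. Below is a minimal standalone sketch (not part of this commit) of how a size ratio turns into a quota charge, mirroring the getImageCostRatio and quota logic shown later in this diff; the modelRatio and groupRatio values are made-up placeholders, the real ones come from common.GetModelRatio and common.GetGroupRatio.

package main

import "fmt"

// Same shape as constant.DalleSizeRatios added above (dall-e-3 entries only).
var dalleSizeRatios = map[string]map[string]float64{
	"dall-e-3": {"1024x1024": 1, "1024x1792": 2, "1792x1024": 2},
}

func main() {
	model, size, quality, n := "dall-e-3", "1024x1024", "hd", 1

	// Per-size cost ratio; an unknown model/size pair would be rejected upstream.
	imageCostRatio := dalleSizeRatios[model][size]

	// HD quality on dall-e-3 doubles the 1024x1024 ratio (1.5x for the larger sizes),
	// matching getImageCostRatio in this commit.
	if quality == "hd" && model == "dall-e-3" {
		if size == "1024x1024" {
			imageCostRatio *= 2
		} else {
			imageCostRatio *= 1.5
		}
	}

	// Placeholder ratios for illustration only; one-api reads these from its
	// model/group ratio tables at runtime.
	modelRatio, groupRatio := 20.0, 1.0
	ratio := modelRatio * groupRatio

	// Same formula as RelayImageHelper: quota := int(ratio*imageCostRatio*1000) * n
	quota := int(ratio*imageCostRatio*1000) * n
	fmt.Println("quota:", quota) // 40000 with the placeholder ratios above
}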
View File

@@ -36,6 +36,65 @@ func getAndValidateTextRequest(c *gin.Context, relayMode int) (*relaymodel.Gener
 	return textRequest, nil
 }
 
+func getImageRequest(c *gin.Context, relayMode int) (*openai.ImageRequest, error) {
+	imageRequest := &openai.ImageRequest{}
+	err := common.UnmarshalBodyReusable(c, imageRequest)
+	if err != nil {
+		return nil, err
+	}
+	if imageRequest.N == 0 {
+		imageRequest.N = 1
+	}
+	if imageRequest.Size == "" {
+		imageRequest.Size = "1024x1024"
+	}
+	if imageRequest.Model == "" {
+		imageRequest.Model = "dall-e-2"
+	}
+	return imageRequest, nil
+}
+
+func validateImageRequest(imageRequest *openai.ImageRequest, meta *util.RelayMeta) *relaymodel.ErrorWithStatusCode {
+	// model validation
+	_, hasValidSize := constant.DalleSizeRatios[imageRequest.Model][imageRequest.Size]
+	if !hasValidSize {
+		return openai.ErrorWrapper(errors.New("size not supported for this image model"), "size_not_supported", http.StatusBadRequest)
+	}
+	// check prompt length
+	if imageRequest.Prompt == "" {
+		return openai.ErrorWrapper(errors.New("prompt is required"), "prompt_missing", http.StatusBadRequest)
+	}
+	if len(imageRequest.Prompt) > constant.DalleImagePromptLengthLimitations[imageRequest.Model] {
+		return openai.ErrorWrapper(errors.New("prompt is too long"), "prompt_too_long", http.StatusBadRequest)
+	}
+	// Number of generated images validation
+	if !isWithinRange(imageRequest.Model, imageRequest.N) {
+		// channel not azure
+		if meta.ChannelType != common.ChannelTypeAzure {
+			return openai.ErrorWrapper(errors.New("invalid value of n"), "n_not_within_range", http.StatusBadRequest)
+		}
+	}
+	return nil
+}
+
+func getImageCostRatio(imageRequest *openai.ImageRequest) (float64, error) {
+	if imageRequest == nil {
+		return 0, errors.New("imageRequest is nil")
+	}
+	imageCostRatio, hasValidSize := constant.DalleSizeRatios[imageRequest.Model][imageRequest.Size]
+	if !hasValidSize {
+		return 0, fmt.Errorf("size not supported for this image model: %s", imageRequest.Size)
+	}
+	if imageRequest.Quality == "hd" && imageRequest.Model == "dall-e-3" {
+		if imageRequest.Size == "1024x1024" {
+			imageCostRatio *= 2
+		} else {
+			imageCostRatio *= 1.5
+		}
+	}
+	return imageCostRatio, nil
+}
+
 func getPromptTokens(textRequest *relaymodel.GeneralOpenAIRequest, relayMode int) int {
 	switch relayMode {
 	case constant.RelayModeChatCompletions:

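The three helpers added above replace the inline parsing, validation, and pricing code in RelayImageHelper. A simplified sketch of the call order, based on the controller changes in the next file of this diff (quota accounting and the upstream request omitted):

// Simplified sketch only; the real handler is RelayImageHelper below.
func relayImageSketch(c *gin.Context) *relaymodel.ErrorWithStatusCode {
	ctx := c.Request.Context()
	meta := util.GetRelayMeta(c)

	// 1. Parse the body and fill defaults (n=1, size 1024x1024, model dall-e-2).
	imageRequest, err := getImageRequest(c, meta.Mode)
	if err != nil {
		logger.Errorf(ctx, "getImageRequest failed: %s", err.Error())
		return openai.ErrorWrapper(err, "invalid_image_request", http.StatusBadRequest)
	}

	// 2. Apply the channel's model mapping before validating and pricing.
	meta.OriginModelName = imageRequest.Model
	imageRequest.Model, _ = util.GetMappedModelName(imageRequest.Model, meta.ModelMapping)
	meta.ActualModelName = imageRequest.Model

	// 3. Validate size, prompt, and n against the tables in relay/constant.
	if bizErr := validateImageRequest(imageRequest, meta); bizErr != nil {
		return bizErr
	}

	// 4. Derive the per-image cost ratio used to pre-consume quota.
	imageCostRatio, err := getImageCostRatio(imageRequest)
	if err != nil {
		return openai.ErrorWrapper(err, "get_image_cost_ratio_failed", http.StatusInternalServerError)
	}
	_ = imageCostRatio // quota calculation and the upstream call follow in the real handler

	return nil
}

Splitting these steps out keeps the handler focused on the relay itself and lets the request parsing, validation, and pricing logic be exercised without a full gin request.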
View File

@@ -10,6 +10,7 @@ import (
 	"github.com/songquanpeng/one-api/common/logger"
 	"github.com/songquanpeng/one-api/model"
 	"github.com/songquanpeng/one-api/relay/channel/openai"
+	"github.com/songquanpeng/one-api/relay/constant"
 	relaymodel "github.com/songquanpeng/one-api/relay/model"
 	"github.com/songquanpeng/one-api/relay/util"
 	"io"
@@ -20,120 +21,65 @@ import (
 )
 
 func isWithinRange(element string, value int) bool {
-	if _, ok := common.DalleGenerationImageAmounts[element]; !ok {
+	if _, ok := constant.DalleGenerationImageAmounts[element]; !ok {
 		return false
 	}
-	min := common.DalleGenerationImageAmounts[element][0]
-	max := common.DalleGenerationImageAmounts[element][1]
+	min := constant.DalleGenerationImageAmounts[element][0]
+	max := constant.DalleGenerationImageAmounts[element][1]
 	return value >= min && value <= max
 }
 
 func RelayImageHelper(c *gin.Context, relayMode int) *relaymodel.ErrorWithStatusCode {
-	imageModel := "dall-e-2"
-	imageSize := "1024x1024"
-
-	tokenId := c.GetInt("token_id")
-	channelType := c.GetInt("channel")
-	channelId := c.GetInt("channel_id")
-	userId := c.GetInt("id")
-	group := c.GetString("group")
-
-	var imageRequest openai.ImageRequest
-	err := common.UnmarshalBodyReusable(c, &imageRequest)
+	ctx := c.Request.Context()
+	meta := util.GetRelayMeta(c)
+	imageRequest, err := getImageRequest(c, meta.Mode)
 	if err != nil {
-		return openai.ErrorWrapper(err, "bind_request_body_failed", http.StatusBadRequest)
-	}
-
-	if imageRequest.N == 0 {
-		imageRequest.N = 1
-	}
-
-	// Size validation
-	if imageRequest.Size != "" {
-		imageSize = imageRequest.Size
-	}
-
-	// Model validation
-	if imageRequest.Model != "" {
-		imageModel = imageRequest.Model
-	}
-
-	imageCostRatio, hasValidSize := common.DalleSizeRatios[imageModel][imageSize]
-
-	// Check if model is supported
-	if hasValidSize {
-		if imageRequest.Quality == "hd" && imageModel == "dall-e-3" {
-			if imageSize == "1024x1024" {
-				imageCostRatio *= 2
-			} else {
-				imageCostRatio *= 1.5
-			}
-		}
-	} else {
-		return openai.ErrorWrapper(errors.New("size not supported for this image model"), "size_not_supported", http.StatusBadRequest)
-	}
-
-	// Prompt validation
-	if imageRequest.Prompt == "" {
-		return openai.ErrorWrapper(errors.New("prompt is required"), "prompt_missing", http.StatusBadRequest)
-	}
-
-	// Check prompt length
-	if len(imageRequest.Prompt) > common.DalleImagePromptLengthLimitations[imageModel] {
-		return openai.ErrorWrapper(errors.New("prompt is too long"), "prompt_too_long", http.StatusBadRequest)
-	}
-
-	// Number of generated images validation
-	if !isWithinRange(imageModel, imageRequest.N) {
-		// channel not azure
-		if channelType != common.ChannelTypeAzure {
-			return openai.ErrorWrapper(errors.New("invalid value of n"), "n_not_within_range", http.StatusBadRequest)
-		}
+		logger.Errorf(ctx, "getImageRequest failed: %s", err.Error())
+		return openai.ErrorWrapper(err, "invalid_image_request", http.StatusBadRequest)
 	}
 
 	// map model name
-	modelMapping := c.GetString("model_mapping")
-	isModelMapped := false
-	if modelMapping != "" {
-		modelMap := make(map[string]string)
-		err := json.Unmarshal([]byte(modelMapping), &modelMap)
-		if err != nil {
-			return openai.ErrorWrapper(err, "unmarshal_model_mapping_failed", http.StatusInternalServerError)
-		}
-		if modelMap[imageModel] != "" {
-			imageModel = modelMap[imageModel]
-			isModelMapped = true
-		}
-	}
-	baseURL := common.ChannelBaseURLs[channelType]
+	var isModelMapped bool
+	meta.OriginModelName = imageRequest.Model
+	imageRequest.Model, isModelMapped = util.GetMappedModelName(imageRequest.Model, meta.ModelMapping)
+	meta.ActualModelName = imageRequest.Model
+
+	// model validation
+	bizErr := validateImageRequest(imageRequest, meta)
+	if bizErr != nil {
+		return bizErr
+	}
+
+	imageCostRatio, err := getImageCostRatio(imageRequest)
+	if err != nil {
+		return openai.ErrorWrapper(err, "get_image_cost_ratio_failed", http.StatusInternalServerError)
+	}
+
 	requestURL := c.Request.URL.String()
-	if c.GetString("base_url") != "" {
-		baseURL = c.GetString("base_url")
-	}
-	fullRequestURL := util.GetFullRequestURL(baseURL, requestURL, channelType)
-	if channelType == common.ChannelTypeAzure {
+	fullRequestURL := util.GetFullRequestURL(meta.BaseURL, requestURL, meta.ChannelType)
+	if meta.ChannelType == common.ChannelTypeAzure {
 		// https://learn.microsoft.com/en-us/azure/ai-services/openai/dall-e-quickstart?tabs=dalle3%2Ccommand-line&pivots=rest-api
 		apiVersion := util.GetAzureAPIVersion(c)
 		// https://{resource_name}.openai.azure.com/openai/deployments/dall-e-3/images/generations?api-version=2023-06-01-preview
-		fullRequestURL = fmt.Sprintf("%s/openai/deployments/%s/images/generations?api-version=%s", baseURL, imageModel, apiVersion)
+		fullRequestURL = fmt.Sprintf("%s/openai/deployments/%s/images/generations?api-version=%s", meta.BaseURL, imageRequest.Model, apiVersion)
 	}
 
 	var requestBody io.Reader
-	if isModelMapped || channelType == common.ChannelTypeAzure { // make Azure channel request body
+	if isModelMapped || meta.ChannelType == common.ChannelTypeAzure { // make Azure channel request body
 		jsonStr, err := json.Marshal(imageRequest)
 		if err != nil {
-			return openai.ErrorWrapper(err, "marshal_text_request_failed", http.StatusInternalServerError)
+			return openai.ErrorWrapper(err, "marshal_image_request_failed", http.StatusInternalServerError)
 		}
 		requestBody = bytes.NewBuffer(jsonStr)
 	} else {
 		requestBody = c.Request.Body
 	}
 
-	modelRatio := common.GetModelRatio(imageModel)
-	groupRatio := common.GetGroupRatio(group)
+	modelRatio := common.GetModelRatio(imageRequest.Model)
+	groupRatio := common.GetGroupRatio(meta.Group)
 	ratio := modelRatio * groupRatio
-	userQuota, err := model.CacheGetUserQuota(userId)
+	userQuota, err := model.CacheGetUserQuota(meta.UserId)
 
 	quota := int(ratio*imageCostRatio*1000) * imageRequest.N
@@ -146,7 +92,7 @@ func RelayImageHelper(c *gin.Context, relayMode int) *relaymodel.ErrorWithStatus
 		return openai.ErrorWrapper(err, "new_request_failed", http.StatusInternalServerError)
 	}
 	token := c.Request.Header.Get("Authorization")
-	if channelType == common.ChannelTypeAzure { // Azure authentication
+	if meta.ChannelType == common.ChannelTypeAzure { // Azure authentication
 		token = strings.TrimPrefix(token, "Bearer ")
 		req.Header.Set("api-key", token)
 	} else {
@@ -169,25 +115,25 @@ func RelayImageHelper(c *gin.Context, relayMode int) *relaymodel.ErrorWithStatus
 	if err != nil {
 		return openai.ErrorWrapper(err, "close_request_body_failed", http.StatusInternalServerError)
 	}
-	var textResponse openai.ImageResponse
+	var imageResponse openai.ImageResponse
 
 	defer func(ctx context.Context) {
 		if resp.StatusCode != http.StatusOK {
 			return
 		}
-		err := model.PostConsumeTokenQuota(tokenId, quota)
+		err := model.PostConsumeTokenQuota(meta.TokenId, quota)
 		if err != nil {
 			logger.SysError("error consuming token remain quota: " + err.Error())
 		}
-		err = model.CacheUpdateUserQuota(userId)
+		err = model.CacheUpdateUserQuota(meta.UserId)
 		if err != nil {
 			logger.SysError("error update user quota cache: " + err.Error())
 		}
 		if quota != 0 {
 			tokenName := c.GetString("token_name")
			logContent := fmt.Sprintf("模型倍率 %.2f,分组倍率 %.2f", modelRatio, groupRatio)
-			model.RecordConsumeLog(ctx, userId, channelId, 0, 0, imageModel, tokenName, quota, logContent)
-			model.UpdateUserUsedQuotaAndRequestCount(userId, quota)
+			model.RecordConsumeLog(ctx, meta.UserId, meta.ChannelId, 0, 0, imageRequest.Model, tokenName, quota, logContent)
+			model.UpdateUserUsedQuotaAndRequestCount(meta.UserId, quota)
 			channelId := c.GetInt("channel_id")
 			model.UpdateChannelUsedQuota(channelId, quota)
 		}
@@ -202,7 +148,7 @@ func RelayImageHelper(c *gin.Context, relayMode int) *relaymodel.ErrorWithStatus
 	if err != nil {
 		return openai.ErrorWrapper(err, "close_response_body_failed", http.StatusInternalServerError)
 	}
-	err = json.Unmarshal(responseBody, &textResponse)
+	err = json.Unmarshal(responseBody, &imageResponse)
 	if err != nil {
 		return openai.ErrorWrapper(err, "unmarshal_response_body_failed", http.StatusInternalServerError)
 	}