// ai-gateway/middleware/distributor.go

package middleware

import (
	"fmt"
	"github.com/gin-gonic/gin"
	"github.com/songquanpeng/one-api/common/ctxkey"
	"github.com/songquanpeng/one-api/common/logger"
	"github.com/songquanpeng/one-api/model"
	"github.com/songquanpeng/one-api/relay/channeltype"
	"net/http"
	"strconv"
)

// ModelRequest carries a single model name. The field is tagged so that it
// can be decoded from either a JSON body or form data under the key "model".
type ModelRequest struct {
	Model string `json:"model" form:"model"`
}

// Distribute returns a gin middleware that selects the channel used to serve
// the current request and records its settings on the context.
//
// The user id is read from ctxkey.Id; the user's group is looked up and stored
// under ctxkey.Group. When ctxkey.SpecificChannelId is present, that channel is
// loaded by id and must have status model.ChannelStatusEnabled. Otherwise a
// channel is picked with model.CacheGetRandomSatisfiedChannel for the user's
// group and the model name stored under ctxkey.RequestModel.
//
// On any failure the middleware reports the problem through abortWithMessage
// and returns without calling c.Next. On success it calls
// SetupContextForSelectedChannel and then c.Next.
func Distribute() func(c *gin.Context) {
	return func(c *gin.Context) {
		userId := c.GetInt(ctxkey.Id)
		// NOTE(review): the lookup error is discarded and whatever group value
		// was returned is used for channel selection below — confirm this
		// best-effort behavior is intended.
		userGroup, _ := model.CacheGetUserGroup(userId)
		c.Set(ctxkey.Group, userGroup)
		var requestModel string
		var channel *model.Channel
		if channelId, ok := c.Get(ctxkey.SpecificChannelId); ok {
			// Use the comma-ok form so a non-string value stored under this key
			// is rejected as an invalid channel id instead of panicking.
			rawId, isString := channelId.(string)
			if !isString {
				abortWithMessage(c, http.StatusBadRequest, "无效的渠道 Id")
				return
			}
			id, err := strconv.Atoi(rawId)
			if err != nil {
				abortWithMessage(c, http.StatusBadRequest, "无效的渠道 Id")
				return
			}
			channel, err = model.GetChannelById(id, true)
			if err != nil {
				abortWithMessage(c, http.StatusBadRequest, "无效的渠道 Id")
				return
			}
			if channel.Status != model.ChannelStatusEnabled {
				abortWithMessage(c, http.StatusForbidden, "该渠道已被禁用")
				return
			}
			// requestModel is intentionally left untouched (empty) on this path;
			// it is only populated when a channel has to be chosen by model.
		} else {
			requestModel = c.GetString(ctxkey.RequestModel)
			var err error
			channel, err = model.CacheGetRandomSatisfiedChannel(userGroup, requestModel, false)
			if err != nil {
				// Default message: no channel available for this group/model pair.
				message := fmt.Sprintf("当前分组 %s 下对于模型 %s 无可用渠道", userGroup, requestModel)
				if channel != nil {
					// A channel value returned together with an error is logged
					// as a missing channel and reported to the client as a
					// database consistency problem.
					logger.SysError(fmt.Sprintf("渠道不存在：%d", channel.Id))
					message = "数据库一致性已被破坏，请联系管理员"
				}
				abortWithMessage(c, http.StatusServiceUnavailable, message)
				return
			}
		}
		SetupContextForSelectedChannel(c, channel, requestModel)
		c.Next()
	}
}

// SetupContextForSelectedChannel copies the settings of the chosen channel
// onto the gin context and the outgoing request.
//
// It stores the channel's type, id, name, model mapping and base URL under
// their ctxkey entries, records modelName under ctxkey.OriginalModel, replaces
// the request's Authorization header with a Bearer value built from
// channel.Key, and finally stores the channel's loaded config under
// ctxkey.Config.
func SetupContextForSelectedChannel(c *gin.Context, channel *model.Channel, modelName string) {
	// Plain context values describing the selected channel.
	c.Set(ctxkey.Channel, channel.Type)
	c.Set(ctxkey.ChannelId, channel.Id)
	c.Set(ctxkey.ChannelName, channel.Name)
	c.Set(ctxkey.ModelMapping, channel.GetModelMapping())
	c.Set(ctxkey.OriginalModel, modelName) // kept so a retry can see the requested model
	c.Set(ctxkey.BaseURL, channel.GetBaseURL())

	// The request is authorized with the channel's key from here on.
	c.Request.Header.Set("Authorization", fmt.Sprintf("Bearer %s", channel.Key))

	// NOTE(review): the error from LoadConfig is discarded and the returned
	// config is used as-is — confirm that is intended.
	cfg, _ := channel.LoadConfig()

	// Backward compatibility: when the channel still carries a value in Other,
	// use it to fill the type-specific config field, but only if that field is
	// currently empty.
	if legacy := channel.Other; legacy != nil {
		switch channel.Type {
		case channeltype.Azure, channeltype.Xunfei, channeltype.Gemini:
			if cfg.APIVersion == "" {
				cfg.APIVersion = *legacy
			}
		case channeltype.AIProxyLibrary:
			if cfg.LibraryID == "" {
				cfg.LibraryID = *legacy
			}
		case channeltype.Ali:
			if cfg.Plugin == "" {
				cfg.Plugin = *legacy
			}
		}
	}
	c.Set(ctxkey.Config, cfg)
}
Relay done but not working 2023-04-23 10:24:11 +00:00			`package middleware`

			`import (`
			`"fmt"`
feat: able to set model limitation for token (close #178) 2024-04-03 18:08:18 +00:00			`"github.com/gin-gonic/gin"`
feat: support aws bedrockruntime claude3 (#1328) * feat: support aws bedrockruntime claude3 closes #622, closes #749, closes #1300 * fix: convert to aws claude model id * fix: Update AWS adapter to handle stream completions and calculate usage metrics Based on the file summaries provided, here are the important bullet points for the commit message: - Add functionality to handle stream completion events from AWS in the relay/adaptor/aws/main.go file - Marshall AWS response to OpenAI format and calculate usage metrics in the same file - Implement a custom render function for streaming events in the same file - Improve error handling for JSON unmarshalling and marshalling errors in the same file * fix: Implement AWS handler with usage tracking and error handling - Implemented streaming response handling for AWS handler - Set response content type to text/event-stream - Added error handling for failed marshaling/unmarshaling - Updated return values to include `relaymodel.ErrorWithStatusCode` and `relaymodel.Usage` - Improved error handling and response formatting for AWS adaptor * fix: Refactor AWS Adapter for Improved Model Mapping and Error Handling * Refactor AWS adapter to improve model management - Replace hardcoded model list in `adapter.go` with a function to get models from `awsModelIDMap` - Update `GetModelList` function to return model list directly - Add `GetChannelName` function to get channel name from `Adaptor` object * Improve error handling and code organization in main.go - Replace switch statement with a map to map AWS model IDs to OpenAI model IDs - Return an error if the model is not found in the map - Use a single return statement instead of wrapping multiple return statements in the `awsModelID` function - Add a new error message for when the model is not found in the map in the `Handler` function * fix: bug fix * chore: change variable name & package * chore: change variable name * perf: update config related code --------- Co-authored-by: 
JustSong <songquanpeng@foxmail.com> 2024-04-19 16:40:47 +00:00			`"github.com/songquanpeng/one-api/common/ctxkey"`
chore: update module name 2024-01-28 11:38:58 +00:00			`"github.com/songquanpeng/one-api/common/logger"`
			`"github.com/songquanpeng/one-api/model"`
chore: reorganize constant related package 2024-04-05 16:44:33 +00:00			`"github.com/songquanpeng/one-api/relay/channeltype"`
Relay done but not working 2023-04-23 10:24:11 +00:00			`"net/http"`
			`"strconv"`
			`)`

feat: support group now (close #17, close #72, close #85, close #104, close #136) Co-authored-by: quzard <1191890118@qq.com> 2023-06-07 15:26:00 +00:00			`type ModelRequest struct {`
feat: support multipart/form-data format request (#1690) * "add parser multipart/form-data" * chore: fix impl * chore: update impl --------- Co-authored-by: JustSong <songquanpeng@foxmail.com> 2024-09-22 09:32:47 +00:00			Model string `json:"model" form:"model"`
feat: support group now (close #17, close #72, close #85, close #104, close #136) Co-authored-by: quzard <1191890118@qq.com> 2023-06-07 15:26:00 +00:00			`}`

Relay done but not working 2023-04-23 10:24:11 +00:00			`func Distribute() func(c *gin.Context) {`
			`return func(c *gin.Context) {`
chore: do not hardcode context key 2024-04-21 11:43:23 +00:00			`userId := c.GetInt(ctxkey.Id)`
feat: use cache to avoid database access (#158) 2023-06-20 11:09:49 +00:00			`userGroup, _ := model.CacheGetUserGroup(userId)`
chore: do not hardcode context key 2024-04-21 11:43:23 +00:00			`c.Set(ctxkey.Group, userGroup)`
feat: built in retry supported (close #1036, close #770) 2024-02-25 11:01:49 +00:00			`var requestModel string`
Relay done but not working 2023-04-23 10:24:11 +00:00			`var channel *model.Channel`
chore: do not hardcode context key 2024-04-21 11:43:23 +00:00			`channelId, ok := c.Get(ctxkey.SpecificChannelId)`
Relay done but not working 2023-04-23 10:24:11 +00:00			`if ok {`
			`id, err := strconv.Atoi(channelId.(string))`
			`if err != nil {`
feat: support Tencent's model (close #519) 2023-10-03 06:19:03 +00:00			`abortWithMessage(c, http.StatusBadRequest, "无效的渠道 Id")`
Relay done but not working 2023-04-23 10:24:11 +00:00			`return`
			`}`
			`channel, err = model.GetChannelById(id, true)`
			`if err != nil {`
feat: support Tencent's model (close #519) 2023-10-03 06:19:03 +00:00			`abortWithMessage(c, http.StatusBadRequest, "无效的渠道 Id")`
Relay done but not working 2023-04-23 10:24:11 +00:00			`return`
			`}`
chore: reorganize common package 2024-04-05 18:03:59 +00:00			`if channel.Status != model.ChannelStatusEnabled {`
refactor: update logging related logic 2023-09-17 07:39:46 +00:00			`abortWithMessage(c, http.StatusForbidden, "该渠道已被禁用")`
Relay done but not working 2023-04-23 10:24:11 +00:00			`return`
			`}`
			`} else {`
chore: do not hardcode context key 2024-04-21 11:43:23 +00:00			`requestModel = c.GetString(ctxkey.RequestModel)`
feat: able to set model limitation for token (close #178) 2024-04-03 18:08:18 +00:00			`var err error`
			`channel, err = model.CacheGetRandomSatisfiedChannel(userGroup, requestModel, false)`
Relay done but not working 2023-04-23 10:24:11 +00:00			`if err != nil {`
feat: able to set model limitation for token (close #178) 2024-04-03 18:08:18 +00:00			`message := fmt.Sprintf("当前分组 %s 下对于模型 %s 无可用渠道", userGroup, requestModel)`
fix: fix the wrong message when channel is deleted 2023-06-29 03:27:34 +00:00			`if channel != nil {`
refactor: refactor relay part (#957) * refactor: refactor relay part * refactor: refactor config part 2024-01-21 15:21:42 +00:00			`logger.SysError(fmt.Sprintf("渠道不存在：%d", channel.Id))`
fix: fix the wrong message when channel is deleted 2023-06-29 03:27:34 +00:00			`message = "数据库一致性已被破坏，请联系管理员"`
			`}`
refactor: update logging related logic 2023-09-17 07:39:46 +00:00			`abortWithMessage(c, http.StatusServiceUnavailable, message)`
Relay done but not working 2023-04-23 10:24:11 +00:00			`return`
			`}`
			`}`
feat: built in retry supported (close #1036, close #770) 2024-02-25 11:01:49 +00:00			`SetupContextForSelectedChannel(c, channel, requestModel)`
Relay done but not working 2023-04-23 10:24:11 +00:00			`c.Next()`
			`}`
			`}`
feat: built in retry supported (close #1036, close #770) 2024-02-25 11:01:49 +00:00
			`func SetupContextForSelectedChannel(c gin.Context, channel model.Channel, modelName string) {`
chore: do not hardcode context key 2024-04-21 11:43:23 +00:00			`c.Set(ctxkey.Channel, channel.Type)`
			`c.Set(ctxkey.ChannelId, channel.Id)`
			`c.Set(ctxkey.ChannelName, channel.Name)`
			`c.Set(ctxkey.ModelMapping, channel.GetModelMapping())`
feat: support aws bedrockruntime claude3 (#1328) * feat: support aws bedrockruntime claude3 closes #622, closes #749, closes #1300 * fix: convert to aws claude model id * fix: Update AWS adapter to handle stream completions and calculate usage metrics Based on the file summaries provided, here are the important bullet points for the commit message: - Add functionality to handle stream completion events from AWS in the relay/adaptor/aws/main.go file - Marshall AWS response to OpenAI format and calculate usage metrics in the same file - Implement a custom render function for streaming events in the same file - Improve error handling for JSON unmarshalling and marshalling errors in the same file * fix: Implement AWS handler with usage tracking and error handling - Implemented streaming response handling for AWS handler - Set response content type to text/event-stream - Added error handling for failed marshaling/unmarshaling - Updated return values to include `relaymodel.ErrorWithStatusCode` and `relaymodel.Usage` - Improved error handling and response formatting for AWS adaptor * fix: Refactor AWS Adapter for Improved Model Mapping and Error Handling * Refactor AWS adapter to improve model management - Replace hardcoded model list in `adapter.go` with a function to get models from `awsModelIDMap` - Update `GetModelList` function to return model list directly - Add `GetChannelName` function to get channel name from `Adaptor` object * Improve error handling and code organization in main.go - Replace switch statement with a map to map AWS model IDs to OpenAI model IDs - Return an error if the model is not found in the map - Use a single return statement instead of wrapping multiple return statements in the `awsModelID` function - Add a new error message for when the model is not found in the map in the `Handler` function * fix: bug fix * chore: change variable name & package * chore: change variable name * perf: update config related code --------- Co-authored-by: 
JustSong <songquanpeng@foxmail.com> 2024-04-19 16:40:47 +00:00			`c.Set(ctxkey.OriginalModel, modelName) // for retry`
feat: built in retry supported (close #1036, close #770) 2024-02-25 11:01:49 +00:00			`c.Request.Header.Set("Authorization", fmt.Sprintf("Bearer %s", channel.Key))`
chore: do not hardcode context key 2024-04-21 11:43:23 +00:00			`c.Set(ctxkey.BaseURL, channel.GetBaseURL())`
feat: support cloudflare now 2024-04-26 15:05:48 +00:00			`cfg, _ := channel.LoadConfig()`
feat: built in retry supported (close #1036, close #770) 2024-02-25 11:01:49 +00:00			`// this is for backward compatibility`
fix: support for Spark Lite model (#1526) * fix: Support for Spark Lite model * fix: fix panic * fix: fix xunfei version config --------- Co-authored-by: JustSong <39998050+songquanpeng@users.noreply.github.com> Co-authored-by: JustSong <songquanpeng@foxmail.com> 2024-06-12 16:07:26 +00:00			`if channel.Other != nil {`
			`switch channel.Type {`
			`case channeltype.Azure:`
			`if cfg.APIVersion == "" {`
			`cfg.APIVersion = *channel.Other`
			`}`
			`case channeltype.Xunfei:`
			`if cfg.APIVersion == "" {`
			`cfg.APIVersion = *channel.Other`
			`}`
			`case channeltype.Gemini:`
			`if cfg.APIVersion == "" {`
			`cfg.APIVersion = *channel.Other`
			`}`
			`case channeltype.AIProxyLibrary:`
			`if cfg.LibraryID == "" {`
			`cfg.LibraryID = *channel.Other`
			`}`
			`case channeltype.Ali:`
			`if cfg.Plugin == "" {`
			`cfg.Plugin = *channel.Other`
			`}`
feat: support cloudflare now 2024-04-26 15:05:48 +00:00			`}`
feat: built in retry supported (close #1036, close #770) 2024-02-25 11:01:49 +00:00			`}`
feat: support cloudflare now 2024-04-26 15:05:48 +00:00			`c.Set(ctxkey.Config, cfg)`
feat: built in retry supported (close #1036, close #770) 2024-02-25 11:01:49 +00:00			`}`