Merge branch 'songquanpeng:main' into main

Commit fa5774c7cb by qingfengfenga, 2024-02-26 21:15:04 +08:00 (committed by GitHub)
17 changed files with 137 additions and 65 deletions

View File

@@ -23,7 +23,7 @@ jobs:
       - uses: actions/setup-node@v3
         with:
           node-version: 16
-      - name: Build Frontend (theme default)
+      - name: Build Frontend
         env:
           CI: ""
         run: |

View File

@@ -23,7 +23,7 @@ jobs:
      - uses: actions/setup-node@v3
        with:
          node-version: 16
-      - name: Build Frontend (theme default)
+      - name: Build Frontend
        env:
          CI: ""
        run: |

View File

@@ -26,7 +26,7 @@ jobs:
      - uses: actions/setup-node@v3
        with:
          node-version: 16
-      - name: Build Frontend (theme default)
+      - name: Build Frontend
        env:
          CI: ""
        run: |

View File

@@ -23,7 +23,7 @@ ADD go.mod go.sum ./
 RUN go mod download
 COPY . .
 COPY --from=builder /web/build ./web/build
-RUN go build -ldflags "-s -w -X 'one-api/common.Version=$(cat VERSION)' -extldflags '-static'" -o one-api
+RUN go build -ldflags "-s -w -X 'github.com/songquanpeng/one-api/common.Version=$(cat VERSION)' -extldflags '-static'" -o one-api
 
 FROM alpine
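
Why this RUN line had to change: the -X linker flag sets a package-level string variable by its full import path, so once the module was renamed to github.com/songquanpeng/one-api the old one-api/common.Version target no longer exists. A minimal sketch of the mechanism, not the project's actual declaration (the variable in common is assumed, only its name comes from the Dockerfile above):

// Sketch only: demonstrates how a -ldflags "-X" override works in general.
package main

import "fmt"

// Version keeps this default unless the linker overrides it, e.g.:
//   go build -ldflags "-X 'main.Version=$(cat VERSION)'" .
// In one-api the target must be spelled with the full module path,
// hence github.com/songquanpeng/one-api/common.Version in the new RUN line;
// a mismatched path is silently ignored and the default stays in place.
var Version = "dev"

func main() {
	fmt.Println("version:", Version)
}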

View File

@@ -137,6 +137,7 @@ func GetUUID() string {
 }
 
 const keyChars = "0123456789abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ"
+const keyNumbers = "0123456789"
 
 func init() {
 	rand.Seed(time.Now().UnixNano())
@@ -168,6 +169,15 @@ func GetRandomString(length int) string {
 	return string(key)
 }
 
+func GetRandomNumberString(length int) string {
+	rand.Seed(time.Now().UnixNano())
+	key := make([]byte, length)
+	for i := 0; i < length; i++ {
+		key[i] = keyNumbers[rand.Intn(len(keyNumbers))]
+	}
+	return string(key)
+}
+
 func GetTimestamp() int64 {
 	return time.Now().Unix()
 }
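
A rough usage sketch of the new helper, tying it to the request-id middleware change later in this commit; the helper names and import path come from the diff, the main wrapper is only illustrative:

package main

import (
	"fmt"

	"github.com/songquanpeng/one-api/common/helper"
)

func main() {
	// GetRandomNumberString draws only from keyNumbers, so the suffix is all digits,
	// e.g. "04731985" (value varies per run).
	suffix := helper.GetRandomNumberString(8)

	// The request-id middleware further down now builds its id this way,
	// replacing the previous alphanumeric GetRandomString(8) suffix.
	id := helper.GetTimeString() + suffix
	fmt.Println(id)
}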

View File

@@ -1,23 +1,24 @@
 package controller
 
 import (
+	"context"
 	"fmt"
 	"github.com/gin-gonic/gin"
 	"github.com/songquanpeng/one-api/common/config"
 	"github.com/songquanpeng/one-api/common/helper"
 	"github.com/songquanpeng/one-api/common/logger"
+	"github.com/songquanpeng/one-api/middleware"
+	dbmodel "github.com/songquanpeng/one-api/model"
 	"github.com/songquanpeng/one-api/relay/constant"
 	"github.com/songquanpeng/one-api/relay/controller"
 	"github.com/songquanpeng/one-api/relay/model"
 	"github.com/songquanpeng/one-api/relay/util"
 	"net/http"
-	"strconv"
 )
 
 // https://platform.openai.com/docs/api-reference/chat
-func Relay(c *gin.Context) {
-	relayMode := constant.Path2RelayMode(c.Request.URL.Path)
+func relay(c *gin.Context, relayMode int) *model.ErrorWithStatusCode {
 	var err *model.ErrorWithStatusCode
 	switch relayMode {
 	case constant.RelayModeImagesGenerations:
@@ -31,34 +32,82 @@ func Relay(c *gin.Context) {
 	default:
 		err = controller.RelayTextHelper(c)
 	}
-	if err != nil {
-		requestId := c.GetString(logger.RequestIdKey)
-		retryTimesStr := c.Query("retry")
-		retryTimes, _ := strconv.Atoi(retryTimesStr)
-		if retryTimesStr == "" {
-			retryTimes = config.RetryTimes
-		}
-		if retryTimes > 0 {
-			c.Redirect(http.StatusTemporaryRedirect, fmt.Sprintf("%s?retry=%d", c.Request.URL.Path, retryTimes-1))
-		} else {
-			if err.StatusCode == http.StatusTooManyRequests {
-				err.Error.Message = "当前分组上游负载已饱和,请稍后再试"
-			}
-			err.Error.Message = helper.MessageWithRequestId(err.Error.Message, requestId)
-			c.JSON(err.StatusCode, gin.H{
-				"error": err.Error,
-			})
-		}
-		channelId := c.GetInt("channel_id")
-		logger.Error(c.Request.Context(), fmt.Sprintf("relay error (channel #%d): %s", channelId, err.Message))
-		// https://platform.openai.com/docs/guides/error-codes/api-errors
-		if util.ShouldDisableChannel(&err.Error, err.StatusCode) {
-			channelId := c.GetInt("channel_id")
-			channelName := c.GetString("channel_name")
-			disableChannel(channelId, channelName, err.Message)
-		}
-	}
-}
+	return err
+}
+
+func Relay(c *gin.Context) {
+	ctx := c.Request.Context()
+	relayMode := constant.Path2RelayMode(c.Request.URL.Path)
+	bizErr := relay(c, relayMode)
+	if bizErr == nil {
+		return
+	}
+	channelId := c.GetInt("channel_id")
+	lastFailedChannelId := channelId
+	channelName := c.GetString("channel_name")
+	group := c.GetString("group")
+	originalModel := c.GetString("original_model")
+	go processChannelRelayError(ctx, channelId, channelName, bizErr)
+	requestId := c.GetString(logger.RequestIdKey)
+	retryTimes := config.RetryTimes
+	if !shouldRetry(bizErr.StatusCode) {
+		logger.Errorf(ctx, "relay error happen, but status code is %d, won't retry in this case", bizErr.StatusCode)
+		retryTimes = 0
+	}
+	for i := retryTimes; i > 0; i-- {
+		channel, err := dbmodel.CacheGetRandomSatisfiedChannel(group, originalModel)
+		if err != nil {
+			logger.Errorf(ctx, "CacheGetRandomSatisfiedChannel failed: %w", err)
+			break
+		}
+		logger.Infof(ctx, "using channel #%d to retry (remain times %d)", channel.Id, i)
+		if channel.Id == lastFailedChannelId {
+			continue
+		}
+		middleware.SetupContextForSelectedChannel(c, channel, originalModel)
+		bizErr = relay(c, relayMode)
+		if bizErr == nil {
+			return
+		}
+		channelId := c.GetInt("channel_id")
+		lastFailedChannelId = channelId
+		channelName := c.GetString("channel_name")
+		go processChannelRelayError(ctx, channelId, channelName, bizErr)
+	}
+	if bizErr != nil {
+		if bizErr.StatusCode == http.StatusTooManyRequests {
+			bizErr.Error.Message = "当前分组上游负载已饱和,请稍后再试"
+		}
+		bizErr.Error.Message = helper.MessageWithRequestId(bizErr.Error.Message, requestId)
+		c.JSON(bizErr.StatusCode, gin.H{
+			"error": bizErr.Error,
+		})
+	}
+}
+
+func shouldRetry(statusCode int) bool {
+	if statusCode == http.StatusTooManyRequests {
+		return true
+	}
+	if statusCode/100 == 5 {
+		return true
+	}
+	if statusCode == http.StatusBadRequest {
+		return false
+	}
+	if statusCode/100 == 2 {
+		return false
+	}
+	return true
+}
+
+func processChannelRelayError(ctx context.Context, channelId int, channelName string, err *model.ErrorWithStatusCode) {
+	logger.Errorf(ctx, "relay error (channel #%d): %s", channelId, err.Message)
+	// https://platform.openai.com/docs/guides/error-codes/api-errors
+	if util.ShouldDisableChannel(&err.Error, err.StatusCode) {
+		disableChannel(channelId, channelName, err.Message)
+	}
+}
 
 func RelayNotImplemented(c *gin.Context) {
 	err := model.Error{
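
To make the retry policy above concrete, a small standalone check of shouldRetry; the function body is copied from the hunk, while the main wrapper is only an illustration:

package main

import (
	"fmt"
	"net/http"
)

// shouldRetry as introduced in this commit: retry on 429 and 5xx,
// never on 400 or 2xx, and retry anything else by default.
func shouldRetry(statusCode int) bool {
	if statusCode == http.StatusTooManyRequests {
		return true
	}
	if statusCode/100 == 5 {
		return true
	}
	if statusCode == http.StatusBadRequest {
		return false
	}
	if statusCode/100 == 2 {
		return false
	}
	return true
}

func main() {
	for _, code := range []int{http.StatusOK, http.StatusBadRequest, http.StatusUnauthorized,
		http.StatusTooManyRequests, http.StatusBadGateway} {
		// Prints: 200 -> false, 400 -> false, 401 -> true, 429 -> true, 502 -> true
		fmt.Printf("%d -> retry=%v\n", code, shouldRetry(code))
	}
}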

View File

@@ -456,6 +456,7 @@
   "已绑定的邮箱账户": "Email Account Bound",
   "用户信息更新成功!": "User information updated successfully!",
   "模型倍率 %.2f,分组倍率 %.2f": "model rate %.2f, group rate %.2f",
+  "模型倍率 %.2f,分组倍率 %.2f,补全倍率 %.2f": "model rate %.2f, group rate %.2f, completion rate %.2f",
   "使用明细(总消耗额度:{renderQuota(stat.quota)}": "Usage Details (Total Consumption Quota: {renderQuota(stat.quota)})",
   "用户名称": "User Name",
   "令牌名称": "Token Name",

View File

@@ -108,7 +108,7 @@ func TokenAuth() func(c *gin.Context) {
 		c.Set("token_name", token.Name)
 		if len(parts) > 1 {
 			if model.IsAdmin(token.UserId) {
-				c.Set("channelId", parts[1])
+				c.Set("specific_channel_id", parts[1])
 			} else {
 				abortWithMessage(c, http.StatusForbidden, "普通用户不支持指定渠道")
 				return

View File

@@ -21,8 +21,9 @@ func Distribute() func(c *gin.Context) {
 		userId := c.GetInt("id")
 		userGroup, _ := model.CacheGetUserGroup(userId)
 		c.Set("group", userGroup)
+		var requestModel string
 		var channel *model.Channel
-		channelId, ok := c.Get("channelId")
+		channelId, ok := c.Get("specific_channel_id")
 		if ok {
 			id, err := strconv.Atoi(channelId.(string))
 			if err != nil {
@@ -66,6 +67,7 @@ func Distribute() func(c *gin.Context) {
 					modelRequest.Model = "whisper-1"
 				}
 			}
+			requestModel = modelRequest.Model
 			channel, err = model.CacheGetRandomSatisfiedChannel(userGroup, modelRequest.Model)
 			if err != nil {
 				message := fmt.Sprintf("当前分组 %s 下对于模型 %s 无可用渠道", userGroup, modelRequest.Model)
@@ -77,10 +79,17 @@ func Distribute() func(c *gin.Context) {
 				return
 			}
 		}
+		SetupContextForSelectedChannel(c, channel, requestModel)
+		c.Next()
+	}
+}
+
+func SetupContextForSelectedChannel(c *gin.Context, channel *model.Channel, modelName string) {
 	c.Set("channel", channel.Type)
 	c.Set("channel_id", channel.Id)
 	c.Set("channel_name", channel.Name)
 	c.Set("model_mapping", channel.GetModelMapping())
+	c.Set("original_model", modelName) // for retry
 	c.Request.Header.Set("Authorization", fmt.Sprintf("Bearer %s", channel.Key))
 	c.Set("base_url", channel.GetBaseURL())
 	// this is for backward compatibility
@@ -100,6 +109,4 @@ func Distribute() func(c *gin.Context) {
 	for k, v := range cfg {
 		c.Set(common.ConfigKeyPrefix+k, v)
 	}
-		c.Next()
-	}
 }

View File

@@ -9,7 +9,7 @@ import (
 
 func RequestId() func(c *gin.Context) {
 	return func(c *gin.Context) {
-		id := helper.GetTimeString() + helper.GetRandomString(8)
+		id := helper.GetTimeString() + helper.GetRandomNumberString(8)
 		c.Set(logger.RequestIdKey, id)
 		ctx := context.WithValue(c.Request.Context(), logger.RequestIdKey, id)
 		c.Request = c.Request.WithContext(ctx)

View File

@@ -94,7 +94,7 @@ func CacheUpdateUserQuota(id int) error {
 	if !common.RedisEnabled {
 		return nil
 	}
-	quota, err := GetUserQuota(id)
+	quota, err := CacheGetUserQuota(id)
 	if err != nil {
 		return err
 	}

View File

@@ -53,7 +53,7 @@ func responseAIProxyLibrary2OpenAI(response *LibraryResponse) *openai.TextRespon
 		FinishReason: "stop",
 	}
 	fullTextResponse := openai.TextResponse{
-		Id:      helper.GetUUID(),
+		Id:      fmt.Sprintf("chatcmpl-%s", helper.GetUUID()),
 		Object:  "chat.completion",
 		Created: helper.GetTimestamp(),
 		Choices: []openai.TextResponseChoice{choice},
@@ -66,7 +66,7 @@ func documentsAIProxyLibrary(documents []LibraryDocument) *openai.ChatCompletion
 	choice.Delta.Content = aiProxyDocuments2Markdown(documents)
 	choice.FinishReason = &constant.StopFinishReason
 	return &openai.ChatCompletionsStreamResponse{
-		Id:      helper.GetUUID(),
+		Id:      fmt.Sprintf("chatcmpl-%s", helper.GetUUID()),
 		Object:  "chat.completion.chunk",
 		Created: helper.GetTimestamp(),
 		Model:   "",
@@ -78,7 +78,7 @@ func streamResponseAIProxyLibrary2OpenAI(response *LibraryStreamResponse) *opena
 	var choice openai.ChatCompletionsStreamResponseChoice
 	choice.Delta.Content = response.Content
 	return &openai.ChatCompletionsStreamResponse{
-		Id:      helper.GetUUID(),
+		Id:      fmt.Sprintf("chatcmpl-%s", helper.GetUUID()),
 		Object:  "chat.completion.chunk",
 		Created: helper.GetTimestamp(),
 		Model:   response.Model,

View File

@@ -118,8 +118,10 @@ type ImageResponse struct {
 }
 
 type ChatCompletionsStreamResponseChoice struct {
+	Index int `json:"index"`
 	Delta struct {
 		Content string `json:"content"`
+		Role    string `json:"role,omitempty"`
 	} `json:"delta"`
 	FinishReason *string `json:"finish_reason,omitempty"`
 }
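
For reference, the wire shape a stream choice takes after this change; the struct is copied from the hunk above, while the package wrapper and sample values are only illustrative:

package main

import (
	"encoding/json"
	"fmt"
)

type ChatCompletionsStreamResponseChoice struct {
	Index int `json:"index"`
	Delta struct {
		Content string `json:"content"`
		Role    string `json:"role,omitempty"`
	} `json:"delta"`
	FinishReason *string `json:"finish_reason,omitempty"`
}

func main() {
	var choice ChatCompletionsStreamResponseChoice
	choice.Index = 0
	choice.Delta.Role = "assistant"
	choice.Delta.Content = "Hello"
	b, _ := json.Marshal(choice)
	// Prints: {"index":0,"delta":{"content":"Hello","role":"assistant"}}
	// (finish_reason is omitted while nil; role is omitted when empty).
	fmt.Println(string(b))
}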

View File

@@ -70,6 +70,7 @@ func responseXunfei2OpenAI(response *ChatResponse) *openai.TextResponse {
 		FinishReason: constant.StopFinishReason,
 	}
 	fullTextResponse := openai.TextResponse{
+		Id:      fmt.Sprintf("chatcmpl-%s", helper.GetUUID()),
 		Object:  "chat.completion",
 		Created: helper.GetTimestamp(),
 		Choices: []openai.TextResponseChoice{choice},
@@ -92,6 +93,7 @@ func streamResponseXunfei2OpenAI(xunfeiResponse *ChatResponse) *openai.ChatCompl
 		choice.FinishReason = &constant.StopFinishReason
 	}
 	response := openai.ChatCompletionsStreamResponse{
+		Id:      fmt.Sprintf("chatcmpl-%s", helper.GetUUID()),
 		Object:  "chat.completion.chunk",
 		Created: helper.GetTimestamp(),
 		Model:   "SparkDesk",

View File

@@ -39,6 +39,7 @@ func RelayTextHelper(c *gin.Context) *model.ErrorWithStatusCode {
 	ratio := modelRatio * groupRatio
 	// pre-consume quota
 	promptTokens := getPromptTokens(textRequest, meta.Mode)
+	meta.PromptTokens = promptTokens
 	preConsumedQuota, bizErr := preConsumeQuota(ctx, textRequest, promptTokens, ratio, meta)
 	if bizErr != nil {
 		logger.Warnf(ctx, "preConsumeQuota failed: %+v", *bizErr)

View File

@ -1,13 +1,13 @@
#!/bin/sh #!/bin/sh
version=$(cat VERSION) version=$(cat VERSION)
themes=$(cat THEMES) pwd
IFS=$'\n'
for theme in $themes; do while IFS= read -r theme; do
echo "Building theme: $theme" echo "Building theme: $theme"
cd $theme rm -r build/$theme
cd "$theme"
npm install npm install
DISABLE_ESLINT_PLUGIN='true' REACT_APP_VERSION=$version npm run build DISABLE_ESLINT_PLUGIN='true' REACT_APP_VERSION=$version npm run build
cd .. cd ..
done done < THEMES