// ai-gateway/relay/controller/text.go

package controller
import (
	"bytes"
	"encoding/json"
	"fmt"
	"io"
	"net/http"
	"strings"

	"github.com/gin-gonic/gin"

	"github.com/songquanpeng/one-api/common/logger"
	"github.com/songquanpeng/one-api/relay"
	"github.com/songquanpeng/one-api/relay/adaptor/openai"
	"github.com/songquanpeng/one-api/relay/apitype"
	"github.com/songquanpeng/one-api/relay/billing"
	billingratio "github.com/songquanpeng/one-api/relay/billing/ratio"
	"github.com/songquanpeng/one-api/relay/channeltype"
	"github.com/songquanpeng/one-api/relay/meta"
	"github.com/songquanpeng/one-api/relay/model"
)
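
// RelayTextHelper relays a text-style request (chat/completion) through the
// channel adaptor selected by meta.APIType: it validates and maps the request,
// pre-consumes quota from the estimated prompt tokens, forwards the request
// upstream, and settles billing against the actual usage afterwards.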
func RelayTextHelper(c *gin.Context) *model.ErrorWithStatusCode {
	ctx := c.Request.Context()
	meta := meta.GetByContext(c)
	// get & validate textRequest
	textRequest, err := getAndValidateTextRequest(c, meta.Mode)
	if err != nil {
		logger.Errorf(ctx, "getAndValidateTextRequest failed: %s", err.Error())
		return openai.ErrorWrapper(err, "invalid_text_request", http.StatusBadRequest)
	}
	meta.IsStream = textRequest.Stream
	// map model name: OriginModelName keeps the name the client requested,
	// ActualModelName is the mapped name that is actually sent upstream
	var isModelMapped bool
	meta.OriginModelName = textRequest.Model
	textRequest.Model, isModelMapped = getMappedModelName(textRequest.Model, meta.ModelMapping)
	meta.ActualModelName = textRequest.Model
	// get model ratio & group ratio
	modelRatio := billingratio.GetModelRatio(textRequest.Model)
	groupRatio := billingratio.GetGroupRatio(meta.Group)
	ratio := modelRatio * groupRatio
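	// Quota is reserved up front based on the estimated prompt tokens; the
	// reservation is refunded via billing.ReturnPreConsumedQuota when the
	// upstream call fails further down.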
	// pre-consume quota
	promptTokens := getPromptTokens(textRequest, meta.Mode)
	meta.PromptTokens = promptTokens
	preConsumedQuota, bizErr := preConsumeQuota(ctx, textRequest, promptTokens, ratio, meta)
	if bizErr != nil {
		logger.Warnf(ctx, "preConsumeQuota failed: %+v", *bizErr)
		return bizErr
	}
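	// Each API type registers an adaptor that knows how to convert, send, and
	// parse requests for its upstream protocol.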
	adaptor := relay.GetAdaptor(meta.APIType)
	if adaptor == nil {
		return openai.ErrorWrapper(fmt.Errorf("invalid api type: %d", meta.APIType), "invalid_api_type", http.StatusBadRequest)
	}
	// get request body
	var requestBody io.Reader
	if meta.APIType == apitype.OpenAI {
		// no need to convert request for openai
		shouldResetRequestBody := isModelMapped || meta.ChannelType == channeltype.Baichuan // frequency_penalty 0 is not acceptable for baichuan
		if shouldResetRequestBody {
			jsonStr, err := json.Marshal(textRequest)
			if err != nil {
				return openai.ErrorWrapper(err, "json_marshal_failed", http.StatusInternalServerError)
			}
			requestBody = bytes.NewBuffer(jsonStr)
		} else {
			requestBody = c.Request.Body
		}
	} else {
		convertedRequest, err := adaptor.ConvertRequest(c, meta.Mode, textRequest)
		if err != nil {
			return openai.ErrorWrapper(err, "convert_request_failed", http.StatusInternalServerError)
		}
		jsonData, err := json.Marshal(convertedRequest)
		if err != nil {
			return openai.ErrorWrapper(err, "json_marshal_failed", http.StatusInternalServerError)
		}
		logger.Debugf(ctx, "converted request: \n%s", string(jsonData))
		requestBody = bytes.NewBuffer(jsonData)
	}
	// do request
	resp, err := adaptor.DoRequest(c, meta, requestBody)
	if err != nil {
		logger.Errorf(ctx, "DoRequest failed: %s", err.Error())
		return openai.ErrorWrapper(err, "do_request_failed", http.StatusInternalServerError)
	}
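	// A non-200 status, or a JSON body where an event stream was expected,
	// means the upstream answered with an error object: refund the reserved
	// quota and relay the error to the client.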
	if resp != nil {
		errorHappened := (resp.StatusCode != http.StatusOK) || (meta.IsStream && strings.HasPrefix(resp.Header.Get("Content-Type"), "application/json"))
		if errorHappened {
			billing.ReturnPreConsumedQuota(ctx, preConsumedQuota, meta.TokenId)
			return RelayErrorHandler(resp)
		}
	}
	// do response
	usage, respErr := adaptor.DoResponse(c, resp, meta)
	if respErr != nil {
		logger.Errorf(ctx, "respErr is not nil: %+v", respErr)
		billing.ReturnPreConsumedQuota(ctx, preConsumedQuota, meta.TokenId)
		return respErr
	}
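	// Settle billing in the background: postConsumeQuota reconciles the
	// pre-consumed quota against the actual usage reported by the adaptor.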
	// post-consume quota
	go postConsumeQuota(ctx, usage, meta, textRequest, ratio, preConsumedQuota, modelRatio, groupRatio)
	return nil
}