ai-gateway/providers/gemini/chat.go

package gemini

import (
	"bufio"
	"encoding/json"
	"fmt"
	"io"
	"net/http"
	"one-api/common"
	"one-api/common/image"
	"one-api/providers/base"
	"one-api/types"
	"strings"
)
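// GeminiVisionMaxImageNum caps the number of inline images forwarded to
// Gemini in a single request; image parts beyond the cap are dropped.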
const (
	GeminiVisionMaxImageNum = 16
)
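// ResponseHandler converts a non-streaming Gemini generateContent response
// into an OpenAI-style chat completion response and fills in token usage.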
func (response *GeminiChatResponse) ResponseHandler(resp *http.Response) (OpenAIResponse any, errWithCode *types.OpenAIErrorWithStatusCode) {
	if len(response.Candidates) == 0 {
		return nil, &types.OpenAIErrorWithStatusCode{
			OpenAIError: types.OpenAIError{
				Message: "No candidates returned",
				Type:    "server_error",
				Param:   "",
				Code:    500,
			},
			StatusCode: resp.StatusCode,
		}
	}

	fullTextResponse := &types.ChatCompletionResponse{
		ID:      fmt.Sprintf("chatcmpl-%s", common.GetUUID()),
		Object:  "chat.completion",
		Created: common.GetTimestamp(),
		Model:   response.Model,
		Choices: make([]types.ChatCompletionChoice, 0, len(response.Candidates)),
	}
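	// Map each Gemini candidate to an OpenAI choice. Only the first text part
	// of each candidate is forwarded.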
	for i, candidate := range response.Candidates {
		choice := types.ChatCompletionChoice{
			Index: i,
			Message: types.ChatCompletionMessage{
				Role:    "assistant",
				Content: "",
			},
			FinishReason: base.StopFinishReason,
		}
		if len(candidate.Content.Parts) > 0 {
			choice.Message.Content = candidate.Content.Parts[0].Text
		}
		fullTextResponse.Choices = append(fullTextResponse.Choices, choice)
	}
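	// Completion usage is computed locally by tokenizing the response text
	// rather than read from the Gemini response.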
	completionTokens := common.CountTokenText(response.GetResponseText(), response.Model)
	response.Usage.CompletionTokens = completionTokens
	response.Usage.TotalTokens = response.Usage.PromptTokens + completionTokens

	return fullTextResponse, nil
}
// getChatRequestBody converts an OpenAI-style chat request into a Gemini
// generateContent request. The relaxed safety thresholds below are currently
// disabled (commented out), so Gemini's default safety settings apply.
func (p *GeminiProvider) getChatRequestBody(request *types.ChatCompletionRequest) (requestBody *GeminiChatRequest) {
	geminiRequest := GeminiChatRequest{
		Contents: make([]GeminiChatContent, 0, len(request.Messages)),
		//SafetySettings: []GeminiChatSafetySettings{
		//	{
		//		Category:  "HARM_CATEGORY_HARASSMENT",
		//		Threshold: "BLOCK_ONLY_HIGH",
		//	},
		//	{
		//		Category:  "HARM_CATEGORY_HATE_SPEECH",
		//		Threshold: "BLOCK_ONLY_HIGH",
		//	},
		//	{
		//		Category:  "HARM_CATEGORY_SEXUALLY_EXPLICIT",
		//		Threshold: "BLOCK_ONLY_HIGH",
		//	},
		//	{
		//		Category:  "HARM_CATEGORY_DANGEROUS_CONTENT",
		//		Threshold: "BLOCK_ONLY_HIGH",
		//	},
		//},
		GenerationConfig: GeminiChatGenerationConfig{
			Temperature:     request.Temperature,
			TopP:            request.TopP,
			MaxOutputTokens: request.MaxTokens,
		},
	}
	if request.Functions != nil {
		geminiRequest.Tools = []GeminiChatTools{
			{
				FunctionDeclarations: request.Functions,
			},
		}
	}
	shouldAddDummyModelMessage := false
	for _, message := range request.Messages {
		content := GeminiChatContent{
			Role: message.Role,
			Parts: []GeminiPart{
				{
					Text: message.StringContent(),
				},
			},
		}
		openaiContent := message.ParseContent()
		var parts []GeminiPart
		imageNum := 0
		for _, part := range openaiContent {
			if part.Type == types.ContentTypeText {
				parts = append(parts, GeminiPart{
					Text: part.Text,
				})
			} else if part.Type == types.ContentTypeImageURL {
				imageNum += 1
				if imageNum > GeminiVisionMaxImageNum {
					continue
				}
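				// NOTE: fetch errors are deliberately ignored here; a failed
				// download yields an empty inline part rather than aborting
				// the whole request.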
				mimeType, data, _ := image.GetImageFromUrl(part.ImageURL.URL)
				parts = append(parts, GeminiPart{
					InlineData: &GeminiInlineData{
						MimeType: mimeType,
						Data:     data,
					},
				})
			}
		}
		content.Parts = parts
		// Gemini has no "assistant" role, and the API rejects any role other
		// than "user" or "model".
		if content.Role == "assistant" {
			content.Role = "model"
		}
		// Gemini has no "system" role either; convert system prompts into
		// user messages.
		if content.Role == "system" {
			content.Role = "user"
			shouldAddDummyModelMessage = true
		}
		geminiRequest.Contents = append(geminiRequest.Contents, content)
		// Insert a placeholder model reply after each converted system
		// message so that user/model turns keep alternating, as Gemini
		// requires.
		if shouldAddDummyModelMessage {
			geminiRequest.Contents = append(geminiRequest.Contents, GeminiChatContent{
				Role: "model",
				Parts: []GeminiPart{
					{
						Text: "Okay",
					},
				},
			})
			shouldAddDummyModelMessage = false
		}
	}

	return &geminiRequest
}
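// ChatAction sends the converted request to Gemini and relays the reply,
// handling both the streaming and non-streaming paths and computing usage.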
func (p *GeminiProvider) ChatAction(request *types.ChatCompletionRequest, isModelMapped bool, promptTokens int) (usage *types.Usage, errWithCode *types.OpenAIErrorWithStatusCode) {
	requestBody := p.getChatRequestBody(request)
	fullRequestURL := p.GetFullRequestURL("generateContent", request.Model)
	headers := p.GetRequestHeaders()
	if request.Stream {
		headers["Accept"] = "text/event-stream"
	}

	client := common.NewClient()
	req, err := client.NewRequest(p.Context.Request.Method, fullRequestURL, common.WithBody(requestBody), common.WithHeader(headers))
	if err != nil {
		return nil, common.ErrorWrapper(err, "new_request_failed", http.StatusInternalServerError)
	}

	if request.Stream {
		var responseText string
		errWithCode, responseText = p.sendStreamRequest(req, request.Model)
		if errWithCode != nil {
			return
		}
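		// Streaming responses carry no usage data, so completion tokens are
		// estimated from the accumulated response text.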
		usage = &types.Usage{
			PromptTokens:     promptTokens,
			CompletionTokens: common.CountTokenText(responseText, request.Model),
		}
		usage.TotalTokens = promptTokens + usage.CompletionTokens
	} else {
		var geminiResponse = &GeminiChatResponse{
			Model: request.Model,
			Usage: &types.Usage{
				PromptTokens: promptTokens,
			},
		}
		errWithCode = p.SendRequest(req, geminiResponse, false)
		if errWithCode != nil {
			return
		}
		usage = geminiResponse.Usage
	}

	return
}
// func (p *GeminiProvider) streamResponseClaude2OpenAI(geminiResponse *GeminiChatResponse) *types.ChatCompletionStreamResponse {
// var choice types.ChatCompletionStreamChoice
// choice.Delta.Content = geminiResponse.GetResponseText()
// choice.FinishReason = &base.StopFinishReason
// var response types.ChatCompletionStreamResponse
// response.Object = "chat.completion.chunk"
// response.Model = "gemini"
// response.Choices = []types.ChatCompletionStreamChoice{choice}
// return &response
// }
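// sendStreamRequest forwards the Gemini stream to the client as OpenAI-style
// SSE chunks and returns the accumulated completion text for token counting.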
func (p *GeminiProvider) sendStreamRequest(req *http.Request, model string) (*types.OpenAIErrorWithStatusCode, string) {
	defer req.Body.Close()
	// Send the request. The pooled client is returned right after the round
	// trip so it is not leaked on the error path.
	client := common.GetHttpClient(p.Channel.Proxy)
	resp, err := client.Do(req)
	common.PutHttpClient(client)
	if err != nil {
		return common.ErrorWrapper(err, "http_request_failed", http.StatusInternalServerError), ""
	}
	if common.IsFailureStatusCode(resp) {
		return common.HandleErrorResp(resp), ""
	}
	defer resp.Body.Close()
	responseText := ""
	dataChan := make(chan string)
	stopChan := make(chan bool)
	scanner := bufio.NewScanner(resp.Body)
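	// Split the body on single newlines: Gemini streams a pretty-printed JSON
	// array, so each field of interest arrives on its own line.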
	scanner.Split(func(data []byte, atEOF bool) (advance int, token []byte, err error) {
		if atEOF && len(data) == 0 {
			return 0, nil, nil
		}
		if i := strings.Index(string(data), "\n"); i >= 0 {
			return i + 1, data[0:i], nil
		}
		if atEOF {
			return len(data), data, nil
		}
		return 0, nil, nil
	})
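	// Pick out only the `"text": "..."` lines; lines that carry candidate
	// metadata rather than a "text" field are skipped.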
	go func() {
		for scanner.Scan() {
			data := scanner.Text()
			data = strings.TrimSpace(data)
			if !strings.HasPrefix(data, "\"text\": \"") {
				continue
			}
			data = strings.TrimPrefix(data, "\"text\": \"")
			data = strings.TrimSuffix(data, "\"")
			dataChan <- data
		}
		stopChan <- true
	}()
	common.SetEventStreamHeaders(p.Context)
	p.Context.Stream(func(w io.Writer) bool {
		select {
		case data := <-dataChan:
			// Re-wrap the raw fragment in a JSON object and decode it so that
			// escape sequences (\n, \", \\) in the streamed text are
			// unescaped properly.
			data = fmt.Sprintf("{\"content\": \"%s\"}", data)
			type dummyStruct struct {
				Content string `json:"content"`
			}
			var dummy dummyStruct
			json.Unmarshal([]byte(data), &dummy)
			responseText += dummy.Content
			var choice types.ChatCompletionStreamChoice
			choice.Delta.Content = dummy.Content
			response := types.ChatCompletionStreamResponse{
				ID:      fmt.Sprintf("chatcmpl-%s", common.GetUUID()),
				Object:  "chat.completion.chunk",
				Created: common.GetTimestamp(),
				Model:   model,
				Choices: []types.ChatCompletionStreamChoice{choice},
			}
			jsonResponse, err := json.Marshal(response)
			if err != nil {
				common.SysError("error marshalling stream response: " + err.Error())
				return true
			}
			p.Context.Render(-1, common.CustomEvent{Data: "data: " + string(jsonResponse)})
			return true
		case <-stopChan:
			p.Context.Render(-1, common.CustomEvent{Data: "data: [DONE]"})
			return false
		}
	})

	return nil, responseText
}