ai-gateway/controller/relay-palm.go

package controller

import (
	"encoding/json"
	"fmt"
	"github.com/gin-gonic/gin"
	"io"
	"net/http"
	"one-api/common"
)

// https://developers.generativeai.google/api/rest/generativelanguage/models/generateMessage#request-body
// https://developers.generativeai.google/api/rest/generativelanguage/models/generateMessage#response-body

// PaLMChatMessage is a single chat turn in the PaLM wire format. It is used
// both for the prompt messages sent upstream and for the candidates returned
// in a response.
type PaLMChatMessage struct {
	// Author identifies the speaker. requestOpenAI2PaLM writes "0" for OpenAI
	// messages with role "user" and "1" for every other role.
	Author  string `json:"author"`
	// Content is the text of the message.
	Content string `json:"content"`
}

// PaLMFilter is one entry of the "filters" array in a PaLM chat response.
// NOTE(review): presumably describes why content was filtered upstream —
// confirm against the generateMessage response-body reference.
type PaLMFilter struct {
	Reason  string `json:"reason"`
	Message string `json:"message"`
}

// PaLMPrompt is the "prompt" object of a PaLM chat request. It carries the
// conversation as a list of messages.
type PaLMPrompt struct {
	Messages []PaLMChatMessage `json:"messages"`
}

// PaLMChatRequest is the JSON request body built by requestOpenAI2PaLM.
// Every field except Prompt is tagged omitempty, so a zero value is left out
// of the encoded request.
type PaLMChatRequest struct {
	Prompt         PaLMPrompt `json:"prompt"`
	Temperature    float64    `json:"temperature,omitempty"`
	CandidateCount int        `json:"candidateCount,omitempty"`
	TopP           float64    `json:"topP,omitempty"`
	TopK           int        `json:"topK,omitempty"`
}

// PaLMError is the "error" object of a PaLM response. palmHandler treats a
// non-zero Code as a failed request and copies Message, Status and Code into
// the OpenAI-style error it returns.
type PaLMError struct {
	Code    int    `json:"code"`
	Message string `json:"message"`
	Status  string `json:"status"`
}

// PaLMChatResponse is the JSON response body decoded by palmHandler and
// palmStreamHandler.
type PaLMChatResponse struct {
	// Candidates holds the generated replies; the handlers in this file read
	// the first one for token counting and streaming.
	Candidates []PaLMChatMessage `json:"candidates"`
	// Messages is decoded but not read anywhere in this file.
	Messages   []Message         `json:"messages"`
	// Filters is decoded from the "filters" array of the response.
	Filters    []PaLMFilter      `json:"filters"`
	// Error is the zero value (Code == 0) when the response has no error object.
	Error      PaLMError         `json:"error"`
}

// requestOpenAI2PaLM converts an OpenAI-style chat request into a PaLM chat
// request.
//
// Temperature, N and TopP are copied to temperature, candidateCount and topP.
// Each message keeps its content; the author is "0" for role "user" and "1"
// for every other role.
//
// TopK is deliberately left unset. PaLM's topK is a sampling parameter (how
// many tokens are considered when sampling), not an output-length limit, so
// copying the OpenAI max_tokens value into it would silently change sampling
// behaviour. With TopK at zero the field is omitted from the encoded request.
func requestOpenAI2PaLM(textRequest GeneralOpenAIRequest) *PaLMChatRequest {
	palmRequest := PaLMChatRequest{
		Prompt: PaLMPrompt{
			Messages: make([]PaLMChatMessage, 0, len(textRequest.Messages)),
		},
		Temperature:    textRequest.Temperature,
		CandidateCount: textRequest.N,
		TopP:           textRequest.TopP,
	}
	for _, message := range textRequest.Messages {
		palmMessage := PaLMChatMessage{
			Content: message.Content,
		}
		if message.Role == "user" {
			palmMessage.Author = "0"
		} else {
			palmMessage.Author = "1"
		}
		palmRequest.Prompt.Messages = append(palmRequest.Prompt.Messages, palmMessage)
	}
	return &palmRequest
}

// responsePaLM2OpenAI maps a PaLM chat response onto an OpenAI text response.
// Every candidate becomes one choice, in order, with role "assistant" and
// finish reason "stop". Usage is not filled in here.
func responsePaLM2OpenAI(response *PaLMChatResponse) *OpenAITextResponse {
	choices := make([]OpenAITextResponseChoice, len(response.Candidates))
	for idx := range response.Candidates {
		choices[idx] = OpenAITextResponseChoice{
			Index: idx,
			Message: Message{
				Role:    "assistant",
				Content: response.Candidates[idx].Content,
			},
			FinishReason: "stop",
		}
	}
	return &OpenAITextResponse{Choices: choices}
}

// streamResponsePaLM2OpenAI wraps a PaLM chat response in a single OpenAI
// "chat.completion.chunk". The chunk has exactly one choice whose delta holds
// the first candidate's content (empty when there are no candidates) and whose
// finish reason points at the shared stop reason. Id and Created are left for
// the caller to set.
func streamResponsePaLM2OpenAI(palmResponse *PaLMChatResponse) *ChatCompletionsStreamResponse {
	chunk := ChatCompletionsStreamResponseChoice{FinishReason: &stopFinishReason}
	if candidates := palmResponse.Candidates; len(candidates) != 0 {
		chunk.Delta.Content = candidates[0].Content
	}
	return &ChatCompletionsStreamResponse{
		Object:  "chat.completion.chunk",
		Model:   "palm2",
		Choices: []ChatCompletionsStreamResponseChoice{chunk},
	}
}

// palmStreamHandler relays a PaLM chat response to the client as an
// OpenAI-style event stream.
//
// The upstream body is read in full, converted into one
// "chat.completion.chunk" event, and followed by a terminating "[DONE]" event.
// If reading, closing, decoding or encoding fails, the problem is logged and
// only "[DONE]" is sent.
//
// It returns the text of the first candidate (empty when no chunk was
// delivered) so the caller can account for it, and a
// "close_response_body_failed" error when closing the upstream body failed.
//
// The chunk is prepared synchronously rather than in a producer goroutine.
// The upstream body is consumed with io.ReadAll anyway, so a goroutine adds no
// concurrency; it could block forever on an unbuffered channel send if
// c.Stream returned early, and it wrote responseText while this function could
// be reading it.
func palmStreamHandler(c *gin.Context, resp *http.Response) (*OpenAIErrorWithStatusCode, string) {
	responseId := fmt.Sprintf("chatcmpl-%s", common.GetUUID())
	createdTime := common.GetTimestamp()

	responseBody, readErr := io.ReadAll(resp.Body)
	// Close exactly once, whether or not the read succeeded.
	closeErr := resp.Body.Close()

	responseText := ""
	chunk := ""
	hasChunk := false
	switch {
	case readErr != nil:
		common.SysError("error reading stream response: " + readErr.Error())
	case closeErr != nil:
		common.SysError("error closing stream response: " + closeErr.Error())
	default:
		var palmResponse PaLMChatResponse
		if err := json.Unmarshal(responseBody, &palmResponse); err != nil {
			common.SysError("error unmarshalling stream response: " + err.Error())
			break
		}
		fullTextResponse := streamResponsePaLM2OpenAI(&palmResponse)
		fullTextResponse.Id = responseId
		fullTextResponse.Created = createdTime
		jsonResponse, err := json.Marshal(fullTextResponse)
		if err != nil {
			common.SysError("error marshalling stream response: " + err.Error())
			break
		}
		// Only report text that is actually going to be delivered.
		if len(palmResponse.Candidates) > 0 {
			responseText = palmResponse.Candidates[0].Content
		}
		chunk = string(jsonResponse)
		hasChunk = true
	}

	setEventStreamHeaders(c)
	c.Stream(func(w io.Writer) bool {
		if hasChunk {
			// First step: emit the single data chunk and ask for one more step.
			hasChunk = false
			c.Render(-1, common.CustomEvent{Data: "data: " + chunk})
			return true
		}
		c.Render(-1, common.CustomEvent{Data: "data: [DONE]"})
		return false
	})
	if closeErr != nil {
		return errorWrapper(closeErr, "close_response_body_failed", http.StatusInternalServerError), ""
	}
	return nil, responseText
}

// palmHandler relays a non-streaming PaLM chat response to the client in
// OpenAI format.
//
// It reads and decodes the upstream body, converts it with
// responsePaLM2OpenAI, attaches token usage and writes the JSON to the client
// with the upstream status code. promptTokens is the already computed prompt
// size; completion tokens are counted from the first candidate using model.
//
// It returns the usage on success. It returns an error when the body cannot
// be read, closed, decoded or re-encoded, and when the upstream response
// carries an error object or contains no candidates.
func palmHandler(c *gin.Context, resp *http.Response, promptTokens int, model string) (*OpenAIErrorWithStatusCode, *Usage) {
	responseBody, err := io.ReadAll(resp.Body)
	// Close on every path so a failed read does not leak the upstream body.
	closeErr := resp.Body.Close()
	if err != nil {
		return errorWrapper(err, "read_response_body_failed", http.StatusInternalServerError), nil
	}
	if closeErr != nil {
		return errorWrapper(closeErr, "close_response_body_failed", http.StatusInternalServerError), nil
	}
	var palmResponse PaLMChatResponse
	err = json.Unmarshal(responseBody, &palmResponse)
	if err != nil {
		return errorWrapper(err, "unmarshal_response_body_failed", http.StatusInternalServerError), nil
	}
	if palmResponse.Error.Code != 0 || len(palmResponse.Candidates) == 0 {
		message := palmResponse.Error.Message
		if message == "" {
			// No error object but also no candidates: give the caller
			// something to act on instead of a blank error message.
			message = "no candidates returned"
			for _, filter := range palmResponse.Filters {
				message += "; filter " + filter.Reason + ": " + filter.Message
			}
		}
		return &OpenAIErrorWithStatusCode{
			OpenAIError: OpenAIError{
				Message: message,
				Type:    palmResponse.Error.Status,
				Param:   "",
				Code:    palmResponse.Error.Code,
			},
			StatusCode: resp.StatusCode,
		}, nil
	}
	fullTextResponse := responsePaLM2OpenAI(&palmResponse)
	completionTokens := countTokenText(palmResponse.Candidates[0].Content, model)
	usage := Usage{
		PromptTokens:     promptTokens,
		CompletionTokens: completionTokens,
		TotalTokens:      promptTokens + completionTokens,
	}
	fullTextResponse.Usage = usage
	jsonResponse, err := json.Marshal(fullTextResponse)
	if err != nil {
		return errorWrapper(err, "marshal_response_body_failed", http.StatusInternalServerError), nil
	}
	c.Writer.Header().Set("Content-Type", "application/json")
	c.Writer.WriteHeader(resp.StatusCode)
	// The status line is already sent, so a failed write can only be logged;
	// usage is still returned because the upstream call was completed.
	if _, err = c.Writer.Write(jsonResponse); err != nil {
		common.SysError("error writing PaLM response: " + err.Error())
	}
	return nil, &usage
}
feat: PaLM support is WIP (#105) 2023-05-21 06:26:59 +00:00			`package controller`

			`import (`
feat: support Google PaLM2 (close #105) 2023-07-22 16:32:47 +00:00			`"encoding/json"`
feat: PaLM support is WIP (#105) 2023-05-21 06:26:59 +00:00			`"fmt"`
			`"github.com/gin-gonic/gin"`
feat: support Google PaLM2 (close #105) 2023-07-22 16:32:47 +00:00			`"io"`
			`"net/http"`
			`"one-api/common"`
feat: PaLM support is WIP (#105) 2023-05-21 06:26:59 +00:00			`)`

feat: support Google PaLM2 (close #105) 2023-07-22 16:32:47 +00:00			`// https://developers.generativeai.google/api/rest/generativelanguage/models/generateMessage#request-body`
			`// https://developers.generativeai.google/api/rest/generativelanguage/models/generateMessage#response-body`

feat: PaLM support is WIP (#105) 2023-05-21 06:26:59 +00:00			`type PaLMChatMessage struct {`
			Author string `json:"author"`
			Content string `json:"content"`
			`}`

			`type PaLMFilter struct {`
			Reason string `json:"reason"`
			Message string `json:"message"`
			`}`

feat: support Google PaLM2 (close #105) 2023-07-22 16:32:47 +00:00			`type PaLMPrompt struct {`
			Messages []PaLMChatMessage `json:"messages"`
			`}`

feat: PaLM support is WIP (#105) 2023-05-21 06:26:59 +00:00			`type PaLMChatRequest struct {`
feat: support Google PaLM2 (close #105) 2023-07-22 16:32:47 +00:00			Prompt PaLMPrompt `json:"prompt"`
			Temperature float64 `json:"temperature,omitempty"`
			CandidateCount int `json:"candidateCount,omitempty"`
			TopP float64 `json:"topP,omitempty"`
			TopK int `json:"topK,omitempty"`
			`}`

			`type PaLMError struct {`
			Code int `json:"code"`
			Message string `json:"message"`
			Status string `json:"status"`
feat: PaLM support is WIP (#105) 2023-05-21 06:26:59 +00:00			`}`

			`type PaLMChatResponse struct {`
feat: support Google PaLM2 (close #105) 2023-07-22 16:32:47 +00:00			Candidates []PaLMChatMessage `json:"candidates"`
			Messages []Message `json:"messages"`
			Filters []PaLMFilter `json:"filters"`
			Error PaLMError `json:"error"`
feat: PaLM support is WIP (#105) 2023-05-21 06:26:59 +00:00			`}`

feat: support Google PaLM2 (close #105) 2023-07-22 16:32:47 +00:00			`func requestOpenAI2PaLM(textRequest GeneralOpenAIRequest) *PaLMChatRequest {`
			`palmRequest := PaLMChatRequest{`
			`Prompt: PaLMPrompt{`
			`Messages: make([]PaLMChatMessage, 0, len(textRequest.Messages)),`
			`},`
			`Temperature: textRequest.Temperature,`
			`CandidateCount: textRequest.N,`
			`TopP: textRequest.TopP,`
			`TopK: textRequest.MaxTokens,`
			`}`
			`for _, message := range textRequest.Messages {`
			`palmMessage := PaLMChatMessage{`
			`Content: message.Content,`
			`}`
feat: PaLM support is WIP (#105) 2023-05-21 06:26:59 +00:00			`if message.Role == "user" {`
feat: support Google PaLM2 (close #105) 2023-07-22 16:32:47 +00:00			`palmMessage.Author = "0"`
feat: PaLM support is WIP (#105) 2023-05-21 06:26:59 +00:00			`} else {`
feat: support Google PaLM2 (close #105) 2023-07-22 16:32:47 +00:00			`palmMessage.Author = "1"`
feat: PaLM support is WIP (#105) 2023-05-21 06:26:59 +00:00			`}`
feat: support Google PaLM2 (close #105) 2023-07-22 16:32:47 +00:00			`palmRequest.Prompt.Messages = append(palmRequest.Prompt.Messages, palmMessage)`
			`}`
			`return &palmRequest`
			`}`

			`func responsePaLM2OpenAI(response PaLMChatResponse) OpenAITextResponse {`
			`fullTextResponse := OpenAITextResponse{`
			`Choices: make([]OpenAITextResponseChoice, 0, len(response.Candidates)),`
			`}`
			`for i, candidate := range response.Candidates {`
			`choice := OpenAITextResponseChoice{`
			`Index: i,`
			`Message: Message{`
			`Role: "assistant",`
			`Content: candidate.Content,`
			`},`
			`FinishReason: "stop",`
			`}`
			`fullTextResponse.Choices = append(fullTextResponse.Choices, choice)`
			`}`
			`return &fullTextResponse`
			`}`

			`func streamResponsePaLM2OpenAI(palmResponse PaLMChatResponse) ChatCompletionsStreamResponse {`
			`var choice ChatCompletionsStreamResponseChoice`
			`if len(palmResponse.Candidates) > 0 {`
			`choice.Delta.Content = palmResponse.Candidates[0].Content`
			`}`
fix: fix finish_reason fileld not fully compatible with OpenAI (close #372, #373) * optimize:unify finish_reason field * refactor: use a global stop finish reason --------- Co-authored-by: JustSong <songquanpeng@foxmail.com> 2023-08-12 03:04:53 +00:00			`choice.FinishReason = &stopFinishReason`
feat: support Google PaLM2 (close #105) 2023-07-22 16:32:47 +00:00			`var response ChatCompletionsStreamResponse`
			`response.Object = "chat.completion.chunk"`
			`response.Model = "palm2"`
			`response.Choices = []ChatCompletionsStreamResponseChoice{choice}`
			`return &response`
			`}`

			`func palmStreamHandler(c gin.Context, resp http.Response) (*OpenAIErrorWithStatusCode, string) {`
			`responseText := ""`
			`responseId := fmt.Sprintf("chatcmpl-%s", common.GetUUID())`
			`createdTime := common.GetTimestamp()`
			`dataChan := make(chan string)`
			`stopChan := make(chan bool)`
			`go func() {`
			`responseBody, err := io.ReadAll(resp.Body)`
			`if err != nil {`
			`common.SysError("error reading stream response: " + err.Error())`
			`stopChan <- true`
			`return`
			`}`
			`err = resp.Body.Close()`
			`if err != nil {`
			`common.SysError("error closing stream response: " + err.Error())`
			`stopChan <- true`
			`return`
			`}`
			`var palmResponse PaLMChatResponse`
			`err = json.Unmarshal(responseBody, &palmResponse)`
			`if err != nil {`
			`common.SysError("error unmarshalling stream response: " + err.Error())`
			`stopChan <- true`
			`return`
			`}`
			`fullTextResponse := streamResponsePaLM2OpenAI(&palmResponse)`
			`fullTextResponse.Id = responseId`
			`fullTextResponse.Created = createdTime`
fix: fix PaLM2 not billed 2023-07-22 16:58:14 +00:00			`if len(palmResponse.Candidates) > 0 {`
			`responseText = palmResponse.Candidates[0].Content`
			`}`
feat: support Google PaLM2 (close #105) 2023-07-22 16:32:47 +00:00			`jsonResponse, err := json.Marshal(fullTextResponse)`
			`if err != nil {`
			`common.SysError("error marshalling stream response: " + err.Error())`
			`stopChan <- true`
			`return`
			`}`
			`dataChan <- string(jsonResponse)`
			`stopChan <- true`
			`}()`
refactor: add set event stream headers func (#402) 封装流式传输响应头的设置 2023-08-12 13:55:18 +00:00			`setEventStreamHeaders(c)`
feat: support Google PaLM2 (close #105) 2023-07-22 16:32:47 +00:00			`c.Stream(func(w io.Writer) bool {`
			`select {`
			`case data := <-dataChan:`
			`c.Render(-1, common.CustomEvent{Data: "data: " + data})`
			`return true`
			`case <-stopChan:`
			`c.Render(-1, common.CustomEvent{Data: "data: [DONE]"})`
			`return false`
			`}`
			`})`
			`err := resp.Body.Close()`
			`if err != nil {`
			`return errorWrapper(err, "close_response_body_failed", http.StatusInternalServerError), ""`
			`}`
			`return nil, responseText`
			`}`

			`func palmHandler(c gin.Context, resp http.Response, promptTokens int, model string) (OpenAIErrorWithStatusCode, Usage) {`
			`responseBody, err := io.ReadAll(resp.Body)`
			`if err != nil {`
			`return errorWrapper(err, "read_response_body_failed", http.StatusInternalServerError), nil`
			`}`
			`err = resp.Body.Close()`
			`if err != nil {`
			`return errorWrapper(err, "close_response_body_failed", http.StatusInternalServerError), nil`
			`}`
			`var palmResponse PaLMChatResponse`
			`err = json.Unmarshal(responseBody, &palmResponse)`
			`if err != nil {`
			`return errorWrapper(err, "unmarshal_response_body_failed", http.StatusInternalServerError), nil`
			`}`
			`if palmResponse.Error.Code != 0 \|\| len(palmResponse.Candidates) == 0 {`
			`return &OpenAIErrorWithStatusCode{`
			`OpenAIError: OpenAIError{`
			`Message: palmResponse.Error.Message,`
			`Type: palmResponse.Error.Status,`
			`Param: "",`
			`Code: palmResponse.Error.Code,`
			`},`
			`StatusCode: resp.StatusCode,`
			`}, nil`
			`}`
			`fullTextResponse := responsePaLM2OpenAI(&palmResponse)`
			`completionTokens := countTokenText(palmResponse.Candidates[0].Content, model)`
			`usage := Usage{`
			`PromptTokens: promptTokens,`
			`CompletionTokens: completionTokens,`
			`TotalTokens: promptTokens + completionTokens,`
			`}`
			`fullTextResponse.Usage = usage`
			`jsonResponse, err := json.Marshal(fullTextResponse)`
			`if err != nil {`
			`return errorWrapper(err, "marshal_response_body_failed", http.StatusInternalServerError), nil`
			`}`
			`c.Writer.Header().Set("Content-Type", "application/json")`
			`c.Writer.WriteHeader(resp.StatusCode)`
			`_, err = c.Writer.Write(jsonResponse)`
			`return nil, &usage`
feat: PaLM support is WIP (#105) 2023-05-21 06:26:59 +00:00			`}`