perf: use max_tokens to reduce token consumption

This commit is contained in:
JustSong 2023-05-16 16:22:25 +08:00
parent c9ac5e391f
commit 58fe923c85
2 changed files with 6 additions and 4 deletions

View File

@ -211,10 +211,11 @@ func buildTestRequest(c *gin.Context) *ChatRequest {
model_ := c.Query("model")
testRequest := &ChatRequest{
Model: model_,
MaxTokens: 1,
}
testMessage := Message{
Role: "user",
Content: "echo hi",
Content: "hi",
}
testRequest.Messages = append(testRequest.Messages, testMessage)
return testRequest

View File

@ -23,6 +23,7 @@ type Message struct {
// ChatRequest is the JSON-encodable body of a chat request. It carries the
// target model name, the list of conversation messages, and a max_tokens
// value.
type ChatRequest struct {
	// Model is encoded under the "model" key.
	Model string `json:"model"`
	// Messages is encoded under the "messages" key.
	Messages []Message `json:"messages"`
	// MaxTokens is encoded under the "max_tokens" key. The tag has no
	// omitempty option, so a zero value is still written out as 0.
	// NOTE(review): presumably this caps the number of tokens the upstream
	// API may generate; confirm against the API being called.
	MaxTokens int `json:"max_tokens"`
}
type TextRequest struct {