Просмотр исходного кода

perf: use max_tokens to reduce token consuming

JustSong 2 года назад
Родитель
Коммит
58fe923c85
2 изменённых файла: 6 добавлений и 4 удаления
  1. 3 2
      controller/channel.go
  2. 3 2
      controller/relay.go

+ 3 - 2
controller/channel.go

@@ -210,11 +210,12 @@ func testChannel(channel *model.Channel, request *ChatRequest) error {
 func buildTestRequest(c *gin.Context) *ChatRequest {
 func buildTestRequest(c *gin.Context) *ChatRequest {
 	model_ := c.Query("model")
 	model_ := c.Query("model")
 	testRequest := &ChatRequest{
 	testRequest := &ChatRequest{
-		Model: model_,
+		Model:     model_,
+		MaxTokens: 1,
 	}
 	}
 	testMessage := Message{
 	testMessage := Message{
 		Role:    "user",
 		Role:    "user",
-		Content: "echo hi",
+		Content: "hi",
 	}
 	}
 	testRequest.Messages = append(testRequest.Messages, testMessage)
 	testRequest.Messages = append(testRequest.Messages, testMessage)
 	return testRequest
 	return testRequest

+ 3 - 2
controller/relay.go

@@ -21,8 +21,9 @@ type Message struct {
 }
 }
 
 
 type ChatRequest struct {
 type ChatRequest struct {
-	Model    string    `json:"model"`
-	Messages []Message `json:"messages"`
+	Model     string    `json:"model"`
+	Messages  []Message `json:"messages"`
+	MaxTokens int       `json:"max_tokens"`
 }
 }
 
 
 type TextRequest struct {
 type TextRequest struct {