Compare commits

6 Commits: v0.6.5-alp ... v0.6.5-alp
| Author | SHA1 | Date |
|---|---|---|
| | 065da8ef8c | |
| | e3cfb1fa52 | |
| | f89ae5ad58 | |
| | 06a3fc5421 | |
| | a9c464ec5a | |
| | 3f3c13c98c | |
```diff
@@ -75,7 +75,7 @@ var ModelRatio = map[string]float64{
 	"ERNIE-Bot":       0.8572,     // ¥0.012 / 1k tokens
 	"ERNIE-Bot-turbo": 0.5715,     // ¥0.008 / 1k tokens
 	"ERNIE-Bot-4":     0.12 * RMB, // ¥0.12 / 1k tokens
-	"ERNIE-Bot-8k":    0.024 * RMB,
+	"ERNIE-Bot-8K":    0.024 * RMB,
 	"Embedding-V1":    0.1429,     // ¥0.002 / 1k tokens
 	"bge-large-zh":    0.002 * RMB,
 	"bge-large-en":    0.002 * RMB,
```
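The only change in this hunk is the `ERNIE-Bot-8k` → `ERNIE-Bot-8K` casing fix; `ModelRatio` keys are matched exactly as map lookups, so the lowercase variant would never be hit. The comments also pin down the conversion between yuan prices and ratio units. A minimal sketch of that arithmetic, with the `RMB` constant back-solved from the `ERNIE-Bot` line rather than read from the repository:

```go
package main

import "fmt"

// Back-solved from the hunk's own comment: ratio 0.8572 == ¥0.012 / 1k tokens,
// so RMB = 0.8572 / 0.012 ≈ 71.43 ratio units per yuan (per 1k tokens).
// The repository's actual definition of RMB may be written differently.
const RMB = 0.8572 / 0.012

func main() {
	fmt.Printf("ERNIE-Bot:       %.4f\n", 0.012*RMB) // 0.8572
	fmt.Printf("ERNIE-Bot-turbo: %.4f\n", 0.008*RMB) // ≈ 0.5715
	fmt.Printf("ERNIE-Bot-8K:    %.4f\n", 0.024*RMB) // ≈ 1.7143
}
```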
```diff
@@ -50,8 +50,8 @@ func ConvertRequest(request model.GeneralOpenAIRequest) *ChatRequest {
 			TopP:         request.TopP,
 			TopK:         request.TopK,
 			ResultFormat: "message",
+			Tools:        request.Tools,
 		},
-		Tools: request.Tools,
 	}
 }
 
```
```diff
@@ -16,21 +16,21 @@ type Input struct {
 }
 
 type Parameters struct {
 	TopP              float64 `json:"top_p,omitempty"`
 	TopK              int     `json:"top_k,omitempty"`
 	Seed              uint64  `json:"seed,omitempty"`
 	EnableSearch      bool    `json:"enable_search,omitempty"`
 	IncrementalOutput bool    `json:"incremental_output,omitempty"`
 	MaxTokens         int     `json:"max_tokens,omitempty"`
 	Temperature       float64 `json:"temperature,omitempty"`
 	ResultFormat      string  `json:"result_format,omitempty"`
+	Tools             []model.Tool `json:"tools,omitempty"`
 }
 
 type ChatRequest struct {
 	Model      string     `json:"model"`
 	Input      Input      `json:"input"`
 	Parameters Parameters `json:"parameters,omitempty"`
-	Tools      []model.Tool `json:"tools,omitempty"`
 }
 
 type EmbeddingRequest struct {
```
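Together with the previous hunk, this moves `Tools` from the top level of `ChatRequest` into `Parameters`, so tool definitions are serialized under `parameters.tools` instead of a top-level `tools` key. A sketch of the resulting wire shape under the struct tags above, using trimmed mirror types (the model name and tool stub are placeholders):

```go
package main

import (
	"encoding/json"
	"fmt"
)

// Trimmed mirrors of the structs above, just enough to show the JSON nesting.
type parameters struct {
	ResultFormat string `json:"result_format,omitempty"`
	Tools        []any  `json:"tools,omitempty"`
}
type chatRequest struct {
	Model      string     `json:"model"`
	Parameters parameters `json:"parameters,omitempty"`
}

func main() {
	req := chatRequest{
		Model: "qwen-max", // placeholder model name
		Parameters: parameters{
			ResultFormat: "message",
			Tools:        []any{map[string]string{"type": "function"}}, // illustrative stub
		},
	}
	b, _ := json.Marshal(req)
	fmt.Println(string(b))
	// {"model":"qwen-max","parameters":{"result_format":"message","tools":[{"type":"function"}]}}
}
```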
```diff
@@ -38,6 +38,7 @@ func ConvertRequest(textRequest model.GeneralOpenAIRequest) *Request {
 		MaxTokens:   textRequest.MaxTokens,
 		Temperature: textRequest.Temperature,
 		TopP:        textRequest.TopP,
+		TopK:        textRequest.TopK,
 		Stream:      textRequest.Stream,
 	}
 	if claudeRequest.MaxTokens == 0 {
```
```diff
@@ -70,8 +70,10 @@ func (a *Adaptor) DoRequest(c *gin.Context, meta *util.RelayMeta, requestBody io
 func (a *Adaptor) DoResponse(c *gin.Context, resp *http.Response, meta *util.RelayMeta) (usage *model.Usage, err *model.ErrorWithStatusCode) {
 	if meta.IsStream {
 		var responseText string
-		err, responseText, _ = StreamHandler(c, resp, meta.Mode)
-		usage = ResponseText2Usage(responseText, meta.ActualModelName, meta.PromptTokens)
+		err, responseText, usage = StreamHandler(c, resp, meta.Mode)
+		if usage == nil {
+			usage = ResponseText2Usage(responseText, meta.ActualModelName, meta.PromptTokens)
+		}
 	} else {
 		err, usage = Handler(c, resp, meta.PromptTokens, meta.ActualModelName)
 	}
```
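The behavioral point of this hunk: `StreamHandler` now returns a usage value itself (for upstreams whose streams report token usage), and counting tokens from the accumulated response text becomes a fallback used only when that value is nil. A self-contained sketch of the pattern, with hypothetical stand-ins for the handler and the counter:

```go
package main

import "fmt"

type Usage struct{ PromptTokens, CompletionTokens, TotalTokens int }

// streamHandler mimics the new contract: it returns the accumulated text plus
// usage when the upstream stream reported it, or nil usage when it did not.
// (Hypothetical stand-in for the adaptor's StreamHandler.)
func streamHandler(reported bool) (string, *Usage) {
	if reported {
		return "hello", &Usage{PromptTokens: 3, CompletionTokens: 1, TotalTokens: 4}
	}
	return "hello", nil
}

// textToUsage stands in for ResponseText2Usage: estimate usage from the text.
func textToUsage(text string, promptTokens int) *Usage {
	completion := len(text) // crude placeholder for real tokenization
	return &Usage{PromptTokens: promptTokens, CompletionTokens: completion, TotalTokens: promptTokens + completion}
}

func main() {
	for _, reported := range []bool{true, false} {
		text, usage := streamHandler(reported)
		if usage == nil { // fall back only when the stream carried no usage
			usage = textToUsage(text, 3)
		}
		fmt.Printf("reported=%v usage=%+v\n", reported, *usage)
	}
}
```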
```diff
@@ -26,7 +26,11 @@ import (
 
 func requestOpenAI2Xunfei(request model.GeneralOpenAIRequest, xunfeiAppId string, domain string) *ChatRequest {
 	messages := make([]Message, 0, len(request.Messages))
+	var lastToolCalls []model.Tool
 	for _, message := range request.Messages {
+		if message.ToolCalls != nil {
+			lastToolCalls = message.ToolCalls
+		}
 		messages = append(messages, Message{
 			Role:    message.Role,
 			Content: message.StringContent(),
```
```diff
@@ -39,9 +43,33 @@ func requestOpenAI2Xunfei(request model.GeneralOpenAIRequest, xunfeiAppId string
 	xunfeiRequest.Parameter.Chat.TopK = request.N
 	xunfeiRequest.Parameter.Chat.MaxTokens = request.MaxTokens
 	xunfeiRequest.Payload.Message.Text = messages
+	if len(lastToolCalls) != 0 {
+		for _, toolCall := range lastToolCalls {
+			xunfeiRequest.Payload.Functions.Text = append(xunfeiRequest.Payload.Functions.Text, toolCall.Function)
+		}
+	}
+
 	return &xunfeiRequest
 }
 
+func getToolCalls(response *ChatResponse) []model.Tool {
+	var toolCalls []model.Tool
+	if len(response.Payload.Choices.Text) == 0 {
+		return toolCalls
+	}
+	item := response.Payload.Choices.Text[0]
+	if item.FunctionCall == nil {
+		return toolCalls
+	}
+	toolCall := model.Tool{
+		Id:       fmt.Sprintf("call_%s", helper.GetUUID()),
+		Type:     "function",
+		Function: *item.FunctionCall,
+	}
+	toolCalls = append(toolCalls, toolCall)
+	return toolCalls
+}
+
 func responseXunfei2OpenAI(response *ChatResponse) *openai.TextResponse {
 	if len(response.Payload.Choices.Text) == 0 {
 		response.Payload.Choices.Text = []ChatResponseTextItem{
```
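Two things worth noting in this hunk: the request side forwards only the most recently seen tool calls (`lastToolCalls`) into `Payload.Functions.Text`, and the response side gains `getToolCalls`, which wraps Spark's single `function_call` into an OpenAI-style tool-call slice with a synthetic `call_…` id, returning an empty slice when there is no call. A small sketch of that wrapping with stand-in types:

```go
package main

import (
	"encoding/json"
	"fmt"
)

// Hypothetical stand-ins for the model.Function / model.Tool types used above.
type Function struct {
	Name      string `json:"name"`
	Arguments string `json:"arguments"`
}
type Tool struct {
	Id       string   `json:"id"`
	Type     string   `json:"type"`
	Function Function `json:"function"`
}

func main() {
	// Suppose the first Spark choice carried this function_call.
	fc := &Function{Name: "get_weather", Arguments: `{"city":"Beijing"}`}

	// Same shape getToolCalls produces; the real code generates the id with
	// helper.GetUUID(), so the literal suffix here is only illustrative.
	toolCalls := []Tool{{Id: "call_0123456789abcdef", Type: "function", Function: *fc}}

	b, _ := json.MarshalIndent(toolCalls, "", "  ")
	fmt.Println(string(b))
}
```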
```diff
@@ -53,8 +81,9 @@ func responseXunfei2OpenAI(response *ChatResponse) *openai.TextResponse {
 	choice := openai.TextResponseChoice{
 		Index: 0,
 		Message: model.Message{
 			Role:      "assistant",
 			Content:   response.Payload.Choices.Text[0].Content,
+			ToolCalls: getToolCalls(response),
 		},
 		FinishReason: constant.StopFinishReason,
 	}
```
```diff
@@ -78,6 +107,7 @@ func streamResponseXunfei2OpenAI(xunfeiResponse *ChatResponse) *openai.ChatCompl
 	}
 	var choice openai.ChatCompletionsStreamResponseChoice
 	choice.Delta.Content = xunfeiResponse.Payload.Choices.Text[0].Content
+	choice.Delta.ToolCalls = getToolCalls(xunfeiResponse)
 	if xunfeiResponse.Payload.Choices.Status == 2 {
 		choice.FinishReason = &constant.StopFinishReason
 	}
```
```diff
@@ -26,13 +26,18 @@ type ChatRequest struct {
 		Message struct {
 			Text []Message `json:"text"`
 		} `json:"message"`
+		Functions struct {
+			Text []model.Function `json:"text,omitempty"`
+		} `json:"functions"`
 	} `json:"payload"`
 }
 
 type ChatResponseTextItem struct {
 	Content string `json:"content"`
 	Role    string `json:"role"`
 	Index   int    `json:"index"`
+	ContentType  string          `json:"content_type"`
+	FunctionCall *model.Function `json:"function_call"`
 }
 
 type ChatResponse struct {
```
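With the new `Functions` block, function definitions travel inside `payload` next to the messages, and response items can now carry `content_type` and `function_call`. A sketch of the request body this yields, using a trimmed mirror of the struct above (values are placeholders):

```go
package main

import (
	"encoding/json"
	"fmt"
)

// Trimmed mirror of the ChatRequest payload above, enough to show the wire shape.
type payload struct {
	Message struct {
		Text []map[string]string `json:"text"`
	} `json:"message"`
	Functions struct {
		Text []map[string]any `json:"text,omitempty"`
	} `json:"functions"`
}

func main() {
	var p payload
	p.Message.Text = []map[string]string{{"role": "user", "content": "What's the weather?"}}
	p.Functions.Text = []map[string]any{{"name": "get_weather"}} // illustrative definition
	b, _ := json.Marshal(struct {
		Payload payload `json:"payload"`
	}{p})
	fmt.Println(string(b))
	// {"payload":{"message":{"text":[{"content":"What's the weather?","role":"user"}]},
	//  "functions":{"text":[{"name":"get_weather"}]}}}
}
```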
```diff
@@ -24,6 +24,8 @@ type GeneralOpenAIRequest struct {
 	User        string `json:"user,omitempty"`
 	Prompt      any    `json:"prompt,omitempty"`
 	Input       any    `json:"input,omitempty"`
+	EncodingFormat string `json:"encoding_format,omitempty"`
+	Dimensions     int    `json:"dimensions,omitempty"`
 	Instruction string `json:"instruction,omitempty"`
 	Size        string `json:"size,omitempty"`
 }
```
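`encoding_format` and `dimensions` are the standard OpenAI embeddings parameters; without fields for them, `GeneralOpenAIRequest` silently dropped both when re-serializing a client request. A sketch of the round trip that now works (model name illustrative):

```go
package main

import (
	"encoding/json"
	"fmt"
)

// Trimmed to the embedding-relevant fields of GeneralOpenAIRequest.
type embeddingFields struct {
	Model          string `json:"model"`
	Input          any    `json:"input,omitempty"`
	EncodingFormat string `json:"encoding_format,omitempty"`
	Dimensions     int    `json:"dimensions,omitempty"`
}

func main() {
	body := []byte(`{"model":"text-embedding-3-small","input":"hello world","encoding_format":"float","dimensions":256}`)
	var req embeddingFields
	_ = json.Unmarshal(body, &req)
	fmt.Printf("%+v\n", req) // the two new fields now survive the round trip
}
```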