|
|
@@ -0,0 +1,240 @@
|
|
|
+package controller
|
|
|
+
|
|
|
+import (
|
|
|
+ "bufio"
|
|
|
+ "encoding/json"
|
|
|
+ "github.com/gin-gonic/gin"
|
|
|
+ "io"
|
|
|
+ "net/http"
|
|
|
+ "one-api/common"
|
|
|
+ "strings"
|
|
|
+)
|
|
|
+
|
|
|
+// https://help.aliyun.com/document_detail/613695.html?spm=a2c4g.2399480.0.0.1adb778fAdzP9w#341800c0f8w0r
|
|
|
+
|
|
|
+type AliMessage struct {
|
|
|
+ User string `json:"user"`
|
|
|
+ Bot string `json:"bot"`
|
|
|
+}
|
|
|
+
|
|
|
+type AliInput struct {
|
|
|
+ Prompt string `json:"prompt"`
|
|
|
+ History []AliMessage `json:"history"`
|
|
|
+}
|
|
|
+
|
|
|
+type AliParameters struct {
|
|
|
+ TopP float64 `json:"top_p,omitempty"`
|
|
|
+ TopK int `json:"top_k,omitempty"`
|
|
|
+ Seed uint64 `json:"seed,omitempty"`
|
|
|
+ EnableSearch bool `json:"enable_search,omitempty"`
|
|
|
+}
|
|
|
+
|
|
|
+type AliChatRequest struct {
|
|
|
+ Model string `json:"model"`
|
|
|
+ Input AliInput `json:"input"`
|
|
|
+ Parameters AliParameters `json:"parameters,omitempty"`
|
|
|
+}
|
|
|
+
|
|
|
+type AliError struct {
|
|
|
+ Code string `json:"code"`
|
|
|
+ Message string `json:"message"`
|
|
|
+ RequestId string `json:"request_id"`
|
|
|
+}
|
|
|
+
|
|
|
+type AliUsage struct {
|
|
|
+ InputTokens int `json:"input_tokens"`
|
|
|
+ OutputTokens int `json:"output_tokens"`
|
|
|
+}
|
|
|
+
|
|
|
+type AliOutput struct {
|
|
|
+ Text string `json:"text"`
|
|
|
+ FinishReason string `json:"finish_reason"`
|
|
|
+}
|
|
|
+
|
|
|
+type AliChatResponse struct {
|
|
|
+ Output AliOutput `json:"output"`
|
|
|
+ Usage AliUsage `json:"usage"`
|
|
|
+ AliError
|
|
|
+}
|
|
|
+
|
|
|
+func requestOpenAI2Ali(request GeneralOpenAIRequest) *AliChatRequest {
|
|
|
+ messages := make([]AliMessage, 0, len(request.Messages))
|
|
|
+ prompt := ""
|
|
|
+ for i := 0; i < len(request.Messages); i++ {
|
|
|
+ message := request.Messages[i]
|
|
|
+ if message.Role == "system" {
|
|
|
+ messages = append(messages, AliMessage{
|
|
|
+ User: message.Content,
|
|
|
+ Bot: "Okay",
|
|
|
+ })
|
|
|
+ continue
|
|
|
+ } else {
|
|
|
+ if i == len(request.Messages)-1 {
|
|
|
+ prompt = message.Content
|
|
|
+ break
|
|
|
+ }
|
|
|
+ messages = append(messages, AliMessage{
|
|
|
+ User: message.Content,
|
|
|
+ Bot: request.Messages[i+1].Content,
|
|
|
+ })
|
|
|
+ i++
|
|
|
+ }
|
|
|
+ }
|
|
|
+ return &AliChatRequest{
|
|
|
+ Model: request.Model,
|
|
|
+ Input: AliInput{
|
|
|
+ Prompt: prompt,
|
|
|
+ History: messages,
|
|
|
+ },
|
|
|
+ //Parameters: AliParameters{ // ChatGPT's parameters are not compatible with Ali's
|
|
|
+ // TopP: request.TopP,
|
|
|
+ // TopK: 50,
|
|
|
+ // //Seed: 0,
|
|
|
+ // //EnableSearch: false,
|
|
|
+ //},
|
|
|
+ }
|
|
|
+}
|
|
|
+
|
|
|
+func responseAli2OpenAI(response *AliChatResponse) *OpenAITextResponse {
|
|
|
+ choice := OpenAITextResponseChoice{
|
|
|
+ Index: 0,
|
|
|
+ Message: Message{
|
|
|
+ Role: "assistant",
|
|
|
+ Content: response.Output.Text,
|
|
|
+ },
|
|
|
+ FinishReason: response.Output.FinishReason,
|
|
|
+ }
|
|
|
+ fullTextResponse := OpenAITextResponse{
|
|
|
+ Id: response.RequestId,
|
|
|
+ Object: "chat.completion",
|
|
|
+ Created: common.GetTimestamp(),
|
|
|
+ Choices: []OpenAITextResponseChoice{choice},
|
|
|
+ Usage: Usage{
|
|
|
+ PromptTokens: response.Usage.InputTokens,
|
|
|
+ CompletionTokens: response.Usage.OutputTokens,
|
|
|
+ TotalTokens: response.Usage.InputTokens + response.Usage.OutputTokens,
|
|
|
+ },
|
|
|
+ }
|
|
|
+ return &fullTextResponse
|
|
|
+}
|
|
|
+
|
|
|
+func streamResponseAli2OpenAI(aliResponse *AliChatResponse) *ChatCompletionsStreamResponse {
|
|
|
+ var choice ChatCompletionsStreamResponseChoice
|
|
|
+ choice.Delta.Content = aliResponse.Output.Text
|
|
|
+ choice.FinishReason = aliResponse.Output.FinishReason
|
|
|
+ response := ChatCompletionsStreamResponse{
|
|
|
+ Id: aliResponse.RequestId,
|
|
|
+ Object: "chat.completion.chunk",
|
|
|
+ Created: common.GetTimestamp(),
|
|
|
+ Model: "ernie-bot",
|
|
|
+ Choices: []ChatCompletionsStreamResponseChoice{choice},
|
|
|
+ }
|
|
|
+ return &response
|
|
|
+}
|
|
|
+
|
|
|
+func aliStreamHandler(c *gin.Context, resp *http.Response) (*OpenAIErrorWithStatusCode, *Usage) {
|
|
|
+ var usage Usage
|
|
|
+ scanner := bufio.NewScanner(resp.Body)
|
|
|
+ scanner.Split(func(data []byte, atEOF bool) (advance int, token []byte, err error) {
|
|
|
+ if atEOF && len(data) == 0 {
|
|
|
+ return 0, nil, nil
|
|
|
+ }
|
|
|
+ if i := strings.Index(string(data), "\n"); i >= 0 {
|
|
|
+ return i + 1, data[0:i], nil
|
|
|
+ }
|
|
|
+ if atEOF {
|
|
|
+ return len(data), data, nil
|
|
|
+ }
|
|
|
+ return 0, nil, nil
|
|
|
+ })
|
|
|
+ dataChan := make(chan string)
|
|
|
+ stopChan := make(chan bool)
|
|
|
+ go func() {
|
|
|
+ for scanner.Scan() {
|
|
|
+ data := scanner.Text()
|
|
|
+ if len(data) < 5 { // ignore blank line or wrong format
|
|
|
+ continue
|
|
|
+ }
|
|
|
+ if data[:5] != "data:" {
|
|
|
+ continue
|
|
|
+ }
|
|
|
+ data = data[5:]
|
|
|
+ dataChan <- data
|
|
|
+ }
|
|
|
+ stopChan <- true
|
|
|
+ }()
|
|
|
+ c.Writer.Header().Set("Content-Type", "text/event-stream")
|
|
|
+ c.Writer.Header().Set("Cache-Control", "no-cache")
|
|
|
+ c.Writer.Header().Set("Connection", "keep-alive")
|
|
|
+ c.Writer.Header().Set("Transfer-Encoding", "chunked")
|
|
|
+ c.Writer.Header().Set("X-Accel-Buffering", "no")
|
|
|
+ lastResponseText := ""
|
|
|
+ c.Stream(func(w io.Writer) bool {
|
|
|
+ select {
|
|
|
+ case data := <-dataChan:
|
|
|
+ var aliResponse AliChatResponse
|
|
|
+ err := json.Unmarshal([]byte(data), &aliResponse)
|
|
|
+ if err != nil {
|
|
|
+ common.SysError("error unmarshalling stream response: " + err.Error())
|
|
|
+ return true
|
|
|
+ }
|
|
|
+ usage.PromptTokens += aliResponse.Usage.InputTokens
|
|
|
+ usage.CompletionTokens += aliResponse.Usage.OutputTokens
|
|
|
+ usage.TotalTokens += aliResponse.Usage.InputTokens + aliResponse.Usage.OutputTokens
|
|
|
+ response := streamResponseAli2OpenAI(&aliResponse)
|
|
|
+ response.Choices[0].Delta.Content = strings.TrimPrefix(response.Choices[0].Delta.Content, lastResponseText)
|
|
|
+ lastResponseText = aliResponse.Output.Text
|
|
|
+ jsonResponse, err := json.Marshal(response)
|
|
|
+ if err != nil {
|
|
|
+ common.SysError("error marshalling stream response: " + err.Error())
|
|
|
+ return true
|
|
|
+ }
|
|
|
+ c.Render(-1, common.CustomEvent{Data: "data: " + string(jsonResponse)})
|
|
|
+ return true
|
|
|
+ case <-stopChan:
|
|
|
+ c.Render(-1, common.CustomEvent{Data: "data: [DONE]"})
|
|
|
+ return false
|
|
|
+ }
|
|
|
+ })
|
|
|
+ err := resp.Body.Close()
|
|
|
+ if err != nil {
|
|
|
+ return errorWrapper(err, "close_response_body_failed", http.StatusInternalServerError), nil
|
|
|
+ }
|
|
|
+ return nil, &usage
|
|
|
+}
|
|
|
+
|
|
|
+func aliHandler(c *gin.Context, resp *http.Response) (*OpenAIErrorWithStatusCode, *Usage) {
|
|
|
+ var aliResponse AliChatResponse
|
|
|
+ responseBody, err := io.ReadAll(resp.Body)
|
|
|
+ if err != nil {
|
|
|
+ return errorWrapper(err, "read_response_body_failed", http.StatusInternalServerError), nil
|
|
|
+ }
|
|
|
+ err = resp.Body.Close()
|
|
|
+ if err != nil {
|
|
|
+ return errorWrapper(err, "close_response_body_failed", http.StatusInternalServerError), nil
|
|
|
+ }
|
|
|
+ err = json.Unmarshal(responseBody, &aliResponse)
|
|
|
+ if err != nil {
|
|
|
+ return errorWrapper(err, "unmarshal_response_body_failed", http.StatusInternalServerError), nil
|
|
|
+ }
|
|
|
+ if aliResponse.Code != "" {
|
|
|
+ return &OpenAIErrorWithStatusCode{
|
|
|
+ OpenAIError: OpenAIError{
|
|
|
+ Message: aliResponse.Message,
|
|
|
+ Type: aliResponse.Code,
|
|
|
+ Param: aliResponse.RequestId,
|
|
|
+ Code: aliResponse.Code,
|
|
|
+ },
|
|
|
+ StatusCode: resp.StatusCode,
|
|
|
+ }, nil
|
|
|
+ }
|
|
|
+ fullTextResponse := responseAli2OpenAI(&aliResponse)
|
|
|
+ jsonResponse, err := json.Marshal(fullTextResponse)
|
|
|
+ if err != nil {
|
|
|
+ return errorWrapper(err, "marshal_response_body_failed", http.StatusInternalServerError), nil
|
|
|
+ }
|
|
|
+ c.Writer.Header().Set("Content-Type", "application/json")
|
|
|
+ c.Writer.WriteHeader(resp.StatusCode)
|
|
|
+ _, err = c.Writer.Write(jsonResponse)
|
|
|
+ return nil, &fullTextResponse.Usage
|
|
|
+}
|