coai/manager/transhipment.go
2023-11-13 21:46:14 +08:00

233 lines
6.3 KiB
Go

package manager
import (
"chat/adapter"
"chat/addition/web"
"chat/admin"
"chat/auth"
"chat/globals"
"chat/utils"
"fmt"
"github.com/gin-gonic/gin"
"io"
"net/http"
"strings"
"time"
)
type TranshipmentForm struct {
Model string `json:"model" binding:"required"`
Messages []globals.Message `json:"messages" binding:"required"`
Stream bool `json:"stream"`
MaxTokens int `json:"max_tokens"`
}
type Choice struct {
Index int `json:"index"`
Message globals.Message `json:"message"`
FinishReason string `json:"finish_reason"`
}
type Usage struct {
PromptTokens int `json:"prompt_tokens"`
CompletionTokens int `json:"completion_tokens"`
TotalTokens int `json:"total_tokens"`
}
type TranshipmentResponse struct {
Id string `json:"id"`
Object string `json:"object"`
Created int64 `json:"created"`
Model string `json:"model"`
Choices []Choice `json:"choices"`
Usage Usage `json:"usage"`
Quota float32 `json:"quota"`
}
type ChoiceDelta struct {
Index int `json:"index"`
Delta globals.Message `json:"delta"`
FinishReason interface{} `json:"finish_reason"`
}
type TranshipmentStreamResponse struct {
Id string `json:"id"`
Object string `json:"object"`
Created int64 `json:"created"`
Model string `json:"model"`
Choices []ChoiceDelta `json:"choices"`
Usage Usage `json:"usage"`
Quota float32 `json:"quota"`
}
func ModelAPI(c *gin.Context) {
c.JSON(http.StatusOK, globals.AllModels)
}
func TranshipmentAPI(c *gin.Context) {
username := utils.GetUserFromContext(c)
if username == "" {
c.AbortWithStatusJSON(403, gin.H{
"code": 403,
"message": "Access denied. Please provide correct api key.",
})
return
}
if utils.GetAgentFromContext(c) != "api" {
c.AbortWithStatusJSON(403, gin.H{
"code": 403,
"message": "Access denied. Please provide correct api key.",
})
return
}
var form TranshipmentForm
if err := c.ShouldBindJSON(&form); err != nil {
c.JSON(400, gin.H{
"status": false,
"error": "invalid request body",
"reason": err.Error(),
})
return
}
db := utils.GetDBFromContext(c)
cache := utils.GetCacheFromContext(c)
user := &auth.User{
Username: username,
}
id := utils.Md5Encrypt(username + form.Model + time.Now().String())
created := time.Now().Unix()
check, plan := auth.CanEnableModelWithSubscription(db, cache, user, form.Model)
if !check {
c.JSON(http.StatusForbidden, gin.H{
"status": false,
"error": "quota exceeded",
"reason": "not enough quota to use this model",
})
return
}
if strings.HasPrefix(form.Model, "web-") {
suffix := strings.TrimPrefix(form.Model, "web-")
if utils.Contains[string](suffix, globals.AllModels) {
form.Model = suffix
form.Messages = web.UsingWebNativeSegment(true, form.Messages)
}
}
if form.Stream {
sendStreamTranshipmentResponse(c, form, id, created, user, plan)
} else {
sendTranshipmentResponse(c, form, id, created, user, plan)
}
}
func sendTranshipmentResponse(c *gin.Context, form TranshipmentForm, id string, created int64, user *auth.User, plan bool) {
buffer := utils.NewBuffer(form.Model, form.Messages)
err := adapter.NewChatRequest(&adapter.ChatProps{
Model: form.Model,
Message: form.Messages,
Plan: plan,
Token: form.MaxTokens,
}, func(data string) error {
buffer.Write(data)
return nil
})
admin.AnalysisRequest(form.Model, buffer, err)
if err != nil {
auth.RevertSubscriptionUsage(utils.GetCacheFromContext(c), user, form.Model, plan)
globals.Warn(fmt.Sprintf("error from chat request api: %s (instance: %s, client: %s)", err, form.Model, c.ClientIP()))
}
CollectQuota(c, user, buffer, plan)
c.JSON(http.StatusOK, TranshipmentResponse{
Id: fmt.Sprintf("chatcmpl-%s", id),
Object: "chat.completion",
Created: created,
Model: form.Model,
Choices: []Choice{
{
Index: 0,
Message: globals.Message{Role: globals.Assistant, Content: buffer.ReadWithDefault(defaultMessage)},
FinishReason: "stop",
},
},
Usage: Usage{
PromptTokens: buffer.CountInputToken(),
CompletionTokens: buffer.CountOutputToken(),
TotalTokens: buffer.CountToken(),
},
Quota: buffer.GetQuota(),
})
}
func getStreamTranshipmentForm(id string, created int64, form TranshipmentForm, data string, buffer *utils.Buffer, end bool) TranshipmentStreamResponse {
return TranshipmentStreamResponse{
Id: fmt.Sprintf("chatcmpl-%s", id),
Object: "chat.completion.chunk",
Created: created,
Model: form.Model,
Choices: []ChoiceDelta{
{
Index: 0,
Delta: globals.Message{
Role: globals.Assistant,
Content: data,
},
FinishReason: utils.Multi[interface{}](end, "stop", nil),
},
},
Usage: Usage{
PromptTokens: utils.MultiF(end, func() int { return buffer.CountInputToken() }, 0),
CompletionTokens: utils.MultiF(end, func() int { return buffer.CountOutputToken() }, 0),
TotalTokens: utils.MultiF(end, func() int { return buffer.CountToken() }, 0),
},
Quota: buffer.GetQuota(),
}
}
func sendStreamTranshipmentResponse(c *gin.Context, form TranshipmentForm, id string, created int64, user *auth.User, plan bool) {
channel := make(chan TranshipmentStreamResponse)
go func() {
buffer := utils.NewBuffer(form.Model, form.Messages)
err := adapter.NewChatRequest(&adapter.ChatProps{
Model: form.Model,
Message: form.Messages,
Plan: plan,
Token: form.MaxTokens,
}, func(data string) error {
channel <- getStreamTranshipmentForm(id, created, form, buffer.Write(data), buffer, false)
return nil
})
admin.AnalysisRequest(form.Model, buffer, err)
if err != nil {
auth.RevertSubscriptionUsage(utils.GetCacheFromContext(c), user, form.Model, plan)
channel <- getStreamTranshipmentForm(id, created, form, fmt.Sprintf("Error: %s", err.Error()), buffer, true)
CollectQuota(c, user, buffer, plan)
close(channel)
return
}
channel <- getStreamTranshipmentForm(id, created, form, "", buffer, true)
CollectQuota(c, user, buffer, plan)
close(channel)
return
}()
c.Stream(func(w io.Writer) bool {
if resp, ok := <-channel; ok {
c.Render(-1, utils.NewEvent(resp))
return true
}
c.Render(-1, utils.NewEndEvent())
return false
})
}