| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702
703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811 |
- package common
import (
	"encoding/json"
	"errors"
	"fmt"
	"sort"
	"strings"
	"time"

	"github.com/QuantumNous/new-api/common"
	"github.com/QuantumNous/new-api/constant"
	"github.com/QuantumNous/new-api/dto"
	relayconstant "github.com/QuantumNous/new-api/relay/constant"
	"github.com/QuantumNous/new-api/setting/model_setting"
	"github.com/QuantumNous/new-api/types"
	"github.com/gin-gonic/gin"
	"github.com/gorilla/websocket"
)
// ThinkingContentInfo groups the boolean flags that describe the state of
// thinking-content output for a request.
type ThinkingContentInfo struct {
	// IsFirstThinkingContent is true until the first piece of thinking
	// content has been handled (presumably cleared by the stream handlers —
	// confirm against callers).
	IsFirstThinkingContent bool
	// SendLastThinkingContent marks whether the last thinking content has
	// been sent.
	SendLastThinkingContent bool
	// HasSentThinkingContent marks whether any thinking content has been sent.
	HasSentThinkingContent bool
}
// Values stored in ClaudeConvertInfo.LastMessagesType to record what kind of
// message was handled last.
const (
	// LastMessageTypeNone means no message has been handled yet.
	LastMessageTypeNone = "none"
	// LastMessageTypeText means the last message was text.
	LastMessageTypeText = "text"
	// LastMessageTypeTools means the last message was a tool call.
	LastMessageTypeTools = "tools"
	// LastMessageTypeThinking means the last message was thinking content.
	LastMessageTypeThinking = "thinking"
)
- type ClaudeConvertInfo struct {
- LastMessagesType string
- Index int
- Usage *dto.Usage
- FinishReason string
- Done bool
- ToolCallBaseIndex int
- ToolCallMaxIndexOffset int
- }
// RerankerInfo holds the rerank-specific request data that GenRelayInfoRerank
// copies from the incoming rerank request.
type RerankerInfo struct {
	// Documents is the list of documents taken from the request.
	Documents []any
	// ReturnDocuments is the request's return-documents flag.
	ReturnDocuments bool
}
// BuildInToolInfo records per-tool bookkeeping for a built-in tool declared
// on a Responses API request.
type BuildInToolInfo struct {
	// ToolName is the tool's "type" value from the request.
	ToolName string
	// CallCount is the number of calls counted for this tool; it starts at 0.
	CallCount int
	// SearchContextSize is filled in for the web search preview tool and
	// defaults to "medium" when the request leaves it empty.
	SearchContextSize string
}
- type ResponsesUsageInfo struct {
- BuiltInTools map[string]*BuildInToolInfo
- }
- type ChannelMeta struct {
- ChannelType int
- ChannelId int
- ChannelIsMultiKey bool
- ChannelMultiKeyIndex int
- ChannelBaseUrl string
- ApiType int
- ApiVersion string
- ApiKey string
- Organization string
- ChannelCreateTime int64
- ParamOverride map[string]interface{}
- HeadersOverride map[string]interface{}
- ChannelSetting dto.ChannelSettings
- ChannelOtherSettings dto.ChannelOtherSettings
- UpstreamModelName string
- IsModelMapped bool
- SupportStreamOptions bool // 是否支持流式选项
- }
// TokenCountMeta stores token-count metadata for a request. It is embedded in
// RelayInfo and accessed through SetEstimatePromptTokens and
// GetEstimatePromptTokens.
type TokenCountMeta struct {
	// estimatePromptTokens is the estimated number of prompt tokens.
	estimatePromptTokens int
}
- type RelayInfo struct {
- TokenId int
- TokenKey string
- TokenGroup string
- UserId int
- UsingGroup string // 使用的分组,当auto跨分组重试时,会变动
- UserGroup string // 用户所在分组
- TokenUnlimited bool
- StartTime time.Time
- FirstResponseTime time.Time
- isFirstResponse bool
- //SendLastReasoningResponse bool
- IsStream bool
- IsGeminiBatchEmbedding bool
- IsPlayground bool
- UsePrice bool
- RelayMode int
- OriginModelName string
- RequestURLPath string
- ShouldIncludeUsage bool
- DisablePing bool // 是否禁止向下游发送自定义 Ping
- ClientWs *websocket.Conn
- TargetWs *websocket.Conn
- InputAudioFormat string
- OutputAudioFormat string
- RealtimeTools []dto.RealTimeTool
- IsFirstRequest bool
- AudioUsage bool
- ReasoningEffort string
- UserSetting dto.UserSetting
- UserEmail string
- UserQuota int
- RelayFormat types.RelayFormat
- SendResponseCount int
- ReceivedResponseCount int
- FinalPreConsumedQuota int // 最终预消耗的配额
- // ForcePreConsume 为 true 时禁用 BillingSession 的信任额度旁路,
- // 强制预扣全额。用于异步任务(视频/音乐生成等),因为请求返回后任务仍在运行,
- // 必须在提交前锁定全额。
- ForcePreConsume bool
- // Billing 是计费会话,封装了预扣费/结算/退款的统一生命周期。
- // 免费模型时为 nil。
- Billing BillingSettler
- // BillingSource indicates whether this request is billed from wallet quota or subscription.
- // "" or "wallet" => wallet; "subscription" => subscription
- BillingSource string
- // SubscriptionId is the user_subscriptions.id used when BillingSource == "subscription"
- SubscriptionId int
- // SubscriptionPreConsumed is the amount pre-consumed on subscription item (quota units or 1)
- SubscriptionPreConsumed int64
- // SubscriptionPostDelta is the post-consume delta applied to amount_used (quota units; can be negative).
- SubscriptionPostDelta int64
- // SubscriptionPlanId / SubscriptionPlanTitle are used for logging/UI display.
- SubscriptionPlanId int
- SubscriptionPlanTitle string
- // RequestId is used for idempotent pre-consume/refund
- RequestId string
- // SubscriptionAmountTotal / SubscriptionAmountUsedAfterPreConsume are used to compute remaining in logs.
- SubscriptionAmountTotal int64
- SubscriptionAmountUsedAfterPreConsume int64
- IsClaudeBetaQuery bool // /v1/messages?beta=true
- IsChannelTest bool // channel test request
- PriceData types.PriceData
- Request dto.Request
- // RequestConversionChain records request format conversions in order, e.g.
- // ["openai", "openai_responses"] or ["openai", "claude"].
- RequestConversionChain []types.RelayFormat
- // 最终请求到上游的格式。可由 adaptor 显式设置;
- // 若为空,调用 GetFinalRequestRelayFormat 会回退到 RequestConversionChain 的最后一项或 RelayFormat。
- FinalRequestRelayFormat types.RelayFormat
- ThinkingContentInfo
- TokenCountMeta
- *ClaudeConvertInfo
- *RerankerInfo
- *ResponsesUsageInfo
- *ChannelMeta
- *TaskRelayInfo
- }
- func (info *RelayInfo) InitChannelMeta(c *gin.Context) {
- channelType := common.GetContextKeyInt(c, constant.ContextKeyChannelType)
- paramOverride := common.GetContextKeyStringMap(c, constant.ContextKeyChannelParamOverride)
- headerOverride := common.GetContextKeyStringMap(c, constant.ContextKeyChannelHeaderOverride)
- apiType, _ := common.ChannelType2APIType(channelType)
- channelMeta := &ChannelMeta{
- ChannelType: channelType,
- ChannelId: common.GetContextKeyInt(c, constant.ContextKeyChannelId),
- ChannelIsMultiKey: common.GetContextKeyBool(c, constant.ContextKeyChannelIsMultiKey),
- ChannelMultiKeyIndex: common.GetContextKeyInt(c, constant.ContextKeyChannelMultiKeyIndex),
- ChannelBaseUrl: common.GetContextKeyString(c, constant.ContextKeyChannelBaseUrl),
- ApiType: apiType,
- ApiVersion: c.GetString("api_version"),
- ApiKey: common.GetContextKeyString(c, constant.ContextKeyChannelKey),
- Organization: c.GetString("channel_organization"),
- ChannelCreateTime: c.GetInt64("channel_create_time"),
- ParamOverride: paramOverride,
- HeadersOverride: headerOverride,
- UpstreamModelName: common.GetContextKeyString(c, constant.ContextKeyOriginalModel),
- IsModelMapped: false,
- SupportStreamOptions: false,
- }
- if channelType == constant.ChannelTypeAzure {
- channelMeta.ApiVersion = GetAPIVersion(c)
- }
- if channelType == constant.ChannelTypeVertexAi {
- channelMeta.ApiVersion = c.GetString("region")
- }
- channelSetting, ok := common.GetContextKeyType[dto.ChannelSettings](c, constant.ContextKeyChannelSetting)
- if ok {
- channelMeta.ChannelSetting = channelSetting
- }
- channelOtherSettings, ok := common.GetContextKeyType[dto.ChannelOtherSettings](c, constant.ContextKeyChannelOtherSetting)
- if ok {
- channelMeta.ChannelOtherSettings = channelOtherSettings
- }
- if streamSupportedChannels[channelMeta.ChannelType] {
- channelMeta.SupportStreamOptions = true
- }
- info.ChannelMeta = channelMeta
- // reset some fields based on channel meta
- // 重置某些字段,例如模型名称等
- if info.Request != nil {
- info.Request.SetModelName(info.OriginModelName)
- }
- }
- func (info *RelayInfo) ToString() string {
- if info == nil {
- return "RelayInfo<nil>"
- }
- // Basic info
- b := &strings.Builder{}
- fmt.Fprintf(b, "RelayInfo{ ")
- fmt.Fprintf(b, "RelayFormat: %s, ", info.RelayFormat)
- fmt.Fprintf(b, "RelayMode: %d, ", info.RelayMode)
- fmt.Fprintf(b, "IsStream: %t, ", info.IsStream)
- fmt.Fprintf(b, "IsPlayground: %t, ", info.IsPlayground)
- fmt.Fprintf(b, "RequestURLPath: %q, ", info.RequestURLPath)
- fmt.Fprintf(b, "OriginModelName: %q, ", info.OriginModelName)
- fmt.Fprintf(b, "EstimatePromptTokens: %d, ", info.estimatePromptTokens)
- fmt.Fprintf(b, "ShouldIncludeUsage: %t, ", info.ShouldIncludeUsage)
- fmt.Fprintf(b, "DisablePing: %t, ", info.DisablePing)
- fmt.Fprintf(b, "SendResponseCount: %d, ", info.SendResponseCount)
- fmt.Fprintf(b, "FinalPreConsumedQuota: %d, ", info.FinalPreConsumedQuota)
- // User & token info (mask secrets)
- fmt.Fprintf(b, "User{ Id: %d, Email: %q, Group: %q, UsingGroup: %q, Quota: %d }, ",
- info.UserId, common.MaskEmail(info.UserEmail), info.UserGroup, info.UsingGroup, info.UserQuota)
- fmt.Fprintf(b, "Token{ Id: %d, Unlimited: %t, Key: ***masked*** }, ", info.TokenId, info.TokenUnlimited)
- // Time info
- latencyMs := info.FirstResponseTime.Sub(info.StartTime).Milliseconds()
- fmt.Fprintf(b, "Timing{ Start: %s, FirstResponse: %s, LatencyMs: %d }, ",
- info.StartTime.Format(time.RFC3339Nano), info.FirstResponseTime.Format(time.RFC3339Nano), latencyMs)
- // Audio / realtime
- if info.InputAudioFormat != "" || info.OutputAudioFormat != "" || len(info.RealtimeTools) > 0 || info.AudioUsage {
- fmt.Fprintf(b, "Realtime{ AudioUsage: %t, InFmt: %q, OutFmt: %q, Tools: %d }, ",
- info.AudioUsage, info.InputAudioFormat, info.OutputAudioFormat, len(info.RealtimeTools))
- }
- // Reasoning
- if info.ReasoningEffort != "" {
- fmt.Fprintf(b, "ReasoningEffort: %q, ", info.ReasoningEffort)
- }
- // Price data (non-sensitive)
- if info.PriceData.UsePrice {
- fmt.Fprintf(b, "PriceData{ %s }, ", info.PriceData.ToSetting())
- }
- // Channel metadata (mask ApiKey)
- if info.ChannelMeta != nil {
- cm := info.ChannelMeta
- fmt.Fprintf(b, "ChannelMeta{ Type: %d, Id: %d, IsMultiKey: %t, MultiKeyIndex: %d, BaseURL: %q, ApiType: %d, ApiVersion: %q, Organization: %q, CreateTime: %d, UpstreamModelName: %q, IsModelMapped: %t, SupportStreamOptions: %t, ApiKey: ***masked*** }, ",
- cm.ChannelType, cm.ChannelId, cm.ChannelIsMultiKey, cm.ChannelMultiKeyIndex, cm.ChannelBaseUrl, cm.ApiType, cm.ApiVersion, cm.Organization, cm.ChannelCreateTime, cm.UpstreamModelName, cm.IsModelMapped, cm.SupportStreamOptions)
- }
- // Responses usage info (non-sensitive)
- if info.ResponsesUsageInfo != nil && len(info.ResponsesUsageInfo.BuiltInTools) > 0 {
- fmt.Fprintf(b, "ResponsesTools{ ")
- first := true
- for name, tool := range info.ResponsesUsageInfo.BuiltInTools {
- if !first {
- fmt.Fprintf(b, ", ")
- }
- first = false
- if tool != nil {
- fmt.Fprintf(b, "%s: calls=%d", name, tool.CallCount)
- } else {
- fmt.Fprintf(b, "%s: calls=0", name)
- }
- }
- fmt.Fprintf(b, " }, ")
- }
- fmt.Fprintf(b, "}")
- return b.String()
- }
- // 定义支持流式选项的通道类型
- var streamSupportedChannels = map[int]bool{
- constant.ChannelTypeOpenAI: true,
- constant.ChannelTypeAnthropic: true,
- constant.ChannelTypeAws: true,
- constant.ChannelTypeGemini: true,
- constant.ChannelCloudflare: true,
- constant.ChannelTypeAzure: true,
- constant.ChannelTypeVolcEngine: true,
- constant.ChannelTypeOllama: true,
- constant.ChannelTypeXai: true,
- constant.ChannelTypeDeepSeek: true,
- constant.ChannelTypeBaiduV2: true,
- constant.ChannelTypeZhipu_v4: true,
- constant.ChannelTypeAli: true,
- constant.ChannelTypeSubmodel: true,
- constant.ChannelTypeCodex: true,
- constant.ChannelTypeMoonshot: true,
- constant.ChannelTypeMiniMax: true,
- constant.ChannelTypeSiliconFlow: true,
- }
- func GenRelayInfoWs(c *gin.Context, ws *websocket.Conn) *RelayInfo {
- info := genBaseRelayInfo(c, nil)
- info.RelayFormat = types.RelayFormatOpenAIRealtime
- info.ClientWs = ws
- info.InputAudioFormat = "pcm16"
- info.OutputAudioFormat = "pcm16"
- info.IsFirstRequest = true
- return info
- }
- func GenRelayInfoClaude(c *gin.Context, request dto.Request) *RelayInfo {
- info := genBaseRelayInfo(c, request)
- info.RelayFormat = types.RelayFormatClaude
- info.ShouldIncludeUsage = false
- info.ClaudeConvertInfo = &ClaudeConvertInfo{
- LastMessagesType: LastMessageTypeNone,
- }
- info.IsClaudeBetaQuery = c.Query("beta") == "true" || isClaudeBetaForced(c)
- return info
- }
- func isClaudeBetaForced(c *gin.Context) bool {
- channelOtherSettings, ok := common.GetContextKeyType[dto.ChannelOtherSettings](c, constant.ContextKeyChannelOtherSetting)
- return ok && channelOtherSettings.ClaudeBetaQuery
- }
- func GenRelayInfoRerank(c *gin.Context, request *dto.RerankRequest) *RelayInfo {
- info := genBaseRelayInfo(c, request)
- info.RelayMode = relayconstant.RelayModeRerank
- info.RelayFormat = types.RelayFormatRerank
- info.RerankerInfo = &RerankerInfo{
- Documents: request.Documents,
- ReturnDocuments: request.GetReturnDocuments(),
- }
- return info
- }
- func GenRelayInfoOpenAIAudio(c *gin.Context, request dto.Request) *RelayInfo {
- info := genBaseRelayInfo(c, request)
- info.RelayFormat = types.RelayFormatOpenAIAudio
- return info
- }
- func GenRelayInfoEmbedding(c *gin.Context, request dto.Request) *RelayInfo {
- info := genBaseRelayInfo(c, request)
- info.RelayFormat = types.RelayFormatEmbedding
- return info
- }
- func GenRelayInfoResponses(c *gin.Context, request *dto.OpenAIResponsesRequest) *RelayInfo {
- info := genBaseRelayInfo(c, request)
- info.RelayMode = relayconstant.RelayModeResponses
- info.RelayFormat = types.RelayFormatOpenAIResponses
- info.ResponsesUsageInfo = &ResponsesUsageInfo{
- BuiltInTools: make(map[string]*BuildInToolInfo),
- }
- if len(request.Tools) > 0 {
- for _, tool := range request.GetToolsMap() {
- toolType := common.Interface2String(tool["type"])
- info.ResponsesUsageInfo.BuiltInTools[toolType] = &BuildInToolInfo{
- ToolName: toolType,
- CallCount: 0,
- }
- switch toolType {
- case dto.BuildInToolWebSearchPreview:
- searchContextSize := common.Interface2String(tool["search_context_size"])
- if searchContextSize == "" {
- searchContextSize = "medium"
- }
- info.ResponsesUsageInfo.BuiltInTools[toolType].SearchContextSize = searchContextSize
- }
- }
- }
- return info
- }
- func GenRelayInfoGemini(c *gin.Context, request dto.Request) *RelayInfo {
- info := genBaseRelayInfo(c, request)
- info.RelayFormat = types.RelayFormatGemini
- info.ShouldIncludeUsage = false
- return info
- }
- func GenRelayInfoImage(c *gin.Context, request dto.Request) *RelayInfo {
- info := genBaseRelayInfo(c, request)
- info.RelayFormat = types.RelayFormatOpenAIImage
- return info
- }
- func GenRelayInfoOpenAI(c *gin.Context, request dto.Request) *RelayInfo {
- info := genBaseRelayInfo(c, request)
- info.RelayFormat = types.RelayFormatOpenAI
- return info
- }
- func genBaseRelayInfo(c *gin.Context, request dto.Request) *RelayInfo {
- //channelType := common.GetContextKeyInt(c, constant.ContextKeyChannelType)
- //channelId := common.GetContextKeyInt(c, constant.ContextKeyChannelId)
- //paramOverride := common.GetContextKeyStringMap(c, constant.ContextKeyChannelParamOverride)
- tokenGroup := common.GetContextKeyString(c, constant.ContextKeyTokenGroup)
- // 当令牌分组为空时,表示使用用户分组
- if tokenGroup == "" {
- tokenGroup = common.GetContextKeyString(c, constant.ContextKeyUserGroup)
- }
- startTime := common.GetContextKeyTime(c, constant.ContextKeyRequestStartTime)
- if startTime.IsZero() {
- startTime = time.Now()
- }
- isStream := false
- if request != nil {
- isStream = request.IsStream(c)
- }
- // firstResponseTime = time.Now() - 1 second
- reqId := common.GetContextKeyString(c, common.RequestIdKey)
- if reqId == "" {
- reqId = common.GetTimeString() + common.GetRandomString(8)
- }
- info := &RelayInfo{
- Request: request,
- RequestId: reqId,
- UserId: common.GetContextKeyInt(c, constant.ContextKeyUserId),
- UsingGroup: common.GetContextKeyString(c, constant.ContextKeyUsingGroup),
- UserGroup: common.GetContextKeyString(c, constant.ContextKeyUserGroup),
- UserQuota: common.GetContextKeyInt(c, constant.ContextKeyUserQuota),
- UserEmail: common.GetContextKeyString(c, constant.ContextKeyUserEmail),
- OriginModelName: common.GetContextKeyString(c, constant.ContextKeyOriginalModel),
- TokenId: common.GetContextKeyInt(c, constant.ContextKeyTokenId),
- TokenKey: common.GetContextKeyString(c, constant.ContextKeyTokenKey),
- TokenUnlimited: common.GetContextKeyBool(c, constant.ContextKeyTokenUnlimited),
- TokenGroup: tokenGroup,
- isFirstResponse: true,
- RelayMode: relayconstant.Path2RelayMode(c.Request.URL.Path),
- RequestURLPath: c.Request.URL.String(),
- IsStream: isStream,
- StartTime: startTime,
- FirstResponseTime: startTime.Add(-time.Second),
- ThinkingContentInfo: ThinkingContentInfo{
- IsFirstThinkingContent: true,
- SendLastThinkingContent: false,
- },
- TokenCountMeta: TokenCountMeta{
- //promptTokens: common.GetContextKeyInt(c, constant.ContextKeyPromptTokens),
- estimatePromptTokens: common.GetContextKeyInt(c, constant.ContextKeyEstimatedTokens),
- },
- }
- if info.RelayMode == relayconstant.RelayModeUnknown {
- info.RelayMode = c.GetInt("relay_mode")
- }
- if strings.HasPrefix(c.Request.URL.Path, "/pg") {
- info.IsPlayground = true
- info.RequestURLPath = strings.TrimPrefix(info.RequestURLPath, "/pg")
- info.RequestURLPath = "/v1" + info.RequestURLPath
- }
- userSetting, ok := common.GetContextKeyType[dto.UserSetting](c, constant.ContextKeyUserSetting)
- if ok {
- info.UserSetting = userSetting
- }
- return info
- }
- func GenRelayInfo(c *gin.Context, relayFormat types.RelayFormat, request dto.Request, ws *websocket.Conn) (*RelayInfo, error) {
- var info *RelayInfo
- var err error
- switch relayFormat {
- case types.RelayFormatOpenAI:
- info = GenRelayInfoOpenAI(c, request)
- case types.RelayFormatOpenAIAudio:
- info = GenRelayInfoOpenAIAudio(c, request)
- case types.RelayFormatOpenAIImage:
- info = GenRelayInfoImage(c, request)
- case types.RelayFormatOpenAIRealtime:
- info = GenRelayInfoWs(c, ws)
- case types.RelayFormatClaude:
- info = GenRelayInfoClaude(c, request)
- case types.RelayFormatRerank:
- if request, ok := request.(*dto.RerankRequest); ok {
- info = GenRelayInfoRerank(c, request)
- break
- }
- err = errors.New("request is not a RerankRequest")
- case types.RelayFormatGemini:
- info = GenRelayInfoGemini(c, request)
- case types.RelayFormatEmbedding:
- info = GenRelayInfoEmbedding(c, request)
- case types.RelayFormatOpenAIResponses:
- if request, ok := request.(*dto.OpenAIResponsesRequest); ok {
- info = GenRelayInfoResponses(c, request)
- break
- }
- err = errors.New("request is not a OpenAIResponsesRequest")
- case types.RelayFormatOpenAIResponsesCompaction:
- if request, ok := request.(*dto.OpenAIResponsesCompactionRequest); ok {
- return GenRelayInfoResponsesCompaction(c, request), nil
- }
- return nil, errors.New("request is not a OpenAIResponsesCompactionRequest")
- case types.RelayFormatTask:
- info = genBaseRelayInfo(c, nil)
- info.TaskRelayInfo = &TaskRelayInfo{}
- case types.RelayFormatMjProxy:
- info = genBaseRelayInfo(c, nil)
- info.TaskRelayInfo = &TaskRelayInfo{}
- default:
- err = errors.New("invalid relay format")
- }
- if err != nil {
- return nil, err
- }
- if info == nil {
- return nil, errors.New("failed to build relay info")
- }
- info.InitRequestConversionChain()
- return info, nil
- }
- func (info *RelayInfo) InitRequestConversionChain() {
- if info == nil {
- return
- }
- if len(info.RequestConversionChain) > 0 {
- return
- }
- if info.RelayFormat == "" {
- return
- }
- info.RequestConversionChain = []types.RelayFormat{info.RelayFormat}
- }
- func (info *RelayInfo) AppendRequestConversion(format types.RelayFormat) {
- if info == nil {
- return
- }
- if format == "" {
- return
- }
- if len(info.RequestConversionChain) == 0 {
- info.RequestConversionChain = []types.RelayFormat{format}
- return
- }
- last := info.RequestConversionChain[len(info.RequestConversionChain)-1]
- if last == format {
- return
- }
- info.RequestConversionChain = append(info.RequestConversionChain, format)
- }
- func (info *RelayInfo) GetFinalRequestRelayFormat() types.RelayFormat {
- if info == nil {
- return ""
- }
- if info.FinalRequestRelayFormat != "" {
- return info.FinalRequestRelayFormat
- }
- if n := len(info.RequestConversionChain); n > 0 {
- return info.RequestConversionChain[n-1]
- }
- return info.RelayFormat
- }
- func GenRelayInfoResponsesCompaction(c *gin.Context, request *dto.OpenAIResponsesCompactionRequest) *RelayInfo {
- info := genBaseRelayInfo(c, request)
- if info.RelayMode == relayconstant.RelayModeUnknown {
- info.RelayMode = relayconstant.RelayModeResponsesCompact
- }
- info.RelayFormat = types.RelayFormatOpenAIResponsesCompaction
- return info
- }
- //func (info *RelayInfo) SetPromptTokens(promptTokens int) {
- // info.promptTokens = promptTokens
- //}
- func (info *RelayInfo) SetEstimatePromptTokens(promptTokens int) {
- info.estimatePromptTokens = promptTokens
- }
- func (info *RelayInfo) GetEstimatePromptTokens() int {
- return info.estimatePromptTokens
- }
- func (info *RelayInfo) SetFirstResponseTime() {
- if info.isFirstResponse {
- info.FirstResponseTime = time.Now()
- info.isFirstResponse = false
- }
- }
- func (info *RelayInfo) HasSendResponse() bool {
- return info.FirstResponseTime.After(info.StartTime)
- }
// TaskRelayInfo carries the extra state used by task-style relays. It is
// attached to RelayInfo for the Task and MjProxy formats.
type TaskRelayInfo struct {
	Action       string
	OriginTaskID string
	// PublicTaskID is the public ID in task_xxxx format, pre-generated at
	// submission time, for DoResponse to use when answering the client
	// (this avoids exposing the real upstream ID).
	PublicTaskID string
	ConsumeQuota bool
	// LockedChannel holds the full channel object when the request is bound
	// to a specific channel (e.g., remix on the origin task's channel). It is
	// stored as any to avoid an import cycle with model; callers type-assert
	// to *model.Channel.
	LockedChannel any
}
// TaskSubmitReq is the JSON body of a task submission request. Its custom
// UnmarshalJSON accepts metadata either as a JSON object or as a string that
// contains a JSON object.
type TaskSubmitReq struct {
	Prompt         string         `json:"prompt"`
	Model          string         `json:"model,omitempty"`
	Mode           string         `json:"mode,omitempty"`
	Image          string         `json:"image,omitempty"`
	Images         []string       `json:"images,omitempty"`
	Size           string         `json:"size,omitempty"`
	Duration       int            `json:"duration,omitempty"`
	Seconds        string         `json:"seconds,omitempty"`
	InputReference string         `json:"input_reference,omitempty"`
	Metadata       map[string]any `json:"metadata,omitempty"`
}
- func (t *TaskSubmitReq) GetPrompt() string {
- return t.Prompt
- }
- func (t *TaskSubmitReq) HasImage() bool {
- return len(t.Images) > 0
- }
- func (t *TaskSubmitReq) UnmarshalJSON(data []byte) error {
- type Alias TaskSubmitReq
- aux := &struct {
- Metadata json.RawMessage `json:"metadata,omitempty"`
- *Alias
- }{
- Alias: (*Alias)(t),
- }
- if err := common.Unmarshal(data, &aux); err != nil {
- return err
- }
- if len(aux.Metadata) > 0 {
- var metadataStr string
- if err := common.Unmarshal(aux.Metadata, &metadataStr); err == nil && metadataStr != "" {
- var metadataObj map[string]interface{}
- if err := common.Unmarshal([]byte(metadataStr), &metadataObj); err == nil {
- t.Metadata = metadataObj
- return nil
- }
- }
- var metadataObj map[string]interface{}
- if err := common.Unmarshal(aux.Metadata, &metadataObj); err == nil {
- t.Metadata = metadataObj
- }
- }
- return nil
- }
- func (t *TaskSubmitReq) UnmarshalMetadata(v any) error {
- metadata := t.Metadata
- if metadata != nil {
- metadataBytes, err := common.Marshal(metadata)
- if err != nil {
- return fmt.Errorf("marshal metadata failed: %w", err)
- }
- err = common.Unmarshal(metadataBytes, v)
- if err != nil {
- return fmt.Errorf("unmarshal metadata to target failed: %w", err)
- }
- }
- return nil
- }
// TaskInfo is the JSON-serializable status of a task.
type TaskInfo struct {
	Code      int    `json:"code"`
	TaskID    string `json:"task_id"`
	Status    string `json:"status"`
	Reason    string `json:"reason,omitempty"`
	Url       string `json:"url,omitempty"`
	RemoteUrl string `json:"remote_url,omitempty"`
	Progress  string `json:"progress,omitempty"`
	// CompletionTokens is used for ratio-based billing.
	CompletionTokens int `json:"completion_tokens,omitempty"`
	// TotalTokens is used for ratio-based billing.
	TotalTokens int `json:"total_tokens,omitempty"`
}
- func FailTaskInfo(reason string) *TaskInfo {
- return &TaskInfo{
- Status: "FAILURE",
- Reason: reason,
- }
- }
- // RemoveDisabledFields 从请求 JSON 数据中移除渠道设置中禁用的字段
- // service_tier: 服务层级字段,可能导致额外计费(OpenAI、Claude、Responses API 支持)
- // store: 数据存储授权字段,涉及用户隐私(仅 OpenAI、Responses API 支持,默认允许透传,禁用后可能导致 Codex 无法使用)
- // safety_identifier: 安全标识符,用于向 OpenAI 报告违规用户(仅 OpenAI 支持,涉及用户隐私)
- func RemoveDisabledFields(jsonData []byte, channelOtherSettings dto.ChannelOtherSettings) ([]byte, error) {
- var data map[string]interface{}
- if err := common.Unmarshal(jsonData, &data); err != nil {
- common.SysError("RemoveDisabledFields Unmarshal error :" + err.Error())
- return jsonData, nil
- }
- // 默认移除 service_tier,除非明确允许(避免额外计费风险)
- if !channelOtherSettings.AllowServiceTier {
- if _, exists := data["service_tier"]; exists {
- delete(data, "service_tier")
- }
- }
- // 默认允许 store 透传,除非明确禁用(禁用可能影响 Codex 使用)
- if channelOtherSettings.DisableStore {
- if _, exists := data["store"]; exists {
- delete(data, "store")
- }
- }
- // 默认移除 safety_identifier,除非明确允许(保护用户隐私,避免向 OpenAI 报告用户信息)
- if !channelOtherSettings.AllowSafetyIdentifier {
- if _, exists := data["safety_identifier"]; exists {
- delete(data, "safety_identifier")
- }
- }
- jsonDataAfter, err := common.Marshal(data)
- if err != nil {
- common.SysError("RemoveDisabledFields Marshal error :" + err.Error())
- return jsonData, nil
- }
- return jsonDataAfter, nil
- }
- // RemoveGeminiDisabledFields removes disabled fields from Gemini request JSON data
- // Currently supports removing functionResponse.id field which Vertex AI does not support
- func RemoveGeminiDisabledFields(jsonData []byte) ([]byte, error) {
- if !model_setting.GetGeminiSettings().RemoveFunctionResponseIdEnabled {
- return jsonData, nil
- }
- var data map[string]interface{}
- if err := common.Unmarshal(jsonData, &data); err != nil {
- common.SysError("RemoveGeminiDisabledFields Unmarshal error: " + err.Error())
- return jsonData, nil
- }
- // Process contents array
- // Handle both camelCase (functionResponse) and snake_case (function_response)
- if contents, ok := data["contents"].([]interface{}); ok {
- for _, content := range contents {
- if contentMap, ok := content.(map[string]interface{}); ok {
- if parts, ok := contentMap["parts"].([]interface{}); ok {
- for _, part := range parts {
- if partMap, ok := part.(map[string]interface{}); ok {
- // Check functionResponse (camelCase)
- if funcResp, ok := partMap["functionResponse"].(map[string]interface{}); ok {
- delete(funcResp, "id")
- }
- // Check function_response (snake_case)
- if funcResp, ok := partMap["function_response"].(map[string]interface{}); ok {
- delete(funcResp, "id")
- }
- }
- }
- }
- }
- }
- }
- jsonDataAfter, err := common.Marshal(data)
- if err != nil {
- common.SysError("RemoveGeminiDisabledFields Marshal error: " + err.Error())
- return jsonData, nil
- }
- return jsonDataAfter, nil
- }
|