|
@@ -264,10 +264,10 @@ func postConsumeQuota(ctx *gin.Context, relayInfo *relaycommon.RelayInfo, textRe
|
|
|
completionTokens := usage.CompletionTokens
|
|
completionTokens := usage.CompletionTokens
|
|
|
|
|
|
|
|
tokenName := ctx.GetString("token_name")
|
|
tokenName := ctx.GetString("token_name")
|
|
|
|
|
+ completionRatio := common.GetCompletionRatio(textRequest.Model)
|
|
|
|
|
|
|
|
quota := 0
|
|
quota := 0
|
|
|
if modelPrice == -1 {
|
|
if modelPrice == -1 {
|
|
|
- completionRatio := common.GetCompletionRatio(textRequest.Model)
|
|
|
|
|
quota = promptTokens + int(float64(completionTokens)*completionRatio)
|
|
quota = promptTokens + int(float64(completionTokens)*completionRatio)
|
|
|
quota = int(float64(quota) * ratio)
|
|
quota = int(float64(quota) * ratio)
|
|
|
if ratio != 0 && quota <= 0 {
|
|
if ratio != 0 && quota <= 0 {
|
|
@@ -279,7 +279,7 @@ func postConsumeQuota(ctx *gin.Context, relayInfo *relaycommon.RelayInfo, textRe
|
|
|
totalTokens := promptTokens + completionTokens
|
|
totalTokens := promptTokens + completionTokens
|
|
|
var logContent string
|
|
var logContent string
|
|
|
if modelPrice == -1 {
|
|
if modelPrice == -1 {
|
|
|
- logContent = fmt.Sprintf("模型倍率 %.2f,分组倍率 %.2f", modelRatio, groupRatio)
|
|
|
|
|
|
|
+ logContent = fmt.Sprintf("模型倍率 %.2f,分组倍率 %.2f,补全倍率 %.2f", modelRatio, groupRatio, completionRatio)
|
|
|
} else {
|
|
} else {
|
|
|
logContent = fmt.Sprintf("模型价格 %.2f,分组倍率 %.2f", modelPrice, groupRatio)
|
|
logContent = fmt.Sprintf("模型价格 %.2f,分组倍率 %.2f", modelPrice, groupRatio)
|
|
|
}
|
|
}
|