fix: 修复高并发下，高额度用户使用低额度令牌没有预扣费的问题

2026-04-28 01:34:25 +08:00 · 2024-01-10 14:23:23 +08:00
parent 042d55cfd3
commit a3b726dd82
2 changed files with 20 additions and 4 deletions
--- a/controller/relay-text.go
+++ b/controller/relay-text.go
@@ -52,6 +52,7 @@ func relayTextHelper(c *gin.Context, relayMode int) *OpenAIErrorWithStatusCode {
 	tokenId := c.GetInt("token_id")
 	userId := c.GetInt("id")
 	group := c.GetString("group")
 	tokenQuota := c.GetInt("token_quota")
 	startTime := time.Now()
 	var textRequest GeneralOpenAIRequest
@@ -261,10 +262,20 @@ func relayTextHelper(c *gin.Context, relayMode int) *OpenAIErrorWithStatusCode {
 		return errorWrapper(err, "decrease_user_quota_failed", http.StatusInternalServerError)
 	}
 	if userQuota > 100*preConsumedQuota {
-		// in this case, we do not pre-consume quota
+		// 用户额度充足，判断令牌额度是否充足
-		// because the user has enough quota
+		if tokenQuota != -1 {
-		preConsumedQuota = 0
+			// 非无限令牌，判断令牌额度是否充足
-		common.LogInfo(c.Request.Context(), fmt.Sprintf("user %d has enough quota %d, trusted and no need to pre-consume", userId, userQuota))
+			if tokenQuota > 100*preConsumedQuota {
 				// 令牌额度充足，信任令牌
 				preConsumedQuota = 0
 				common.LogInfo(c.Request.Context(), fmt.Sprintf("user %d quota %d and token %d quota %d are enough, trusted and no need to pre-consume", userId, userQuota, tokenId, tokenQuota))
 			}
 		} else {
 			// in this case, we do not pre-consume quota
 			// because the user has enough quota
 			preConsumedQuota = 0
 			common.LogInfo(c.Request.Context(), fmt.Sprintf("user %d with unlimited token has enough quota %d, trusted and no need to pre-consume", userId, userQuota))
 		}
 	}
 	if preConsumedQuota > 0 {
 		userQuota, err = model.PreConsumeTokenQuota(tokenId, preConsumedQuota)
--- a/middleware/auth.go
+++ b/middleware/auth.go
@@ -115,6 +115,11 @@ func TokenAuth() func(c *gin.Context) {
 		c.Set("id", token.UserId)
 		c.Set("token_id", token.Id)
 		c.Set("token_name", token.Name)
 		if !token.UnlimitedQuota {
 			c.Set("token_quota", token.RemainQuota)
 		} else {
 			c.Set("token_quota", -1)
 		}
 		if token.ModelLimitsEnabled {
 			c.Set("token_model_limit_enabled", true)
 			c.Set("token_model_limit", token.GetModelLimitsMap())