mirror of
https://github.com/songquanpeng/one-api.git
synced 2025-09-29 22:56:39 +08:00
259 lines
7.8 KiB
Go
259 lines
7.8 KiB
Go
package controller
|
|
|
|
import (
|
|
"bufio"
|
|
"bytes"
|
|
"context"
|
|
"encoding/json"
|
|
"errors"
|
|
"fmt"
|
|
"io"
|
|
"math"
|
|
"net/http"
|
|
"one-api/common"
|
|
"one-api/common/audio"
|
|
"one-api/model"
|
|
"one-api/relay/channel/openai"
|
|
"one-api/relay/constant"
|
|
"one-api/relay/util"
|
|
"os"
|
|
"strings"
|
|
|
|
"github.com/gin-gonic/gin"
|
|
)
|
|
|
|
// TokensPerSecond is the number of billing tokens charged for one second of
// audio.
//
// Pricing derivation: $0.006 / minute -> $0.002 / 20 seconds -> $0.002 / 1K
// tokens, i.e. 20 seconds of audio correspond to 1000 tokens.
const TokensPerSecond = 1000 / 20
|
|
|
|
func countAudioTokens(req *http.Request) (int, error) {
|
|
cloned := common.CloneRequest(req)
|
|
defer cloned.Body.Close()
|
|
file, header, err := cloned.FormFile("file")
|
|
if err != nil {
|
|
return 0, err
|
|
}
|
|
defer file.Close()
|
|
f, err := common.SaveTmpFile(header.Filename, file)
|
|
if err != nil {
|
|
return 0, err
|
|
}
|
|
defer os.Remove(f)
|
|
duration, err := audio.GetAudioDuration(cloned.Context(), f)
|
|
if err != nil {
|
|
return 0, err
|
|
}
|
|
return int(math.Ceil(duration)) * TokensPerSecond, nil
|
|
}
|
|
|
|
func RelayAudioHelper(c *gin.Context, relayMode int) *openai.ErrorWithStatusCode {
|
|
audioModel := "whisper-1"
|
|
|
|
tokenId := c.GetInt("token_id")
|
|
channelType := c.GetInt("channel")
|
|
channelId := c.GetInt("channel_id")
|
|
userId := c.GetInt("id")
|
|
group := c.GetString("group")
|
|
tokenName := c.GetString("token_name")
|
|
|
|
var inputTokens int
|
|
var ttsRequest openai.TextToSpeechRequest
|
|
modelRatio := common.GetModelRatio(audioModel)
|
|
groupRatio := common.GetGroupRatio(group)
|
|
ratio := modelRatio * groupRatio
|
|
var quota int
|
|
var preConsumedQuota int
|
|
switch relayMode {
|
|
case constant.RelayModeAudioSpeech:
|
|
// Read JSON
|
|
err := common.UnmarshalBodyReusable(c, &ttsRequest)
|
|
// Check if JSON is valid
|
|
if err != nil {
|
|
return openai.ErrorWrapper(err, "invalid_json", http.StatusBadRequest)
|
|
}
|
|
audioModel = ttsRequest.Model
|
|
// Check if text is too long 4096
|
|
if len(ttsRequest.Input) > 4096 {
|
|
return openai.ErrorWrapper(errors.New("input is too long (over 4096 characters)"), "text_too_long", http.StatusBadRequest)
|
|
}
|
|
inputTokens = len(ttsRequest.Input)
|
|
default:
|
|
// whisper-1 audio transcription
|
|
audioTokens, err := countAudioTokens(c.Request)
|
|
if err != nil {
|
|
return openai.ErrorWrapper(err, "get_audio_duration_failed", http.StatusInternalServerError)
|
|
}
|
|
inputTokens = audioTokens
|
|
}
|
|
preConsumedQuota = int(float64(inputTokens) * ratio)
|
|
quota = preConsumedQuota
|
|
userQuota, err := model.CacheGetUserQuota(userId)
|
|
if err != nil {
|
|
return openai.ErrorWrapper(err, "get_user_quota_failed", http.StatusInternalServerError)
|
|
}
|
|
|
|
// Check if user quota is enough
|
|
if userQuota-preConsumedQuota < 0 {
|
|
return openai.ErrorWrapper(errors.New("user quota is not enough"), "insufficient_user_quota", http.StatusForbidden)
|
|
}
|
|
err = model.CacheDecreaseUserQuota(userId, preConsumedQuota)
|
|
if err != nil {
|
|
return openai.ErrorWrapper(err, "decrease_user_quota_failed", http.StatusInternalServerError)
|
|
}
|
|
if userQuota > 100*preConsumedQuota {
|
|
// in this case, we do not pre-consume quota
|
|
// because the user has enough quota
|
|
preConsumedQuota = 0
|
|
}
|
|
if preConsumedQuota > 0 {
|
|
err := model.PreConsumeTokenQuota(tokenId, preConsumedQuota)
|
|
if err != nil {
|
|
return openai.ErrorWrapper(err, "pre_consume_token_quota_failed", http.StatusForbidden)
|
|
}
|
|
}
|
|
|
|
// map model name
|
|
modelMapping := c.GetString("model_mapping")
|
|
if modelMapping != "" {
|
|
modelMap := make(map[string]string)
|
|
err := json.Unmarshal([]byte(modelMapping), &modelMap)
|
|
if err != nil {
|
|
return openai.ErrorWrapper(err, "unmarshal_model_mapping_failed", http.StatusInternalServerError)
|
|
}
|
|
if modelMap[audioModel] != "" {
|
|
audioModel = modelMap[audioModel]
|
|
}
|
|
}
|
|
|
|
baseURL := common.ChannelBaseURLs[channelType]
|
|
requestURL := c.Request.URL.String()
|
|
if c.GetString("base_url") != "" {
|
|
baseURL = c.GetString("base_url")
|
|
}
|
|
|
|
fullRequestURL := util.GetFullRequestURL(baseURL, requestURL, channelType)
|
|
if relayMode == constant.RelayModeAudioTranscription && channelType == common.ChannelTypeAzure {
|
|
// https://learn.microsoft.com/en-us/azure/ai-services/openai/whisper-quickstart?tabs=command-line#rest-api
|
|
apiVersion := util.GetAPIVersion(c)
|
|
fullRequestURL = fmt.Sprintf("%s/openai/deployments/%s/audio/transcriptions?api-version=%s", baseURL, audioModel, apiVersion)
|
|
}
|
|
|
|
requestBody := &bytes.Buffer{}
|
|
_, err = io.Copy(requestBody, c.Request.Body)
|
|
if err != nil {
|
|
return openai.ErrorWrapper(err, "new_request_body_failed", http.StatusInternalServerError)
|
|
}
|
|
c.Request.Body = io.NopCloser(bytes.NewBuffer(requestBody.Bytes()))
|
|
|
|
req, err := http.NewRequest(c.Request.Method, fullRequestURL, requestBody)
|
|
if err != nil {
|
|
return openai.ErrorWrapper(err, "new_request_failed", http.StatusInternalServerError)
|
|
}
|
|
|
|
if relayMode == constant.RelayModeAudioTranscription && channelType == common.ChannelTypeAzure {
|
|
// https://learn.microsoft.com/en-us/azure/ai-services/openai/whisper-quickstart?tabs=command-line#rest-api
|
|
apiKey := c.Request.Header.Get("Authorization")
|
|
apiKey = strings.TrimPrefix(apiKey, "Bearer ")
|
|
req.Header.Set("api-key", apiKey)
|
|
req.ContentLength = c.Request.ContentLength
|
|
} else {
|
|
req.Header.Set("Authorization", c.Request.Header.Get("Authorization"))
|
|
}
|
|
req.Header.Set("Content-Type", c.Request.Header.Get("Content-Type"))
|
|
req.Header.Set("Accept", c.Request.Header.Get("Accept"))
|
|
|
|
resp, err := util.HTTPClient.Do(req)
|
|
if err != nil {
|
|
return openai.ErrorWrapper(err, "do_request_failed", http.StatusInternalServerError)
|
|
}
|
|
|
|
err = req.Body.Close()
|
|
if err != nil {
|
|
return openai.ErrorWrapper(err, "close_request_body_failed", http.StatusInternalServerError)
|
|
}
|
|
err = c.Request.Body.Close()
|
|
if err != nil {
|
|
return openai.ErrorWrapper(err, "close_request_body_failed", http.StatusInternalServerError)
|
|
}
|
|
|
|
if resp.StatusCode != http.StatusOK {
|
|
if preConsumedQuota > 0 {
|
|
// we need to roll back the pre-consumed quota
|
|
defer func(ctx context.Context) {
|
|
go func() {
|
|
// negative means add quota back for token & user
|
|
err := model.PostConsumeTokenQuota(tokenId, -preConsumedQuota)
|
|
if err != nil {
|
|
common.LogError(ctx, fmt.Sprintf("error rollback pre-consumed quota: %s", err.Error()))
|
|
}
|
|
}()
|
|
}(c.Request.Context())
|
|
}
|
|
return util.RelayErrorHandler(resp)
|
|
}
|
|
quotaDelta := quota - preConsumedQuota
|
|
defer func(ctx context.Context) {
|
|
go util.PostConsumeQuota(ctx, tokenId, quotaDelta, quota, userId, channelId, modelRatio, groupRatio, audioModel, tokenName)
|
|
}(c.Request.Context())
|
|
|
|
for k, v := range resp.Header {
|
|
c.Writer.Header().Set(k, v[0])
|
|
}
|
|
c.Writer.WriteHeader(resp.StatusCode)
|
|
|
|
_, err = io.Copy(c.Writer, resp.Body)
|
|
if err != nil {
|
|
return openai.ErrorWrapper(err, "copy_response_body_failed", http.StatusInternalServerError)
|
|
}
|
|
err = resp.Body.Close()
|
|
if err != nil {
|
|
return openai.ErrorWrapper(err, "close_response_body_failed", http.StatusInternalServerError)
|
|
}
|
|
return nil
|
|
}
|
|
|
|
func getTextFromVTT(body []byte) (string, error) {
|
|
return getTextFromSRT(body)
|
|
}
|
|
|
|
func getTextFromVerboseJSON(body []byte) (string, error) {
|
|
var whisperResponse openai.WhisperVerboseJSONResponse
|
|
if err := json.Unmarshal(body, &whisperResponse); err != nil {
|
|
return "", fmt.Errorf("unmarshal_response_body_failed err :%w", err)
|
|
}
|
|
return whisperResponse.Text, nil
|
|
}
|
|
|
|
// getTextFromSRT extracts the subtitle text from an SRT-style body.
//
// A line containing "-->" is treated as a cue's timing line. Every line after
// it, up to the next empty line or the end of input, is that cue's text, so
// cues spanning several lines are kept in full rather than cut off after the
// first line. Text lines are appended back to back with no separator. Lines
// outside a cue (for example cue index numbers) are ignored.
//
// It returns an empty string and the scanner's error if body cannot be split
// into lines.
func getTextFromSRT(body []byte) (string, error) {
	scanner := bufio.NewScanner(strings.NewReader(string(body)))
	var builder strings.Builder
	inCue := false
	for scanner.Scan() {
		line := scanner.Text()
		switch {
		case inCue && line == "":
			// An empty line ends the current cue.
			inCue = false
		case inCue:
			builder.WriteString(line)
		case strings.Contains(line, "-->"):
			inCue = true
		}
	}
	if err := scanner.Err(); err != nil {
		return "", err
	}
	return builder.String(), nil
}
|
|
|
|
// getTextFromText returns a plain-text response body as a string with at most
// one trailing newline removed. The error result is always nil.
func getTextFromText(body []byte) (string, error) {
	text := string(body)
	if strings.HasSuffix(text, "\n") {
		text = text[:len(text)-1]
	}
	return text, nil
}
|
|
|
|
func getTextFromJSON(body []byte) (string, error) {
|
|
var whisperResponse openai.WhisperJSONResponse
|
|
if err := json.Unmarshal(body, &whisperResponse); err != nil {
|
|
return "", fmt.Errorf("unmarshal_response_body_failed err :%w", err)
|
|
}
|
|
return whisperResponse.Text, nil
|
|
}
|