diff --git a/relay/adaptor/openrouter/constants.go b/relay/adaptor/openrouter/constants.go index 3ad8ed55..b12fa65c 100644 --- a/relay/adaptor/openrouter/constants.go +++ b/relay/adaptor/openrouter/constants.go @@ -1,20 +1,235 @@ package openrouter var ModelList = []string{ - "openai/gpt-3.5-turbo", - "openai/chatgpt-4o-latest", - "openai/o1", - "openai/o1-preview", - "openai/o1-mini", - "openai/o3-mini", - "google/gemini-2.0-flash-001", - "google/gemini-2.0-flash-thinking-exp:free", - "google/gemini-2.0-flash-lite-preview-02-05:free", - "google/gemini-2.0-pro-exp-02-05:free", - "google/gemini-flash-1.5-8b", - "anthropic/claude-3.5-sonnet", + "01-ai/yi-large", + "aetherwiing/mn-starcannon-12b", + "ai21/jamba-1-5-large", + "ai21/jamba-1-5-mini", + "ai21/jamba-instruct", + "aion-labs/aion-1.0", + "aion-labs/aion-1.0-mini", + "aion-labs/aion-rp-llama-3.1-8b", + "allenai/llama-3.1-tulu-3-405b", + "alpindale/goliath-120b", + "alpindale/magnum-72b", + "amazon/nova-lite-v1", + "amazon/nova-micro-v1", + "amazon/nova-pro-v1", + "anthracite-org/magnum-v2-72b", + "anthracite-org/magnum-v4-72b", + "anthropic/claude-2", + "anthropic/claude-2.0", + "anthropic/claude-2.0:beta", + "anthropic/claude-2.1", + "anthropic/claude-2.1:beta", + "anthropic/claude-2:beta", + "anthropic/claude-3-haiku", + "anthropic/claude-3-haiku:beta", + "anthropic/claude-3-opus", + "anthropic/claude-3-opus:beta", + "anthropic/claude-3-sonnet", + "anthropic/claude-3-sonnet:beta", "anthropic/claude-3.5-haiku", - "deepseek/deepseek-r1:free", + "anthropic/claude-3.5-haiku-20241022", + "anthropic/claude-3.5-haiku-20241022:beta", + "anthropic/claude-3.5-haiku:beta", + "anthropic/claude-3.5-sonnet", + "anthropic/claude-3.5-sonnet-20240620", + "anthropic/claude-3.5-sonnet-20240620:beta", + "anthropic/claude-3.5-sonnet:beta", + "cognitivecomputations/dolphin-mixtral-8x22b", + "cognitivecomputations/dolphin-mixtral-8x7b", + "cohere/command", + "cohere/command-r", + "cohere/command-r-03-2024", + 
"cohere/command-r-08-2024", + "cohere/command-r-plus", + "cohere/command-r-plus-04-2024", + "cohere/command-r-plus-08-2024", + "cohere/command-r7b-12-2024", + "databricks/dbrx-instruct", + "deepseek/deepseek-chat", + "deepseek/deepseek-chat-v2.5", + "deepseek/deepseek-chat:free", "deepseek/deepseek-r1", + "deepseek/deepseek-r1-distill-llama-70b", + "deepseek/deepseek-r1-distill-llama-70b:free", + "deepseek/deepseek-r1-distill-llama-8b", + "deepseek/deepseek-r1-distill-qwen-1.5b", + "deepseek/deepseek-r1-distill-qwen-14b", + "deepseek/deepseek-r1-distill-qwen-32b", + "deepseek/deepseek-r1:free", + "eva-unit-01/eva-llama-3.33-70b", + "eva-unit-01/eva-qwen-2.5-32b", + "eva-unit-01/eva-qwen-2.5-72b", + "google/gemini-2.0-flash-001", + "google/gemini-2.0-flash-exp:free", + "google/gemini-2.0-flash-lite-preview-02-05:free", + "google/gemini-2.0-flash-thinking-exp-1219:free", + "google/gemini-2.0-flash-thinking-exp:free", + "google/gemini-2.0-pro-exp-02-05:free", + "google/gemini-exp-1206:free", + "google/gemini-flash-1.5", + "google/gemini-flash-1.5-8b", + "google/gemini-flash-1.5-8b-exp", + "google/gemini-pro", + "google/gemini-pro-1.5", + "google/gemini-pro-vision", + "google/gemma-2-27b-it", + "google/gemma-2-9b-it", + "google/gemma-2-9b-it:free", + "google/gemma-7b-it", + "google/learnlm-1.5-pro-experimental:free", + "google/palm-2-chat-bison", + "google/palm-2-chat-bison-32k", + "google/palm-2-codechat-bison", + "google/palm-2-codechat-bison-32k", + "gryphe/mythomax-l2-13b", + "gryphe/mythomax-l2-13b:free", + "huggingfaceh4/zephyr-7b-beta:free", + "infermatic/mn-inferor-12b", + "inflection/inflection-3-pi", + "inflection/inflection-3-productivity", + "jondurbin/airoboros-l2-70b", + "liquid/lfm-3b", + "liquid/lfm-40b", + "liquid/lfm-7b", + "mancer/weaver", + "meta-llama/llama-2-13b-chat", + "meta-llama/llama-2-70b-chat", + "meta-llama/llama-3-70b-instruct", + "meta-llama/llama-3-8b-instruct", + "meta-llama/llama-3-8b-instruct:free", + "meta-llama/llama-3.1-405b", + 
"meta-llama/llama-3.1-405b-instruct", + "meta-llama/llama-3.1-70b-instruct", + "meta-llama/llama-3.1-8b-instruct", + "meta-llama/llama-3.2-11b-vision-instruct", + "meta-llama/llama-3.2-11b-vision-instruct:free", + "meta-llama/llama-3.2-1b-instruct", + "meta-llama/llama-3.2-3b-instruct", + "meta-llama/llama-3.2-90b-vision-instruct", + "meta-llama/llama-3.3-70b-instruct", + "meta-llama/llama-3.3-70b-instruct:free", + "meta-llama/llama-guard-2-8b", + "microsoft/phi-3-medium-128k-instruct", + "microsoft/phi-3-medium-128k-instruct:free", + "microsoft/phi-3-mini-128k-instruct", + "microsoft/phi-3-mini-128k-instruct:free", + "microsoft/phi-3.5-mini-128k-instruct", + "microsoft/phi-4", + "microsoft/wizardlm-2-7b", + "microsoft/wizardlm-2-8x22b", + "minimax/minimax-01", + "mistralai/codestral-2501", + "mistralai/codestral-mamba", + "mistralai/ministral-3b", + "mistralai/ministral-8b", + "mistralai/mistral-7b-instruct", + "mistralai/mistral-7b-instruct-v0.1", + "mistralai/mistral-7b-instruct-v0.3", + "mistralai/mistral-7b-instruct:free", + "mistralai/mistral-large", + "mistralai/mistral-large-2407", + "mistralai/mistral-large-2411", + "mistralai/mistral-medium", + "mistralai/mistral-nemo", + "mistralai/mistral-nemo:free", + "mistralai/mistral-small", + "mistralai/mistral-small-24b-instruct-2501", + "mistralai/mistral-small-24b-instruct-2501:free", + "mistralai/mistral-tiny", + "mistralai/mixtral-8x22b-instruct", + "mistralai/mixtral-8x7b", + "mistralai/mixtral-8x7b-instruct", + "mistralai/pixtral-12b", + "mistralai/pixtral-large-2411", + "neversleep/llama-3-lumimaid-70b", + "neversleep/llama-3-lumimaid-8b", + "neversleep/llama-3-lumimaid-8b:extended", + "neversleep/llama-3.1-lumimaid-70b", + "neversleep/llama-3.1-lumimaid-8b", + "neversleep/noromaid-20b", + "nothingiisreal/mn-celeste-12b", + "nousresearch/hermes-2-pro-llama-3-8b", + "nousresearch/hermes-3-llama-3.1-405b", + "nousresearch/hermes-3-llama-3.1-70b", + "nousresearch/nous-hermes-2-mixtral-8x7b-dpo", + 
"nousresearch/nous-hermes-llama2-13b", + "nvidia/llama-3.1-nemotron-70b-instruct", + "nvidia/llama-3.1-nemotron-70b-instruct:free", + "openai/chatgpt-4o-latest", + "openai/gpt-3.5-turbo", + "openai/gpt-3.5-turbo-0125", + "openai/gpt-3.5-turbo-0613", + "openai/gpt-3.5-turbo-1106", + "openai/gpt-3.5-turbo-16k", + "openai/gpt-3.5-turbo-instruct", + "openai/gpt-4", + "openai/gpt-4-0314", + "openai/gpt-4-1106-preview", + "openai/gpt-4-32k", + "openai/gpt-4-32k-0314", + "openai/gpt-4-turbo", + "openai/gpt-4-turbo-preview", + "openai/gpt-4o", + "openai/gpt-4o-2024-05-13", + "openai/gpt-4o-2024-08-06", + "openai/gpt-4o-2024-11-20", + "openai/gpt-4o-mini", + "openai/gpt-4o-mini-2024-07-18", + "openai/gpt-4o:extended", + "openai/o1", + "openai/o1-mini", + "openai/o1-mini-2024-09-12", + "openai/o1-preview", + "openai/o1-preview-2024-09-12", + "openai/o3-mini", + "openai/o3-mini-high", + "openchat/openchat-7b", + "openchat/openchat-7b:free", + "openrouter/auto", + "perplexity/llama-3.1-sonar-huge-128k-online", + "perplexity/llama-3.1-sonar-large-128k-chat", + "perplexity/llama-3.1-sonar-large-128k-online", + "perplexity/llama-3.1-sonar-small-128k-chat", + "perplexity/llama-3.1-sonar-small-128k-online", + "perplexity/sonar", + "perplexity/sonar-reasoning", + "pygmalionai/mythalion-13b", + "qwen/qvq-72b-preview", + "qwen/qwen-2-72b-instruct", + "qwen/qwen-2-7b-instruct", + "qwen/qwen-2-7b-instruct:free", + "qwen/qwen-2-vl-72b-instruct", + "qwen/qwen-2-vl-7b-instruct", + "qwen/qwen-2.5-72b-instruct", + "qwen/qwen-2.5-7b-instruct", + "qwen/qwen-2.5-coder-32b-instruct", + "qwen/qwen-max", + "qwen/qwen-plus", + "qwen/qwen-turbo", "qwen/qwen-vl-plus:free", + "qwen/qwen2.5-vl-72b-instruct:free", + "qwen/qwq-32b-preview", + "raifle/sorcererlm-8x22b", + "sao10k/fimbulvetr-11b-v2", + "sao10k/l3-euryale-70b", + "sao10k/l3-lunaris-8b", + "sao10k/l3.1-70b-hanami-x1", + "sao10k/l3.1-euryale-70b", + "sao10k/l3.3-euryale-70b", + "sophosympatheia/midnight-rose-70b", + 
"sophosympatheia/rogue-rose-103b-v0.2:free", + "teknium/openhermes-2.5-mistral-7b", + "thedrummer/rocinante-12b", + "thedrummer/unslopnemo-12b", + "undi95/remm-slerp-l2-13b", + "undi95/toppy-m-7b", + "undi95/toppy-m-7b:free", + "x-ai/grok-2-1212", + "x-ai/grok-2-vision-1212", + "x-ai/grok-beta", + "x-ai/grok-vision-beta", + "xwin-lm/xwin-lm-70b", } diff --git a/relay/billing/ratio/model.go b/relay/billing/ratio/model.go index 4a4bbdb0..e8b3b615 100644 --- a/relay/billing/ratio/model.go +++ b/relay/billing/ratio/model.go @@ -59,6 +59,8 @@ var ModelRatio = map[string]float64{ "o1-preview-2024-09-12": 7.5, "o1-mini": 1.5, // $3.00 / 1M input tokens "o1-mini-2024-09-12": 1.5, + "o3-mini": 0.55, // $1.10 / 1M input tokens + "o3-mini-2025-01-31": 0.55, "davinci-002": 1, // $0.002 / 1K tokens "babbage-002": 0.2, // $0.0004 / 1K tokens "text-ada-001": 0.2, @@ -385,6 +387,238 @@ var ModelRatio = map[string]float64{ "mistralai/mistral-7b-instruct-v0.2": 0.050 * USD, "mistralai/mistral-7b-v0.1": 0.050 * USD, "mistralai/mixtral-8x7b-instruct-v0.1": 0.300 * USD, + // https://openrouter.ai/models + "01-ai/yi-large": 1.5, + "aetherwiing/mn-starcannon-12b": 0.6, + "ai21/jamba-1-5-large": 4.0, + "ai21/jamba-1-5-mini": 0.2, + "ai21/jamba-instruct": 0.35, + "aion-labs/aion-1.0": 6.0, + "aion-labs/aion-1.0-mini": 1.2, + "aion-labs/aion-rp-llama-3.1-8b": 0.1, + "allenai/llama-3.1-tulu-3-405b": 5.0, + "alpindale/goliath-120b": 4.6875, + "alpindale/magnum-72b": 1.125, + "amazon/nova-lite-v1": 0.12, + "amazon/nova-micro-v1": 0.07, + "amazon/nova-pro-v1": 1.6, + "anthracite-org/magnum-v2-72b": 1.5, + "anthracite-org/magnum-v4-72b": 1.125, + "anthropic/claude-2": 12.0, + "anthropic/claude-2.0": 12.0, + "anthropic/claude-2.0:beta": 12.0, + "anthropic/claude-2.1": 12.0, + "anthropic/claude-2.1:beta": 12.0, + "anthropic/claude-2:beta": 12.0, + "anthropic/claude-3-haiku": 0.625, + "anthropic/claude-3-haiku:beta": 0.625, + "anthropic/claude-3-opus": 37.5, + "anthropic/claude-3-opus:beta": 37.5, +
"anthropic/claude-3-sonnet": 7.5, + "anthropic/claude-3-sonnet:beta": 7.5, + "anthropic/claude-3.5-haiku": 2.0, + "anthropic/claude-3.5-haiku-20241022": 2.0, + "anthropic/claude-3.5-haiku-20241022:beta": 2.0, + "anthropic/claude-3.5-haiku:beta": 2.0, + "anthropic/claude-3.5-sonnet": 7.5, + "anthropic/claude-3.5-sonnet-20240620": 7.5, + "anthropic/claude-3.5-sonnet-20240620:beta": 7.5, + "anthropic/claude-3.5-sonnet:beta": 7.5, + "cognitivecomputations/dolphin-mixtral-8x22b": 0.45, + "cognitivecomputations/dolphin-mixtral-8x7b": 0.25, + "cohere/command": 0.95, + "cohere/command-r": 0.7125, + "cohere/command-r-03-2024": 0.7125, + "cohere/command-r-08-2024": 0.285, + "cohere/command-r-plus": 7.125, + "cohere/command-r-plus-04-2024": 7.125, + "cohere/command-r-plus-08-2024": 4.75, + "cohere/command-r7b-12-2024": 0.075, + "databricks/dbrx-instruct": 0.6, + "deepseek/deepseek-chat": 0.445, + "deepseek/deepseek-chat-v2.5": 1.0, + "deepseek/deepseek-chat:free": 0.0, + "deepseek/deepseek-r1": 1.2, + "deepseek/deepseek-r1-distill-llama-70b": 0.345, + "deepseek/deepseek-r1-distill-llama-70b:free": 0.0, + "deepseek/deepseek-r1-distill-llama-8b": 0.02, + "deepseek/deepseek-r1-distill-qwen-1.5b": 0.09, + "deepseek/deepseek-r1-distill-qwen-14b": 0.075, + "deepseek/deepseek-r1-distill-qwen-32b": 0.09, + "deepseek/deepseek-r1:free": 0.0, + "eva-unit-01/eva-llama-3.33-70b": 3.0, + "eva-unit-01/eva-qwen-2.5-32b": 1.7, + "eva-unit-01/eva-qwen-2.5-72b": 3.0, + "google/gemini-2.0-flash-001": 0.2, + "google/gemini-2.0-flash-exp:free": 0.0, + "google/gemini-2.0-flash-lite-preview-02-05:free": 0.0, + "google/gemini-2.0-flash-thinking-exp-1219:free": 0.0, + "google/gemini-2.0-flash-thinking-exp:free": 0.0, + "google/gemini-2.0-pro-exp-02-05:free": 0.0, + "google/gemini-exp-1206:free": 0.0, + "google/gemini-flash-1.5": 0.15, + "google/gemini-flash-1.5-8b": 0.075, + "google/gemini-flash-1.5-8b-exp": 0.0, + "google/gemini-pro": 0.75, + "google/gemini-pro-1.5": 2.5, + 
"google/gemini-pro-vision": 0.75, + "google/gemma-2-27b-it": 0.135, + "google/gemma-2-9b-it": 0.03, + "google/gemma-2-9b-it:free": 0.0, + "google/gemma-7b-it": 0.075, + "google/learnlm-1.5-pro-experimental:free": 0.0, + "google/palm-2-chat-bison": 1.0, + "google/palm-2-chat-bison-32k": 1.0, + "google/palm-2-codechat-bison": 1.0, + "google/palm-2-codechat-bison-32k": 1.0, + "gryphe/mythomax-l2-13b": 0.0325, + "gryphe/mythomax-l2-13b:free": 0.0, + "huggingfaceh4/zephyr-7b-beta:free": 0.0, + "infermatic/mn-inferor-12b": 0.6, + "inflection/inflection-3-pi": 5.0, + "inflection/inflection-3-productivity": 5.0, + "jondurbin/airoboros-l2-70b": 0.25, + "liquid/lfm-3b": 0.01, + "liquid/lfm-40b": 0.075, + "liquid/lfm-7b": 0.005, + "mancer/weaver": 1.125, + "meta-llama/llama-2-13b-chat": 0.11, + "meta-llama/llama-2-70b-chat": 0.45, + "meta-llama/llama-3-70b-instruct": 0.2, + "meta-llama/llama-3-8b-instruct": 0.03, + "meta-llama/llama-3-8b-instruct:free": 0.0, + "meta-llama/llama-3.1-405b": 1.0, + "meta-llama/llama-3.1-405b-instruct": 0.4, + "meta-llama/llama-3.1-70b-instruct": 0.15, + "meta-llama/llama-3.1-8b-instruct": 0.025, + "meta-llama/llama-3.2-11b-vision-instruct": 0.0275, + "meta-llama/llama-3.2-11b-vision-instruct:free": 0.0, + "meta-llama/llama-3.2-1b-instruct": 0.005, + "meta-llama/llama-3.2-3b-instruct": 0.0125, + "meta-llama/llama-3.2-90b-vision-instruct": 0.8, + "meta-llama/llama-3.3-70b-instruct": 0.15, + "meta-llama/llama-3.3-70b-instruct:free": 0.0, + "meta-llama/llama-guard-2-8b": 0.1, + "microsoft/phi-3-medium-128k-instruct": 0.5, + "microsoft/phi-3-medium-128k-instruct:free": 0.0, + "microsoft/phi-3-mini-128k-instruct": 0.05, + "microsoft/phi-3-mini-128k-instruct:free": 0.0, + "microsoft/phi-3.5-mini-128k-instruct": 0.05, + "microsoft/phi-4": 0.07, + "microsoft/wizardlm-2-7b": 0.035, + "microsoft/wizardlm-2-8x22b": 0.25, + "minimax/minimax-01": 0.55, + "mistralai/codestral-2501": 0.45, + "mistralai/codestral-mamba": 0.125, + "mistralai/ministral-3b": 0.02, 
+ "mistralai/ministral-8b": 0.05, + "mistralai/mistral-7b-instruct": 0.0275, + "mistralai/mistral-7b-instruct-v0.1": 0.1, + "mistralai/mistral-7b-instruct-v0.3": 0.0275, + "mistralai/mistral-7b-instruct:free": 0.0, + "mistralai/mistral-large": 3.0, + "mistralai/mistral-large-2407": 3.0, + "mistralai/mistral-large-2411": 3.0, + "mistralai/mistral-medium": 4.05, + "mistralai/mistral-nemo": 0.04, + "mistralai/mistral-nemo:free": 0.0, + "mistralai/mistral-small": 0.3, + "mistralai/mistral-small-24b-instruct-2501": 0.07, + "mistralai/mistral-small-24b-instruct-2501:free": 0.0, + "mistralai/mistral-tiny": 0.125, + "mistralai/mixtral-8x22b-instruct": 0.45, + "mistralai/mixtral-8x7b": 0.3, + "mistralai/mixtral-8x7b-instruct": 0.12, + "mistralai/pixtral-12b": 0.05, + "mistralai/pixtral-large-2411": 3.0, + "neversleep/llama-3-lumimaid-70b": 2.25, + "neversleep/llama-3-lumimaid-8b": 0.5625, + "neversleep/llama-3-lumimaid-8b:extended": 0.5625, + "neversleep/llama-3.1-lumimaid-70b": 2.25, + "neversleep/llama-3.1-lumimaid-8b": 0.5625, + "neversleep/noromaid-20b": 1.125, + "nothingiisreal/mn-celeste-12b": 0.6, + "nousresearch/hermes-2-pro-llama-3-8b": 0.02, + "nousresearch/hermes-3-llama-3.1-405b": 0.4, + "nousresearch/hermes-3-llama-3.1-70b": 0.15, + "nousresearch/nous-hermes-2-mixtral-8x7b-dpo": 0.3, + "nousresearch/nous-hermes-llama2-13b": 0.085, + "nvidia/llama-3.1-nemotron-70b-instruct": 0.15, + "nvidia/llama-3.1-nemotron-70b-instruct:free": 0.0, + "openai/chatgpt-4o-latest": 7.5, + "openai/gpt-3.5-turbo": 0.75, + "openai/gpt-3.5-turbo-0125": 0.75, + "openai/gpt-3.5-turbo-0613": 1.0, + "openai/gpt-3.5-turbo-1106": 1.0, + "openai/gpt-3.5-turbo-16k": 2.0, + "openai/gpt-3.5-turbo-instruct": 1.0, + "openai/gpt-4": 30.0, + "openai/gpt-4-0314": 30.0, + "openai/gpt-4-1106-preview": 15.0, + "openai/gpt-4-32k": 60.0, + "openai/gpt-4-32k-0314": 60.0, + "openai/gpt-4-turbo": 15.0, + "openai/gpt-4-turbo-preview": 15.0, + "openai/gpt-4o": 5.0, + "openai/gpt-4o-2024-05-13": 7.5, + 
"openai/gpt-4o-2024-08-06": 5.0, + "openai/gpt-4o-2024-11-20": 5.0, + "openai/gpt-4o-mini": 0.3, + "openai/gpt-4o-mini-2024-07-18": 0.3, + "openai/gpt-4o:extended": 9.0, + "openai/o1": 30.0, + "openai/o1-mini": 2.2, + "openai/o1-mini-2024-09-12": 2.2, + "openai/o1-preview": 30.0, + "openai/o1-preview-2024-09-12": 30.0, + "openai/o3-mini": 2.2, + "openai/o3-mini-high": 2.2, + "openchat/openchat-7b": 0.0275, + "openchat/openchat-7b:free": 0.0, + "openrouter/auto": -500000.0, // NOTE(review): the only negative ratio among the entries added here; presumably a -1 "price varies by routed model" placeholder that was scaled by the generator. Confirm how billing treats a negative ratio before relying on it.
+ "perplexity/llama-3.1-sonar-huge-128k-online": 2.5, + "perplexity/llama-3.1-sonar-large-128k-chat": 0.5, + "perplexity/llama-3.1-sonar-large-128k-online": 0.5, + "perplexity/llama-3.1-sonar-small-128k-chat": 0.1, + "perplexity/llama-3.1-sonar-small-128k-online": 0.1, + "perplexity/sonar": 0.5, + "perplexity/sonar-reasoning": 2.5, + "pygmalionai/mythalion-13b": 0.6, + "qwen/qvq-72b-preview": 0.25, + "qwen/qwen-2-72b-instruct": 0.45, + "qwen/qwen-2-7b-instruct": 0.027, + "qwen/qwen-2-7b-instruct:free": 0.0, + "qwen/qwen-2-vl-72b-instruct": 0.2, + "qwen/qwen-2-vl-7b-instruct": 0.05, + "qwen/qwen-2.5-72b-instruct": 0.2, + "qwen/qwen-2.5-7b-instruct": 0.025, + "qwen/qwen-2.5-coder-32b-instruct": 0.08, + "qwen/qwen-max": 3.2, + "qwen/qwen-plus": 0.6, + "qwen/qwen-turbo": 0.1, + "qwen/qwen-vl-plus:free": 0.0, + "qwen/qwen2.5-vl-72b-instruct:free": 0.0, + "qwen/qwq-32b-preview": 0.09, + "raifle/sorcererlm-8x22b": 2.25, + "sao10k/fimbulvetr-11b-v2": 0.6, + "sao10k/l3-euryale-70b": 0.4, + "sao10k/l3-lunaris-8b": 0.03, + "sao10k/l3.1-70b-hanami-x1": 1.5, + "sao10k/l3.1-euryale-70b": 0.4, + "sao10k/l3.3-euryale-70b": 0.4, + "sophosympatheia/midnight-rose-70b": 0.4, + "sophosympatheia/rogue-rose-103b-v0.2:free": 0.0, + "teknium/openhermes-2.5-mistral-7b": 0.085, + "thedrummer/rocinante-12b": 0.25, + "thedrummer/unslopnemo-12b": 0.25, + "undi95/remm-slerp-l2-13b": 0.6, + "undi95/toppy-m-7b": 0.035, + "undi95/toppy-m-7b:free": 0.0, + "x-ai/grok-2-1212": 5.0, + "x-ai/grok-2-vision-1212": 5.0, +
"x-ai/grok-beta": 7.5, + "x-ai/grok-vision-beta": 7.5, + "xwin-lm/xwin-lm-70b": 1.875, } var CompletionRatio = map[string]float64{