version: 1.2.1 cache: true registration: socialLogins: - "discord" - "facebook" - "github" - "google" - "openid" endpoints: custom: # APIpie # https://apipie.ai/dashboard/ # Script to fetch models: https://github.com/LibreChat-AI/librechat-config-yaml/blob/main/scripts/apipie.py - name: "APIpie" apiKey: "${APIPIE_API_KEY}" baseURL: "https://apipie.ai/v1/" models: default: - DeepSeek-V3 - Llama-2-13b-chat-hf - Llama-2-70b-chat-hf - Llama-2-70b-hf - Llama-2-7b-chat-hf - Llama-3-70b-chat-hf - Llama-3-8b-chat-hf - Llama-3.1-Nemotron-70B-Instruct-HF - Llama-3.2-11B-Vision-Instruct-Turbo - Llama-3.2-3B-Instruct-Turbo - Llama-3.2-90B-Vision-Instruct-Turbo - Llama-3.3-70B-Instruct-Turbo - Meta-Llama-3-70B-Instruct - Meta-Llama-3-70B-Instruct-Lite - Meta-Llama-3-70B-Instruct-Turbo - Meta-Llama-3-8B-Instruct - Meta-Llama-3-8B-Instruct-Lite - Meta-Llama-3-8B-Instruct-Turbo - Meta-Llama-3.1-70B-Instruct-Turbo - Meta-Llama-3.1-8B-Instruct-Turbo - Meta-Llama-3.1-8B-Instruct-Turbo-128K - Mistral-7B-Instruct-v0.1 - Mistral-7B-Instruct-v0.2 - Mistral-7B-Instruct-v0.3 - Mixtral-8x22B-Instruct-v0.1 - Mixtral-8x22B-v0.1 - Mixtral-8x7B-Instruct-v0.1 - Mixtral-8x7B-v0.1 - MythoMax-L2-13b - MythoMax-L2-13b-Lite - Nous-Hermes-2-Mixtral-8x7B-DPO - QwQ-32B-Preview - Qwen2.5-72B-Instruct-Turbo - Qwen2.5-7B-Instruct-Turbo - SOLAR-10.7B-Instruct-v1.0 - WizardLM-2-7B - WizardLM-2-8x22B - aion-1.0 - aion-1.0-mini - aion-rp-llama-3.1-8b - airoboros-70b - airoboros-l2-70b - amazon.nova-lite-v1:0 - amazon.nova-micro-v1:0 - amazon.nova-pro-v1:0 - chatgpt-4o-latest - chatx_cheap_128k - chatx_cheap_32k - chatx_cheap_4k - chatx_cheap_64k - chatx_cheap_8k - chatx_mids_4k - chatx_premium_128k - chatx_premium_32k - chatx_premium_4k - chatx_premium_8k - chronos-hermes-13b-v2 - claude-2 - claude-2.0 - claude-2.1 - claude-3-5-haiku - claude-3-5-haiku-20241022 - claude-3-5-haiku-20241022-v1 - claude-3-5-haiku-latest - claude-3-5-sonnet - claude-3-5-sonnet-20240620 - claude-3-5-sonnet-20240620-v1 - 
claude-3-5-sonnet-20241022 - claude-3-5-sonnet-20241022-v2 - claude-3-5-sonnet-latest - claude-3-7-sonnet-20250219 - claude-3-7-sonnet-20250219-v1 - claude-3-7-sonnet-latest - claude-3-haiku - claude-3-haiku-20240307 - claude-3-haiku-20240307-v1 - claude-3-opus - claude-3-opus-20240229 - claude-3-opus-20240229-v1 - claude-3-opus-latest - claude-3-sonnet - claude-3-sonnet-20240229 - claude-3-sonnet-20240229-v1 - claude-3.5-haiku - claude-3.5-haiku-20241022 - claude-3.5-sonnet - claude-3.5-sonnet-20240620 - claude-3.7-sonnet - claude2 - codestral-2501 - codestral-mamba - command - command-light - command-light-text-v14 - command-nightly - command-r - command-r-03-2024 - command-r-08-2024 - command-r-plus - command-r-plus-04-2024 - command-r-plus-08-2024 - command-r-plus-v1 - command-r-v1 - command-r7b-12-2024 - command-text-v14 - dbrx-instruct - deepseek-chat - deepseek-r1 - deepseek-r1-distill-llama-70b - deepseek-r1-distill-llama-8b - deepseek-r1-distill-qwen-1.5b - deepseek-r1-distill-qwen-14b - deepseek-r1-distill-qwen-32b - dolphin-2.6-mixtral-8x7b - dolphin-mixtral-8x22b - dolphin-mixtral-8x7b - dolphin3.0-mistral-24b - dolphin3.0-r1-mistral-24b - eva-llama-3.33-70b - eva-qwen-2.5-32b - eva-qwen-2.5-72b - fimbulvetr-11b-v2 - gemini-1.5-flash - gemini-1.5-flash-8b - gemini-1.5-flash-8b-latest - gemini-1.5-flash-latest - gemini-1.5-pro - gemini-1.5-pro-latest - gemini-2.0-flash - gemini-2.0-flash-001 - gemini-2.0-flash-lite-001 - gemini-2.0-flash-lite-preview-02-05 - gemini-2.0-flash-thinking-exp-1219 - gemini-2.0-pro-exp-02-05 - gemini-flash - gemini-flash-1.5 - gemini-flash-1.5-8b - gemini-pro - gemini-pro-1.5 - gemini-pro-vision - gemma-1.1-7b-it - gemma-2-27b-it - gemma-2-9b-it - gemma-2b-it - gemma-7b-it - general - goliath-120b - gpt-3.5 - gpt-3.5-turbo - gpt-3.5-turbo-0125 - gpt-3.5-turbo-0613 - gpt-3.5-turbo-1106 - gpt-3.5-turbo-16k - gpt-3.5-turbo-instruct - gpt-4 - gpt-4-0125-preview - gpt-4-0314 - gpt-4-0613 - gpt-4-1106-preview - 
gpt-4-1106-vision-preview - gpt-4-32k - gpt-4-32k-0314 - gpt-4-turbo - gpt-4-turbo-2024-04-09 - gpt-4-turbo-preview - gpt-4-vision-preview - gpt-4o - gpt-4o-2024-05-13 - gpt-4o-2024-08-06 - gpt-4o-2024-11-20 - gpt-4o-audio-preview-2024-10-01 - gpt-4o-audio-preview-2024-12-17 - gpt-4o-mini - gpt-4o-mini-2024-07-18 - gpt-4o-mini-audio-preview - gpt-4o-mini-audio-preview-2024-12-17 - grok-2-1212 - grok-2-vision-1212 - grok-beta - grok-vision-beta - hermes-2-pro-llama-3-8b - hermes-3-llama-3.1-405b - hermes-3-llama-3.1-70b - inflection-3-pi - j2-grande-instruct - j2-jumbo-instruct - j2-mid - j2-mid-v1 - j2-ultra - j2-ultra-v1 - jamba-1-5-large - jamba-1-5-large-v1 - jamba-1-5-mini - jamba-1-5-mini-v1 - jamba-instruct - jamba-instruct-v1 - l3-euryale-70b - l3-lunaris-8b - l3.1-70b-hanami-x1 - l3.1-euryale-70b - l3.3-euryale-70b - lfm-3b - lfm-40b - lfm-7b - llama-2-13b-chat - llama-2-70b-chat - llama-3-70b-instruct - llama-3-8b-instruct - llama-3-lumimaid-70b - llama-3-lumimaid-8b - llama-3-sonar-large-32k-chat - llama-3.1-405b - llama-3.1-405b-instruct - llama-3.1-70b-instruct - llama-3.1-8b-instruct - llama-3.1-lumimaid-70b - llama-3.1-lumimaid-8b - llama-3.1-nemotron-70b-instruct - llama-3.1-sonar-huge-128k-online - llama-3.1-sonar-large-128k-chat - llama-3.1-sonar-large-128k-online - llama-3.1-sonar-small-128k-chat - llama-3.1-sonar-small-128k-online - llama-3.1-tulu-3-405b - llama-3.2-11b-vision-instruct - llama-3.2-1b-instruct - llama-3.2-3b-instruct - llama-3.2-90b-vision-instruct - llama-3.3-70b-instruct - llama-guard-2-8b - llama-guard-3-8b - llama2-13b-chat-v1 - llama2-70b-chat-v1 - llama3-1 - llama3-1-405b-instruct-v1:0 - llama3-1-70b-instruct-v1 - llama3-1-70b-instruct-v1:0 - llama3-1-8b-instruct-v1 - llama3-1-8b-instruct-v1:0 - llama3-2 - llama3-2-11b-instruct-v1 - llama3-2-1b-instruct-v1 - llama3-2-3b-instruct-v1 - llama3-2-90b-instruct-v1 - llama3-3-70b-instruct-v1 - llama3-70b-instruct-v1 - llama3-8b-instruct-v1 - magnum-72b - magnum-v2-72b - 
magnum-v4-72b - meta-llama-3.1-8b-instruct - midnight-rose-70b - minimax-01 - ministral-3b - ministral-8b - mistral - mistral-7b-instruct - mistral-7b-instruct-v0 - mistral-7b-instruct-v0.1 - mistral-7b-instruct-v0.3 - mistral-large - mistral-large-2402-v1 - mistral-large-2407 - mistral-large-2411 - mistral-large-latest - mistral-medium - mistral-nemo - mistral-saba - mistral-small - mistral-small-2402-v1 - mistral-small-24b-instruct-2501 - mistral-small-latest - mistral-tiny - mixtral - mixtral-8x22b-instruct - mixtral-8x7b - mixtral-8x7b-instruct - mixtral-8x7b-instruct-v0 - mn-celeste-12b - mn-inferor-12b - mn-starcannon-12b - mythalion-13b - mythomax-l2-13b - nai-meta-v1 - noromaid-20b - nous-hermes-2-mixtral-8x7b-dpo - nous-hermes-2-vision-7b - nous-hermes-llama2-13b - nova-canvas-v1 - nova-lite-v1 - nova-micro-v1 - nova-pro-v1 - nova-reel-v1 - o1 - o1-2024-12-17 - o1-mini - o1-mini-2024-09-12 - o1-preview - o1-preview-2024-09-12 - o3-mini - o3-mini-2025-01-31 - o3-mini-high - olympus-premier-v1 - online-llama - openchat-7b - openchat_3.5 - openhermes-2.5-mistral-7b - palm-2-chat-bison - palm-2-chat-bison-32k - palm-2-codechat-bison - palm-2-codechat-bison-32k - phi-3-medium-128k-instruct - phi-3-mini-128k-instruct - phi-3.5-mini-128k-instruct - phi-4 - pixtral-12b - pixtral-large-2411 - pixtral-large-latest - qvq-72b-preview - qwen-2-72b-instruct - qwen-2-vl-72b-instruct - qwen-2-vl-7b-instruct - qwen-2.5-72b-instruct - qwen-2.5-7b-instruct - qwen-2.5-coder-32b-instruct - qwen-max - qwen-plus - qwen-turbo - qwen-vl-plus - qwen1-5 - qwen2 - qwen2.5-vl-72b-instruct - qwq-32b-preview - r1-1776 - remm-slerp-l2-13b - rocinante-12b - rogue-rose-103b-v0.2 - scb10x-llama3-typhoon-v1-5-8b-instruct - scb10x-llama3-typhoon-v1-5x-4f316 - sonar - sonar-reasoning - sorcererlm-8x22b - titan - titan-text-express-v1 - titan-text-lite-v1 - titan-text-premier-v1 - titan-tg1-large - toppy-m-7b - unslopnemo-12b - weaver - wizardlm-2-7b - wizardlm-2-8x22b - xwin-lm-70b - yi-large 
- yi-vision - zephyr-orpo-141b-A35b-v0.1 fetch: false titleConvo: true titleModel: "claude-3-haiku" summarize: false summaryModel: "claude-3-haiku" dropParams: - "stream" modelDisplayLabel: "APIpie" iconURL: "https://raw.githubusercontent.com/fuegovic/lc-config-yaml/main/icons/APIpie.png" # cohere # Model list: https://dashboard.cohere.com/playground/chat - name: "cohere" apiKey: "${COHERE_API_KEY}" baseURL: "https://api.cohere.ai/v1" models: default: - c4ai-aya-expanse-32b - command - command-light-nightly - command-r - command-r-08-2024 - command-r-plus - command-r-plus-08-2024 - command-r7b-12-2024 fetch: false modelDisplayLabel: "cohere" titleModel: "command" dropParams: - "stop" - "user" - "frequency_penalty" - "presence_penalty" - "temperature" - "top_p" # deepseek # https://platform.deepseek.com/api_keys # Model list: https://platform.deepseek.com/api-docs/pricing - name: "deepseek" apiKey: "${DEEPSEEK_API_KEY}" baseURL: "https://api.deepseek.com" models: default: - deepseek-chat - deepseek-reasoner fetch: false titleConvo: true titleModel: "deepseek-chat" summarize: false summaryModel: "deepseek-chat" modelDisplayLabel: "DeepSeek" # Fireworks.ai # Models: https://fireworks.ai/models?show=Serverless - name: "Fireworks" apiKey: "${FIREWORKS_API_KEY}" baseURL: "https://api.fireworks.ai/inference/v1" models: default: - accounts/fireworks/models/deepseek-r1 - accounts/fireworks/models/deepseek-v3 - accounts/fireworks/models/llama-guard-3-8b - accounts/fireworks/models/llama-v3-70b-instruct - accounts/fireworks/models/llama-v3-8b-instruct - accounts/fireworks/models/llama-v3-8b-instruct-hf - accounts/fireworks/models/llama-v3p1-405b-instruct - accounts/fireworks/models/llama-v3p1-405b-instruct-long - accounts/fireworks/models/llama-v3p1-70b-instruct - accounts/fireworks/models/llama-v3p1-8b-instruct - accounts/fireworks/models/llama-v3p2-11b-vision-instruct - accounts/fireworks/models/llama-v3p2-3b-instruct - 
accounts/fireworks/models/llama-v3p2-90b-vision-instruct - accounts/fireworks/models/llama-v3p3-70b-instruct - accounts/fireworks/models/mistral-small-24b-instruct-2501 - accounts/fireworks/models/mixtral-8x22b-instruct - accounts/fireworks/models/mixtral-8x7b-instruct - accounts/fireworks/models/mythomax-l2-13b - accounts/fireworks/models/phi-3-vision-128k-instruct - accounts/fireworks/models/qwen-qwq-32b-preview - accounts/fireworks/models/qwen2-vl-72b-instruct - accounts/fireworks/models/qwen2p5-72b-instruct - accounts/fireworks/models/qwen2p5-coder-32b-instruct - accounts/mels-e0299e/models/aiderlm-v0 - accounts/perplexity/models/r1-1776 - accounts/sentientfoundation/models/dobby-mini-leashed-llama-3-1-8b - accounts/sentientfoundation/models/dobby-mini-unhinged-llama-3-1-8b - accounts/sentientfoundation/models/dobby-unhinged-llama-3-3-70b-new - accounts/yi-01-ai/models/yi-large fetch: false titleConvo: true titleModel: "accounts/fireworks/models/llama-v2-7b-chat" summarize: false summaryModel: "accounts/fireworks/models/llama-v2-7b-chat" forcePrompt: false modelDisplayLabel: "Fireworks" dropParams: - "user" # GitHub - name: "Github Models" iconURL: https://github.githubassets.com/assets/GitHub-Mark-ea2971cee799.png apiKey: "${GITHUB_TOKEN}" baseURL: "https://models.inference.ai.azure.com" models: default: - AI21-Jamba-Instruct - Cohere-command-r - Cohere-command-r-plus - Cohere-embed-v3-english - Cohere-embed-v3-multilingual - Meta-Llama-3-70B-Instruct - Meta-Llama-3-8B-Instruct - Meta-Llama-3.1-405B-Instruct - Meta-Llama-3.1-70B-Instruct - Meta-Llama-3.1-8B-Instruct - Mistral-Nemo - Mistral-large - Mistral-large-2407 - Mistral-small - Phi-3-medium-128k-instruct - Phi-3-medium-4k-instruct - Phi-3-mini-128k-instruct - Phi-3-mini-4k-instruct - Phi-3-small-128k-instruct - Phi-3-small-8k-instruct - Phi-3.5-mini-instruct - gpt-4o - gpt-4o-mini - text-embedding-3-large - text-embedding-3-small fetch: false titleConvo: true titleModel: "gpt-4o-mini" # groq # Model 
list: https://console.groq.com/settings/limits - name: "groq" apiKey: "${GROQ_API_KEY}" baseURL: "https://api.groq.com/openai/v1/" models: default: - deepseek-r1-distill-llama-70b - deepseek-r1-distill-qwen-32b - gemma2-9b-it - llama-3.1-8b-instant - llama-3.2-11b-vision-preview - llama-3.2-1b-preview - llama-3.2-3b-preview - llama-3.2-90b-vision-preview - llama-3.3-70b-specdec - llama-3.3-70b-versatile - llama-guard-3-8b - llama3-70b-8192 - llama3-8b-8192 - mistral-saba-24b - mixtral-8x7b-32768 - qwen-2.5-32b - qwen-2.5-coder-32b fetch: false titleConvo: true titleModel: "mixtral-8x7b-32768" modelDisplayLabel: "groq" # HuggingFace # https://huggingface.co/settings/tokens - name: 'HuggingFace' apiKey: '${HUGGINGFACE_TOKEN}' baseURL: 'https://api-inference.huggingface.co/v1' models: default: - AIDC-AI/Marco-o1 - BioMistral/BioMistral-7B - CohereForAI/c4ai-command-r-plus - CohereForAI/c4ai-command-r-v01 - HuggingFaceH4/zephyr-7b-alpha - HuggingFaceH4/zephyr-7b-beta - HuggingFaceTB/SmolLM2-1.7B-Instruct - Intel/neural-chat-7b-v3-1 - MiniMaxAI/MiniMax-Text-01 - NexaAIDev/Octopus-v2 - NousResearch/Hermes-2-Pro-Mistral-7B - NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO - NovaSky-AI/Sky-T1-32B-Preview - Open-Orca/Mistral-7B-OpenOrca - PygmalionAI/pygmalion-6b - Qwen/QwQ-32B-Preview - Qwen/Qwen2-72B-Instruct - Qwen/Qwen2-7B-Instruct - Qwen/Qwen2.5-72B-Instruct - Qwen/Qwen2.5-7B-Instruct - Qwen/Qwen2.5-Coder-32B-Instruct - Qwen/Qwen2.5-Coder-7B-Instruct - TheBloke/Mistral-7B-Instruct-v0.2-GGUF - TinyLlama/TinyLlama-1.1B-Chat-v1.0 - berkeley-nest/Starling-LM-7B-alpha - cognitivecomputations/dolphin-2.5-mixtral-8x7b - cognitivecomputations/dolphin-2.9-llama3-8b - databricks/dbrx-base - databricks/dbrx-instruct - deepseek-ai/DeepSeek-Coder-V2-Instruct - deepseek-ai/DeepSeek-R1 - deepseek-ai/DeepSeek-R1-Distill-Llama-70B - deepseek-ai/DeepSeek-R1-Distill-Llama-8B - deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B - deepseek-ai/DeepSeek-R1-Distill-Qwen-14B - 
deepseek-ai/DeepSeek-R1-Distill-Qwen-32B - deepseek-ai/DeepSeek-R1-Distill-Qwen-7B - deepseek-ai/DeepSeek-R1-Zero - deepseek-ai/DeepSeek-V2-Chat - deepseek-ai/DeepSeek-V2.5 - deepseek-ai/DeepSeek-V3 - deepseek-ai/deepseek-coder-33b-instruct - google/gemma-2-27b-it - google/gemma-2-2b-it - google/gemma-2-9b-it - google/gemma-2b-it - google/gemma-7b-it - gradientai/Llama-3-8B-Instruct-Gradient-1048k - jinaai/ReaderLM-v2 - jinaai/reader-lm-1.5b - mattshumer/Reflection-Llama-3.1-70B - meta-llama/Llama-2-13b-chat-hf - meta-llama/Llama-2-70b-chat-hf - meta-llama/Llama-2-7b-chat-hf - meta-llama/Llama-3.1-405B-Instruct - meta-llama/Llama-3.1-70B-Instruct - meta-llama/Llama-3.1-8B-Instruct - meta-llama/Llama-3.2-1B-Instruct - meta-llama/Llama-3.2-3B-Instruct - meta-llama/Llama-3.3-70B-Instruct - meta-llama/Meta-Llama-3-70B-Instruct - meta-llama/Meta-Llama-3-8B-Instruct - microsoft/Phi-3-mini-128k-instruct - microsoft/Phi-3-mini-4k-instruct - microsoft/Phi-3-vision-128k-instruct - microsoft/Phi-3.5-MoE-instruct - microsoft/Phi-3.5-mini-instruct - microsoft/phi-4 - mistralai/Codestral-22B-v0.1 - mistralai/Mistral-7B-Instruct-v0.1 - mistralai/Mistral-7B-Instruct-v0.2 - mistralai/Mistral-7B-Instruct-v0.3 - mistralai/Mistral-Nemo-Instruct-2407 - mistralai/Mistral-Small-24B-Instruct-2501 - mistralai/Mixtral-8x22B-Instruct-v0.1 - mistralai/Mixtral-8x7B-Instruct-v0.1 - nvidia/Llama-3.1-Nemotron-70B-Instruct-HF - nvidia/Llama3-ChatQA-1.5-8B - openchat/openchat_3.5 - shenzhi-wang/Llama3-8B-Chinese-Chat - teknium/OpenHermes-2.5-Mistral-7B - tiiuae/falcon-180B-chat - tiiuae/falcon-7b-instruct - unsloth/DeepSeek-R1-GGUF - upstage/SOLAR-10.7B-Instruct-v1.0 - upstage/solar-pro-preview-instruct fetch: false titleConvo: true titleModel: "NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO" dropParams: - "top_p" # Hyperbolic # https://app.hyperbolic.xyz/models - name: 'Hyperbolic' apiKey: '${HYPERBOLIC_API_KEY}' baseURL: 'https://api.hyperbolic.xyz/v1/' models: default: - 
NousResearch/Hermes-3-Llama-3.1-70B - Qwen/QwQ-32B-Preview - Qwen/Qwen2-VL-72B-Instruct - Qwen/Qwen2-VL-7B-Instruct - Qwen/Qwen2.5-72B-Instruct - Qwen/Qwen2.5-Coder-32B-Instruct - deepseek-ai/DeepSeek-R1 - deepseek-ai/DeepSeek-V3 - meta-llama/Llama-3.2-3B-Instruct - meta-llama/Llama-3.3-70B-Instruct - meta-llama/Meta-Llama-3-70B-Instruct - meta-llama/Meta-Llama-3.1-405B - meta-llama/Meta-Llama-3.1-405B-FP8 - meta-llama/Meta-Llama-3.1-405B-Instruct - meta-llama/Meta-Llama-3.1-405B-Instruct-Virtuals - meta-llama/Meta-Llama-3.1-70B-Instruct - meta-llama/Meta-Llama-3.1-8B-Instruct - mistralai/Pixtral-12B-2409 fetch: false titleConvo: true titleModel: "meta-llama/Meta-Llama-3.1-8B-Instruct" modelDisplayLabel: "Hyperbolic" iconURL: "https://app.hyperbolic.xyz/icon.svg" # kluster.ai # https://platform.kluster.ai/apikeys - name: "Kluster" apiKey: "${KLUSTER_API_KEY}" baseURL: "https://api.kluster.ai/v1/" models: default: - deepseek-ai/DeepSeek-R1 - klusterai/Meta-Llama-3.1-405B-Instruct-Turbo - klusterai/Meta-Llama-3.1-8B-Instruct-Turbo - klusterai/Meta-Llama-3.3-70B-Instruct-Turbo fetch: false titleConvo: true titleModel: 'klusterai/Meta-Llama-3.1-8B-Instruct-Turbo' modelDisplayLabel: 'Kluster' iconURL: "https://platform.kluster.ai/cropped-fav-1-144x144.png" # Mistral AI API # Model list: https://docs.mistral.ai/getting-started/models/ - name: "Mistral" apiKey: "${MISTRAL_API_KEY}" baseURL: "https://api.mistral.ai/v1" models: default: - codestral-2405 - codestral-2411-rc5 - codestral-2412 - codestral-2501 - codestral-latest - codestral-mamba-2407 - codestral-mamba-latest - ministral-3b-2410 - ministral-3b-latest - ministral-8b-2410 - ministral-8b-latest - mistral-embed - mistral-large-2402 - mistral-large-2407 - mistral-large-2411 - mistral-large-latest - mistral-large-pixtral-2411 - mistral-medium - mistral-medium-2312 - mistral-medium-latest - mistral-moderation-2411 - mistral-moderation-latest - mistral-saba-2502 - mistral-saba-latest - mistral-small - 
mistral-small-2312 - mistral-small-2402 - mistral-small-2409 - mistral-small-2501 - mistral-small-latest - mistral-tiny - mistral-tiny-2312 - mistral-tiny-2407 - mistral-tiny-latest - open-codestral-mamba - open-mistral-7b - open-mistral-nemo - open-mistral-nemo-2407 - open-mixtral-8x22b - open-mixtral-8x22b-2404 - open-mixtral-8x7b - pixtral-12b - pixtral-12b-2409 - pixtral-12b-latest - pixtral-large-2411 - pixtral-large-latest fetch: false titleConvo: true titleMethod: "completion" titleModel: "mistral-tiny" summarize: false summaryModel: "mistral-tiny" forcePrompt: false modelDisplayLabel: "Mistral" dropParams: - "stop" - "user" - "frequency_penalty" - "presence_penalty" # NanoGPT # https://nano-gpt.com/api # Model list: https://nano-gpt.com/api/models - name: "NanoGPT" iconURL: "https://nano-gpt.com/logo.png" apiKey: "${NANOGPT_API_KEY}" baseURL: "https://nano-gpt.com/api/v1/" models: default: - EVA-UNIT-01/EVA-LLaMA-3.33-70B-v0.0 - EVA-UNIT-01/EVA-LLaMA-3.33-70B-v0.1 - EVA-UNIT-01/EVA-Qwen2.5-32B-v0.2 - EVA-UNIT-01/EVA-Qwen2.5-72B-v0.2 - Envoid/Llama-3.05-NT-Storybreaker-Ministral-70B - Envoid/Llama-3.05-Nemotron-Tenyxchat-Storybreaker-70B - GalrionSoftworks/MN-LooseCannon-12B-v1 - Gryphe/MythoMax-L2-13b - Infermatic/MN-12B-Inferor-v0.0 - LatitudeGames/Wayfarer-Large-70B-Llama-3.3 - Llama-3.1-Tulu-3-405B - Llama-3.3+3.1-70B-ArliAI-RPMax-v1.3 - Llama-3.3-70B-MiraiFanfare - MarinaraSpaghetti/NemoMix-Unleashed-12B - Meta-Llama-3-1-405B-Instruct-FP8 - Meta-Llama-3-1-8B-Instruct-FP8 - Mistral-Nemo-12B-ArliAI-RPMax-v1.2 - Mistral-Nemo-12B-Wayfarer - NeverSleep/Llama-3-Lumimaid-70B-v0.1 - NeverSleep/Lumimaid-v0.2-70B - Nexusflow/Athene-V2-Chat - Qwen/QwQ-32B-Preview - Qwen/Qwen2.5-Coder-32B-Instruct - Qwen2.5-32B-Dazzling-Star-Aurora-32b-v0.0 - Qwen2.5-32B-EVA-v0.2 - Sao10K/L3.1-70B-Euryale-v2.2 - Sao10K/L3.1-70B-Hanami-x1 - Sao10K/L3.3-70B-Euryale-v2.3 - Steelskull/L3.3-Damascus-R1 - Steelskull/L3.3-MS-Evalebis-70b - Steelskull/L3.3-MS-Evayale-70B - 
TheDrummer/Anubis-70B-v1 - TheDrummer/Cydonia-24B-v2 - TheDrummer/Rocinante-12B-v1.1 - TheDrummer/UnslopNemo-12B-v4.1 - VongolaChouko/Starcannon-Unleashed-12B-v1.0 - abacusai/Dracarys-72B-Instruct - aion-labs/aion-1.0 - aion-labs/aion-1.0-mini - aion-labs/aion-rp-llama-3.1-8b - amazon/nova-lite-v1 - amazon/nova-micro-v1 - amazon/nova-pro-v1 - anthracite-org/magnum-v2-72b - anthracite-org/magnum-v4-72b - azure-gpt-4-turbo - azure-gpt-4o - azure-gpt-4o-mini - azure-o1 - azure-o3-mini - chatgpt-4o-latest - claude-3-5-haiku-20241022 - claude-3-5-sonnet-20240620 - claude-3-5-sonnet-20241022 - claude-3-7-sonnet-20250219 - claude-3-7-sonnet-thinking - claude-3-7-sonnet-thinking:1024 - claude-3-7-sonnet-thinking:128000 - claude-3-7-sonnet-thinking:32768 - claude-3-7-sonnet-thinking:8192 - claude-3-opus-20240229 - cognitivecomputations/dolphin-mixtral-8x22b - cohere/command-r - cohere/command-r-plus-08-2024 - deep-research - deepclaude - deepseek-ai/DeepSeek-R1-Zero - deepseek-chat - deepseek-chat-cheaper - deepseek-r1-llama-70b - deepseek-r1-nano - deepseek-r1-sambanova - deepseek-reasoner - deepseek-reasoner-cheaper - dolphin-2.9.2-qwen2-72b - doubao-1.5-pro-256k - doubao-1.5-pro-32k - doubao-1.5-vision-pro-32k - eva-unit-01/eva-qwen-2.5-72b - failspy/Meta-Llama-3-70B-Instruct-abliterated-v3.5 - free-model - gemini-2.0-flash-001 - gemini-2.0-flash-exp-search - gemini-2.0-flash-lite - gemini-2.0-flash-thinking-exp-01-21 - gemini-2.0-flash-thinking-exp-1219 - gemini-2.0-pro-exp-02-05 - gemini-exp-1206 - gemini-exp-1206 - glm-4 - glm-4-air - glm-4-air-0111 - glm-4-airx - glm-4-flash - glm-4-long - glm-4-plus - glm-4-plus-0111 - glm-zero-preview - google/gemini-flash-1.5 - gpt-3.5-turbo - gpt-4-turbo-preview - gpt-4o - gpt-4o-2024-08-06 - gpt-4o-2024-11-20 - gpt-4o-mini - grok-2-1212 - grok-2-vision-1212 - grok-3 - grok-3-deepsearch - grok-3-reasoner - grok-beta - huihui-ai/DeepSeek-R1-Distill-Llama-70B-abliterated - huihui-ai/DeepSeek-R1-Distill-Qwen-32B-abliterated - 
huihui-ai/Llama-3.1-Nemotron-70B-Instruct-HF-abliterated - huihui-ai/Llama-3.3-70B-Instruct-abliterated - inflatebot/MN-12B-Mag-Mell-R1 - inflection/inflection-3-pi - inflection/inflection-3-productivity - kimi-k1.5-preview - kimi-latest - learnlm-1.5-pro-experimental - llama-3.3-70b - meta-llama/llama-3.1-8b-instruct - meta-llama/llama-3.2-3b-instruct - meta-llama/llama-3.2-90b-vision-instruct - microsoft/wizardlm-2-7b - microsoft/wizardlm-2-8x22b - minimax/minimax-01 - mistralai/Mistral-Nemo-Instruct-2407 - mistralai/mistral-7b-instruct - mistralai/mistral-large - mistralai/mistral-saba - mistralai/mistral-tiny - mlabonne/NeuralDaredevil-8B-abliterated - model-selector - nothingiisreal/L3.1-70B-Celeste-V0.1-BF16 - nousresearch/hermes-3-llama-3.1-405b - nvidia/Llama-3.1-Nemotron-70B-Instruct-HF - o1 - o1-plus - o1-preview - o3-mini - o3-mini-high - o3-mini-low - qwen-long - qwen-max - qwen-plus - qwen-turbo - qwen/qwen-2.5-72b-instruct - r1-1776 - raifle/sorcererlm-8x22b - recommended-model - sonar - sonar-deep-research - sonar-pro - sonar-reasoning - sonar-reasoning-pro - step-2-16k - step-2-16k-exp - step-2-mini - undi95/remm-slerp-l2-13b - yi-34b-chat-0205 - yi-34b-chat-200k - yi-large - yi-large-turbo - yi-lightning - yi-medium-200k fetch: false titleConvo: true titleModel: "current_model" modelDisplayLabel: "NanoGPT" # NVIDIA # https://build.nvidia.com/explore/discover - name: "Nvidia" apiKey: "${NVIDIA_API_KEY}" baseURL: "https://integrate.api.nvidia.com/v1/" models: default: - 01-ai/yi-large - abacusai/dracarys-llama-3.1-70b-instruct - adept/fuyu-8b - ai21labs/jamba-1.5-large-instruct - ai21labs/jamba-1.5-mini-instruct - aisingapore/sea-lion-7b-instruct - baai/bge-m3 - baichuan-inc/baichuan2-13b-chat - bigcode/starcoder2-15b - bigcode/starcoder2-7b - databricks/dbrx-instruct - deepseek-ai/deepseek-coder-6.7b-instruct - deepseek-ai/deepseek-r1 - google/codegemma-1.1-7b - google/codegemma-7b - google/deplot - google/gemma-2-27b-it - google/gemma-2-2b-it - 
google/gemma-2-9b-it - google/gemma-2b - google/gemma-7b - google/paligemma - google/recurrentgemma-2b - google/shieldgemma-9b - ibm/granite-3.0-3b-a800m-instruct - ibm/granite-3.0-8b-instruct - ibm/granite-34b-code-instruct - ibm/granite-8b-code-instruct - ibm/granite-guardian-3.0-8b - igenius/colosseum_355b_instruct_16k - igenius/italia_10b_instruct_16k - institute-of-science-tokyo/llama-3.1-swallow-70b-instruct-v0.1 - institute-of-science-tokyo/llama-3.1-swallow-8b-instruct-v0.1 - mediatek/breeze-7b-instruct - meta/codellama-70b - meta/llama-3.1-405b-instruct - meta/llama-3.1-70b-instruct - meta/llama-3.1-8b-instruct - meta/llama-3.2-1b-instruct - meta/llama-3.2-3b-instruct - meta/llama-3.3-70b-instruct - meta/llama2-70b - meta/llama3-70b-instruct - meta/llama3-8b-instruct - microsoft/kosmos-2 - microsoft/phi-3-medium-128k-instruct - microsoft/phi-3-medium-4k-instruct - microsoft/phi-3-mini-128k-instruct - microsoft/phi-3-mini-4k-instruct - microsoft/phi-3-small-128k-instruct - microsoft/phi-3-small-8k-instruct - microsoft/phi-3-vision-128k-instruct - microsoft/phi-3.5-mini-instruct - microsoft/phi-3.5-moe-instruct - microsoft/phi-3.5-vision-instruct - microsoft/phi-4-mini-instruct - mistralai/codestral-22b-instruct-v0.1 - mistralai/mamba-codestral-7b-v0.1 - mistralai/mathstral-7b-v0.1 - mistralai/mistral-7b-instruct-v0.2 - mistralai/mistral-7b-instruct-v0.3 - mistralai/mistral-large - mistralai/mistral-large-2-instruct - mistralai/mistral-small-24b-instruct - mistralai/mixtral-8x22b-instruct-v0.1 - mistralai/mixtral-8x22b-v0.1 - mistralai/mixtral-8x7b-instruct-v0.1 - nv-mistralai/mistral-nemo-12b-instruct - nvidia/embed-qa-4 - nvidia/llama-3.1-nemoguard-8b-content-safety - nvidia/llama-3.1-nemoguard-8b-topic-control - nvidia/llama-3.1-nemotron-51b-instruct - nvidia/llama-3.1-nemotron-70b-instruct - nvidia/llama-3.1-nemotron-70b-reward - nvidia/llama-3.2-nv-embedqa-1b-v1 - nvidia/llama-3.2-nv-embedqa-1b-v2 - nvidia/llama3-chatqa-1.5-70b - 
nvidia/llama3-chatqa-1.5-8b - nvidia/mistral-nemo-minitron-8b-8k-instruct - nvidia/mistral-nemo-minitron-8b-base - nvidia/nemotron-4-340b-instruct - nvidia/nemotron-4-340b-reward - nvidia/nemotron-4-mini-hindi-4b-instruct - nvidia/nemotron-mini-4b-instruct - nvidia/neva-22b - nvidia/nv-embed-v1 - nvidia/nv-embedqa-e5-v5 - nvidia/nv-embedqa-mistral-7b-v2 - nvidia/nvclip - nvidia/usdcode-llama-3.1-70b-instruct - nvidia/vila - qwen/qwen2-7b-instruct - qwen/qwen2.5-7b-instruct - qwen/qwen2.5-coder-32b-instruct - qwen/qwen2.5-coder-7b-instruct - rakuten/rakutenai-7b-chat - rakuten/rakutenai-7b-instruct - snowflake/arctic-embed-l - thudm/chatglm3-6b - tiiuae/falcon3-7b-instruct - tokyotech-llm/llama-3-swallow-70b-instruct-v0.1 - upstage/solar-10.7b-instruct - writer/palmyra-creative-122b - writer/palmyra-fin-70b-32k - writer/palmyra-med-70b - writer/palmyra-med-70b-32k - yentinglin/llama-3-taiwan-70b-instruct - zyphra/zamba2-7b-instruct fetch: false titleConvo: true titleModel: "nvidia/nemotron-mini-4b-instruct" modelDisplayLabel: "Nvidia" iconURL: "https://raw.githubusercontent.com/LibreChat-AI/librechat-config-yaml/refs/heads/main/icons/nvidia.png" # OpenRouter.ai # Model list: https://openrouter.ai/models # Script to fetch models: https://github.com/LibreChat-AI/librechat-config-yaml/blob/main/scripts/openrouter.py - name: "OpenRouter" apiKey: "${OPENROUTER_KEY}" baseURL: "https://openrouter.ai/api/v1" models: default: - openrouter/auto - '---FREE---' - cognitivecomputations/dolphin3.0-mistral-24b:free - cognitivecomputations/dolphin3.0-r1-mistral-24b:free - deepseek/deepseek-chat:free - deepseek/deepseek-r1-distill-llama-70b:free - deepseek/deepseek-r1:free - google/gemini-2.0-flash-exp:free - google/gemini-2.0-flash-lite-preview-02-05:free - google/gemini-2.0-flash-thinking-exp-1219:free - google/gemini-2.0-flash-thinking-exp:free - google/gemini-2.0-pro-exp-02-05:free - google/gemini-exp-1206:free - google/gemma-2-9b-it:free - 
google/learnlm-1.5-pro-experimental:free - gryphe/mythomax-l2-13b:free - huggingfaceh4/zephyr-7b-beta:free - meta-llama/llama-3-8b-instruct:free - meta-llama/llama-3.1-8b-instruct:free - meta-llama/llama-3.2-11b-vision-instruct:free - meta-llama/llama-3.2-1b-instruct:free - meta-llama/llama-3.3-70b-instruct:free - microsoft/phi-3-medium-128k-instruct:free - microsoft/phi-3-mini-128k-instruct:free - mistralai/mistral-7b-instruct:free - mistralai/mistral-nemo:free - mistralai/mistral-small-24b-instruct-2501:free - nvidia/llama-3.1-nemotron-70b-instruct:free - openchat/openchat-7b:free - qwen/qwen-vl-plus:free - qwen/qwen2.5-vl-72b-instruct:free - sophosympatheia/rogue-rose-103b-v0.2:free - undi95/toppy-m-7b:free - '---BETA---' - anthropic/claude-2.0:beta - anthropic/claude-2.1:beta - anthropic/claude-2:beta - anthropic/claude-3-haiku:beta - anthropic/claude-3-opus:beta - anthropic/claude-3-sonnet:beta - anthropic/claude-3.5-haiku-20241022:beta - anthropic/claude-3.5-haiku:beta - anthropic/claude-3.5-sonnet-20240620:beta - anthropic/claude-3.5-sonnet:beta - anthropic/claude-3.7-sonnet:beta - '---EXTENDED---' - neversleep/llama-3-lumimaid-8b:extended - openai/gpt-4o:extended - '---AI21---' - ai21/jamba-1-5-large - ai21/jamba-1-5-mini - ai21/jamba-instruct - '---AION-LABS---' - aion-labs/aion-1.0 - aion-labs/aion-1.0-mini - aion-labs/aion-rp-llama-3.1-8b - '---AMAZON---' - amazon/nova-lite-v1 - amazon/nova-micro-v1 - amazon/nova-pro-v1 - '---ANTHROPIC---' - anthropic/claude-2 - anthropic/claude-2.0 - anthropic/claude-2.1 - anthropic/claude-3-7-sonnet - anthropic/claude-3-haiku - anthropic/claude-3-opus - anthropic/claude-3-sonnet - anthropic/claude-3.5-haiku - anthropic/claude-3.5-haiku-20241022 - anthropic/claude-3.5-sonnet - anthropic/claude-3.5-sonnet-20240620 - anthropic/claude-3.7-sonnet - anthropic/claude-3.7-sonnet:thinking - '---COHERE---' - cohere/command - cohere/command-r - cohere/command-r-03-2024 - cohere/command-r-08-2024 - cohere/command-r-plus - 
cohere/command-r-plus-04-2024 - cohere/command-r-plus-08-2024 - cohere/command-r7b-12-2024 - '---DEEPSEEK---' - deepseek/deepseek-chat - deepseek/deepseek-chat-v2.5 - deepseek/deepseek-r1 - deepseek/deepseek-r1-distill-llama-70b - deepseek/deepseek-r1-distill-llama-8b - deepseek/deepseek-r1-distill-qwen-1.5b - deepseek/deepseek-r1-distill-qwen-14b - deepseek/deepseek-r1-distill-qwen-32b - '---EVA-UNIT-01---' - eva-unit-01/eva-llama-3.33-70b - eva-unit-01/eva-qwen-2.5-32b - eva-unit-01/eva-qwen-2.5-72b - '---GOOGLE---' - google/gemini-2.0-flash-001 - google/gemini-2.0-flash-lite-001 - google/gemini-flash-1.5 - google/gemini-flash-1.5-8b - google/gemini-flash-1.5-8b-exp - google/gemini-pro - google/gemini-pro-1.5 - google/gemini-pro-vision - google/gemma-2-27b-it - google/gemma-2-9b-it - google/gemma-7b-it - google/palm-2-chat-bison - google/palm-2-chat-bison-32k - google/palm-2-codechat-bison - google/palm-2-codechat-bison-32k - '---LIQUID---' - liquid/lfm-3b - liquid/lfm-40b - liquid/lfm-7b - '---META-LLAMA---' - meta-llama/llama-2-13b-chat - meta-llama/llama-2-70b-chat - meta-llama/llama-3-70b-instruct - meta-llama/llama-3-8b-instruct - meta-llama/llama-3.1-405b - meta-llama/llama-3.1-405b-instruct - meta-llama/llama-3.1-70b-instruct - meta-llama/llama-3.1-8b-instruct - meta-llama/llama-3.2-11b-vision-instruct - meta-llama/llama-3.2-1b-instruct - meta-llama/llama-3.2-3b-instruct - meta-llama/llama-3.2-90b-vision-instruct - meta-llama/llama-3.3-70b-instruct - meta-llama/llama-guard-2-8b - meta-llama/llama-guard-3-8b - '---MICROSOFT---' - microsoft/phi-3-medium-128k-instruct - microsoft/phi-3-mini-128k-instruct - microsoft/phi-3.5-mini-128k-instruct - microsoft/phi-4 - microsoft/wizardlm-2-7b - microsoft/wizardlm-2-8x22b - '---MISTRALAI---' - mistralai/codestral-2501 - mistralai/codestral-mamba - mistralai/ministral-3b - mistralai/ministral-8b - mistralai/mistral-7b-instruct - mistralai/mistral-7b-instruct-v0.1 - mistralai/mistral-7b-instruct-v0.3 - 
mistralai/mistral-large - mistralai/mistral-large-2407 - mistralai/mistral-large-2411 - mistralai/mistral-medium - mistralai/mistral-nemo - mistralai/mistral-saba - mistralai/mistral-small - mistralai/mistral-small-24b-instruct-2501 - mistralai/mistral-tiny - mistralai/mixtral-8x22b-instruct - mistralai/mixtral-8x7b - mistralai/mixtral-8x7b-instruct - mistralai/pixtral-12b - mistralai/pixtral-large-2411 - '---NEVERSLEEP---' - neversleep/llama-3-lumimaid-70b - neversleep/llama-3-lumimaid-8b - neversleep/llama-3.1-lumimaid-70b - neversleep/llama-3.1-lumimaid-8b - neversleep/noromaid-20b - '---NOUSRESEARCH---' - nousresearch/hermes-2-pro-llama-3-8b - nousresearch/hermes-3-llama-3.1-405b - nousresearch/hermes-3-llama-3.1-70b - nousresearch/nous-hermes-2-mixtral-8x7b-dpo - nousresearch/nous-hermes-llama2-13b - '---OPENAI---' - openai/chatgpt-4o-latest - openai/gpt-3.5-turbo - openai/gpt-3.5-turbo-0125 - openai/gpt-3.5-turbo-0613 - openai/gpt-3.5-turbo-1106 - openai/gpt-3.5-turbo-16k - openai/gpt-3.5-turbo-instruct - openai/gpt-4 - openai/gpt-4-0314 - openai/gpt-4-1106-preview - openai/gpt-4-32k - openai/gpt-4-32k-0314 - openai/gpt-4-turbo - openai/gpt-4-turbo-preview - openai/gpt-4o - openai/gpt-4o-2024-05-13 - openai/gpt-4o-2024-08-06 - openai/gpt-4o-2024-11-20 - openai/gpt-4o-mini - openai/gpt-4o-mini-2024-07-18 - openai/o1 - openai/o1-mini - openai/o1-mini-2024-09-12 - openai/o1-preview - openai/o1-preview-2024-09-12 - openai/o3-mini - openai/o3-mini-high - '---PERPLEXITY---' - perplexity/llama-3.1-sonar-huge-128k-online - perplexity/llama-3.1-sonar-large-128k-chat - perplexity/llama-3.1-sonar-large-128k-online - perplexity/llama-3.1-sonar-small-128k-chat - perplexity/llama-3.1-sonar-small-128k-online - perplexity/r1-1776 - perplexity/sonar - perplexity/sonar-reasoning - '---QWEN---' - qwen/qvq-72b-preview - qwen/qwen-2-72b-instruct - qwen/qwen-2-vl-72b-instruct - qwen/qwen-2-vl-7b-instruct - qwen/qwen-2.5-72b-instruct - qwen/qwen-2.5-7b-instruct - 
qwen/qwen-2.5-coder-32b-instruct - qwen/qwen-max - qwen/qwen-plus - qwen/qwen-turbo - qwen/qwq-32b-preview - '---SAO10K---' - sao10k/fimbulvetr-11b-v2 - sao10k/l3-euryale-70b - sao10k/l3-lunaris-8b - sao10k/l3.1-70b-hanami-x1 - sao10k/l3.1-euryale-70b - sao10k/l3.3-euryale-70b - '---X-AI---' - x-ai/grok-2-1212 - x-ai/grok-2-vision-1212 - x-ai/grok-beta - x-ai/grok-vision-beta - '---OTHERS---' - 01-ai/yi-large - aetherwiing/mn-starcannon-12b - allenai/llama-3.1-tulu-3-405b - alpindale/goliath-120b - alpindale/magnum-72b - anthracite-org/magnum-v2-72b - anthracite-org/magnum-v4-72b - cognitivecomputations/dolphin-mixtral-8x22b - cognitivecomputations/dolphin-mixtral-8x7b - databricks/dbrx-instruct - gryphe/mythomax-l2-13b - infermatic/mn-inferor-12b - inflatebot/mn-mag-mell-r1 - inflection/inflection-3-pi - inflection/inflection-3-productivity - jondurbin/airoboros-l2-70b - mancer/weaver - minimax/minimax-01 - nothingiisreal/mn-celeste-12b - nvidia/llama-3.1-nemotron-70b-instruct - openchat/openchat-7b - pygmalionai/mythalion-13b - raifle/sorcererlm-8x22b - sophosympatheia/midnight-rose-70b - teknium/openhermes-2.5-mistral-7b - thedrummer/rocinante-12b - thedrummer/unslopnemo-12b - undi95/remm-slerp-l2-13b - undi95/toppy-m-7b - xwin-lm/xwin-lm-70b fetch: false dropParams: - "stop" titleConvo: true titleModel: "openai/gpt-4o-mini" summarize: false summaryModel: "openai/gpt-4o-mini" forcePrompt: false modelDisplayLabel: "OpenRouter"

    # Perplexity
    # Model list: https://docs.perplexity.ai/docs/model-cards
    - name: "Perplexity"
      apiKey: "${PERPLEXITY_API_KEY}"
      baseURL: "https://api.perplexity.ai/"
      models:
        default:
          - r1-1776
          - sonar
          - sonar-deep-research
          - sonar-pro
          - sonar-reasoning
          - sonar-reasoning-pro
        fetch: false  # fetching list of models is not supported
      titleConvo: true
      # Title/summary model is kept to an ID listed under `default` above.
      titleModel: "sonar"
      summarize: false
      summaryModel: "sonar"
      forcePrompt: false
      dropParams:
        - "stop"
        - "frequency_penalty"
      modelDisplayLabel: "Perplexity"

    # SambaNova
    # https://cloud.sambanova.ai/apis
    - name: "SambaNova"
      iconURL: "https://sambanova.ai/hubfs/logotype_sambanova_orange.png"
      apiKey: "${SAMBANOVA_API_KEY}"
      baseURL: "https://api.sambanova.ai/v1/"
      models:
        default:
          - DeepSeek-R1
          - DeepSeek-R1-Distill-Llama-70B
          - Llama-3.1-Tulu-3-405B
          - Llama-3.2-11B-Vision-Instruct
          - Llama-3.2-90B-Vision-Instruct
          - Meta-Llama-3.1-405B-Instruct
          - Meta-Llama-3.1-70B-Instruct
          - Meta-Llama-3.1-8B-Instruct
          - Meta-Llama-3.2-1B-Instruct
          - Meta-Llama-3.2-3B-Instruct
          - Meta-Llama-3.3-70B-Instruct
          - Meta-Llama-Guard-3-8B
          - QwQ-32B-Preview
          - Qwen2-Audio-7B-Instruct
          - Qwen2.5-72B-Instruct
          - Qwen2.5-Coder-32B-Instruct
        fetch: false
      titleConvo: true
      titleModel: "Meta-Llama-3.1-8B-Instruct"
      modelDisplayLabel: "SambaNova"

    # together.ai
    # https://api.together.ai/settings/api-keys
    # Model list: https://docs.together.ai/docs/inference-models
    - name: "together.ai"
      apiKey: "${TOGETHERAI_API_KEY}"
      baseURL: "https://api.together.xyz"
      models:
        default:
          - Gryphe/MythoMax-L2-13b
          - Gryphe/MythoMax-L2-13b-Lite
          - NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO
          - Qwen/QwQ-32B-Preview
          - Qwen/Qwen2-72B-Instruct
          - Qwen/Qwen2-VL-72B-Instruct
          - Qwen/Qwen2.5-72B-Instruct-Turbo
          - Qwen/Qwen2.5-7B-Instruct-Turbo
          - Qwen/Qwen2.5-Coder-32B-Instruct
          - databricks/dbrx-instruct
          - deepseek-ai/DeepSeek-R1
          - deepseek-ai/DeepSeek-R1-Distill-Llama-70B
          - deepseek-ai/DeepSeek-R1-Distill-Llama-70B-free
          - deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B
          - deepseek-ai/DeepSeek-R1-Distill-Qwen-14B
          - deepseek-ai/DeepSeek-V3
          - google/gemma-2-27b-it
          - google/gemma-2-9b-it
          - google/gemma-2b-it
          - meta-llama/Llama-2-13b-chat-hf
          - meta-llama/Llama-2-7b-chat-hf
          - meta-llama/Llama-3-70b-chat-hf
          - meta-llama/Llama-3-8b-chat-hf
          - meta-llama/Llama-3.2-11B-Vision-Instruct-Turbo
          - meta-llama/Llama-3.2-3B-Instruct-Turbo
          - meta-llama/Llama-3.2-90B-Vision-Instruct-Turbo
          - meta-llama/Llama-3.3-70B-Instruct-Turbo
          - meta-llama/Llama-3.3-70B-Instruct-Turbo-Free
          - meta-llama/Llama-Vision-Free
          - meta-llama/Meta-Llama-3-70B-Instruct-Lite
          - meta-llama/Meta-Llama-3-70B-Instruct-Turbo
          - meta-llama/Meta-Llama-3-8B-Instruct-Lite
          - meta-llama/Meta-Llama-3-8B-Instruct-Turbo
          - meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo
          - meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo
          - meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo
          - meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo-128K
          - meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo-classifier
          - microsoft/WizardLM-2-8x22B
          - mistralai/Mistral-7B-Instruct-v0.1
          - mistralai/Mistral-7B-Instruct-v0.2
          - mistralai/Mistral-7B-Instruct-v0.3
          - mistralai/Mistral-Small-24B-Instruct-2501
          - mistralai/Mixtral-8x22B-Instruct-v0.1
          - mistralai/Mixtral-8x7B-Instruct-v0.1
          - nvidia/Llama-3.1-Nemotron-70B-Instruct-HF
          - scb10x/scb10x-llama3-1-typhoon2-60256
          - scb10x/scb10x-llama3-typhoon-v1-5-8b-instruct
          - scb10x/scb10x-llama3-typhoon-v1-5x-4f316
          - togethercomputer/MoA-1
          - togethercomputer/MoA-1-Turbo
          - upstage/SOLAR-10.7B-Instruct-v1.0
        fetch: false
      titleConvo: true
      # Title/summary model is kept to an ID listed under `default` above.
      titleModel: "meta-llama/Llama-2-7b-chat-hf"
      summarize: false
      summaryModel: "meta-llama/Llama-2-7b-chat-hf"
      forcePrompt: false
      modelDisplayLabel: "together.ai"

    # Unify
    # Model list: https://unify.ai/chat
    - name: "Unify"
      apiKey: "${UNIFY_API_KEY}"
      baseURL: "https://api.unify.ai/v0/"
      models:
        default:
          - chatgpt-4o-latest@openai
          - claude-3-haiku@anthropic
          - claude-3-haiku@aws-bedrock
          - claude-3-haiku@vertex-ai
          - claude-3-opus@anthropic
          - claude-3-opus@aws-bedrock
          - claude-3-opus@vertex-ai
          - claude-3-sonnet@anthropic
          - claude-3-sonnet@aws-bedrock
          - claude-3.5-haiku@anthropic
          - claude-3.5-haiku@aws-bedrock
          - claude-3.5-haiku@replicate
          - claude-3.5-haiku@vertex-ai
          - claude-3.5-sonnet-20240620@anthropic
          - claude-3.5-sonnet-20240620@aws-bedrock
          - claude-3.5-sonnet-20240620@vertex-ai
          - claude-3.5-sonnet@anthropic
          - claude-3.5-sonnet@aws-bedrock
          - claude-3.5-sonnet@replicate
          - claude-3.5-sonnet@vertex-ai
          - claude-3.7-sonnet@anthropic
          - claude-3.7-sonnet@aws-bedrock
          - claude-3.7-sonnet@vertex-ai
          - command-r-plus@aws-bedrock
          - deepseek-r1@deepinfra
          - deepseek-r1@deepseek
          - deepseek-r1@fireworks-ai
          - deepseek-r1@replicate
          - deepseek-r1@together-ai
          - deepseek-v3@deepinfra
          - deepseek-v3@deepseek
          - deepseek-v3@fireworks-ai
          - deepseek-v3@together-ai
          - gemini-1.0-pro-001@vertex-ai
          - gemini-1.0-pro-002@vertex-ai
          - gemini-1.0-pro@vertex-ai
          - gemini-1.5-flash-001@vertex-ai
          - gemini-1.5-flash-002@vertex-ai
          - gemini-1.5-flash@vertex-ai
          - gemini-1.5-pro-001@vertex-ai
          - gemini-1.5-pro-002@vertex-ai
          - gemini-1.5-pro@vertex-ai
          - gemini-2.0-flash-lite@vertex-ai
          - gemini-2.0-flash@vertex-ai
          - gemma-2-27b-it@deepinfra
          - gemma-2-27b-it@together-ai
          - gemma-2-9b-it@deepinfra
          - gemma-2-9b-it@groq
          - gemma-2-9b-it@lepton-ai
          - gemma-2-9b-it@together-ai
          - gpt-3.5-turbo@openai
          - gpt-4-turbo@openai
          - gpt-4@openai
          - gpt-4o-2024-05-13@openai
          - gpt-4o-2024-08-06@openai
          - gpt-4o-2024-11-20@openai
          - gpt-4o-mini@openai
          - gpt-4o@openai
          - grok-2-vision@xai
          - grok-2@xai
          - llama-3-70b-chat@aws-bedrock
          - llama-3-70b-chat@deepinfra
          - llama-3-70b-chat@fireworks-ai
          - llama-3-70b-chat@groq
          - llama-3-70b-chat@replicate
          - llama-3-70b-chat@together-ai
          - llama-3-8b-chat@aws-bedrock
          - llama-3-8b-chat@deepinfra
          - llama-3-8b-chat@fireworks-ai
          - llama-3-8b-chat@groq
          - llama-3-8b-chat@replicate
          - llama-3-8b-chat@together-ai
          - llama-3.1-405b-chat@aws-bedrock
          - llama-3.1-405b-chat@deepinfra
          - llama-3.1-405b-chat@fireworks-ai
          - llama-3.1-405b-chat@replicate
          - llama-3.1-405b-chat@together-ai
          - llama-3.1-405b-chat@vertex-ai
          - llama-3.1-70b-chat@aws-bedrock
          - llama-3.1-70b-chat@deepinfra
          - llama-3.1-70b-chat@fireworks-ai
          - llama-3.1-70b-chat@together-ai
          - llama-3.1-70b-chat@vertex-ai
          - llama-3.1-8b-chat@aws-bedrock
          - llama-3.1-8b-chat@deepinfra
          - llama-3.1-8b-chat@fireworks-ai
          - llama-3.1-8b-chat@groq
          - llama-3.1-8b-chat@lepton-ai
          - llama-3.1-8b-chat@together-ai
          - llama-3.1-8b-chat@vertex-ai
          - llama-3.1-nemotron-70b-chat@deepinfra
          - llama-3.2-11b-chat@deepinfra
          - llama-3.2-11b-chat@fireworks-ai
          - llama-3.2-11b-chat@groq
          - llama-3.2-11b-chat@together-ai
          - llama-3.2-11b-chat@vertex-ai
          - llama-3.2-1b-chat@aws-bedrock
          - llama-3.2-1b-chat@deepinfra
          - llama-3.2-1b-chat@groq
          - llama-3.2-1b-chat@lepton-ai
          - llama-3.2-3b-chat@aws-bedrock
          - llama-3.2-3b-chat@deepinfra
          - llama-3.2-3b-chat@fireworks-ai
          - llama-3.2-3b-chat@groq
          - llama-3.2-3b-chat@lepton-ai
          - llama-3.2-3b-chat@together-ai
          - llama-3.2-90b-chat@deepinfra
          - llama-3.2-90b-chat@fireworks-ai
          - llama-3.2-90b-chat@groq
          - llama-3.2-90b-chat@together-ai
          - llama-3.2-90b-chat@vertex-ai
          - llama-3.3-70b-chat@aws-bedrock
          - llama-3.3-70b-chat@deepinfra
          - llama-3.3-70b-chat@fireworks-ai
          - llama-3.3-70b-chat@groq
          - llama-3.3-70b-chat@lepton-ai
          - llama-3.3-70b-chat@together-ai
          - ministral-3b@mistral-ai
          - ministral-8b@mistral-ai
          - mistral-7b-instruct-v0.2@aws-bedrock
          - mistral-7b-instruct-v0.3@deepinfra
          - mistral-7b-instruct-v0.3@lepton-ai
          - mistral-7b-instruct-v0.3@mistral-ai
          - mistral-7b-instruct-v0.3@together-ai
          - mistral-large@aws-bedrock
          - mistral-large@mistral-ai
          - mistral-large@vertex-ai
          - mistral-nemo@deepinfra
          - mistral-nemo@lepton-ai
          - mistral-nemo@mistral-ai
          - mistral-nemo@vertex-ai
          - mistral-small@deepinfra
          - mistral-small@fireworks-ai
          - mistral-small@mistral-ai
          - mistral-small@together-ai
          - mixtral-8x22b-instruct-v0.1@fireworks-ai
          - mixtral-8x22b-instruct-v0.1@mistral-ai
          - mixtral-8x22b-instruct-v0.1@together-ai
          - mixtral-8x7b-instruct-v0.1@aws-bedrock
          - mixtral-8x7b-instruct-v0.1@deepinfra
          - mixtral-8x7b-instruct-v0.1@fireworks-ai
          - mixtral-8x7b-instruct-v0.1@groq
          - mixtral-8x7b-instruct-v0.1@lepton-ai
          - mixtral-8x7b-instruct-v0.1@mistral-ai
          - mixtral-8x7b-instruct-v0.1@together-ai
          - o1-mini@openai
          - o1@openai
          - o3-mini@openai
          - qwen-2-72b-instruct@together-ai
          - qwen-2.5-72b-instruct@deepinfra
          - qwen-2.5-72b-instruct@fireworks-ai
          - qwen-2.5-72b-instruct@together-ai
          - qwen-2.5-7b-instruct@deepinfra
          - qwen-2.5-7b-instruct@together-ai
          - qwen-2.5-coder-32b-instruct@deepinfra
          - qwen-2.5-coder-32b-instruct@fireworks-ai
          - qwen-2.5-coder-32b-instruct@groq
          - qwen-2.5-coder-32b-instruct@together-ai
          - qwen-qwq-32b-preview@fireworks-ai
          - qwen-qwq-32b-preview@together-ai
        fetch: false
      titleConvo: true
      titleModel: "gpt-4o-mini@openai"
      dropParams:
        - "stop"
        - "user"
        - "frequency_penalty"
        - "presence_penalty"

    # xAI
    # https://x.ai/api
    - name: "xai"
      apiKey: "${XAI_API_KEY}"
      baseURL: "https://api.x.ai/v1"
      models:
        default:
          - "grok-beta"
        fetch: false
      titleConvo: true
      titleMethod: "completion"
      titleModel: "grok-beta"
      summarize: false
      summaryModel: "grok-beta"
      forcePrompt: false
      modelDisplayLabel: "Grok"