# LibreChat / librechat.yaml
# L3n4's picture
# Update librechat.yaml
# 7b074ea verified
# Config schema version this file targets (quoted so it is always a string).
version: "1.2.1"
# Caching toggle.
cache: true
# Social login providers offered at sign-in, in the order listed.
registration:
  socialLogins:
    - "discord"
    - "facebook"
    - "github"
    - "google"
    - "openid"
endpoints:
custom:
# APIpie
# https://apipie.ai/dashboard/
# Script to fetch models: https://github.com/LibreChat-AI/librechat-config-yaml/blob/main/scripts/apipie.py
# The model list is static (fetch: false); regenerate it with the script above.
- name: "APIpie"
  apiKey: "${APIPIE_API_KEY}"
  baseURL: "https://apipie.ai/v1/"
  models:
    default:
      - DeepSeek-V3
      - Llama-2-13b-chat-hf
      - Llama-2-70b-chat-hf
      - Llama-2-70b-hf
      - Llama-2-7b-chat-hf
      - Llama-3-70b-chat-hf
      - Llama-3-8b-chat-hf
      - Llama-3.1-Nemotron-70B-Instruct-HF
      - Llama-3.2-11B-Vision-Instruct-Turbo
      - Llama-3.2-3B-Instruct-Turbo
      - Llama-3.2-90B-Vision-Instruct-Turbo
      - Llama-3.3-70B-Instruct-Turbo
      - Meta-Llama-3-70B-Instruct
      - Meta-Llama-3-70B-Instruct-Lite
      - Meta-Llama-3-70B-Instruct-Turbo
      - Meta-Llama-3-8B-Instruct
      - Meta-Llama-3-8B-Instruct-Lite
      - Meta-Llama-3-8B-Instruct-Turbo
      - Meta-Llama-3.1-70B-Instruct-Turbo
      - Meta-Llama-3.1-8B-Instruct-Turbo
      - Meta-Llama-3.1-8B-Instruct-Turbo-128K
      - Mistral-7B-Instruct-v0.1
      - Mistral-7B-Instruct-v0.2
      - Mistral-7B-Instruct-v0.3
      - Mixtral-8x22B-Instruct-v0.1
      - Mixtral-8x22B-v0.1
      - Mixtral-8x7B-Instruct-v0.1
      - Mixtral-8x7B-v0.1
      - MythoMax-L2-13b
      - MythoMax-L2-13b-Lite
      - Nous-Hermes-2-Mixtral-8x7B-DPO
      - QwQ-32B-Preview
      - Qwen2.5-72B-Instruct-Turbo
      - Qwen2.5-7B-Instruct-Turbo
      - SOLAR-10.7B-Instruct-v1.0
      - WizardLM-2-7B
      - WizardLM-2-8x22B
      - aion-1.0
      - aion-1.0-mini
      - aion-rp-llama-3.1-8b
      - airoboros-70b
      - airoboros-l2-70b
      - amazon.nova-lite-v1:0
      - amazon.nova-micro-v1:0
      - amazon.nova-pro-v1:0
      - chatgpt-4o-latest
      - chatx_cheap_128k
      - chatx_cheap_32k
      - chatx_cheap_4k
      - chatx_cheap_64k
      - chatx_cheap_8k
      - chatx_mids_4k
      - chatx_premium_128k
      - chatx_premium_32k
      - chatx_premium_4k
      - chatx_premium_8k
      - chronos-hermes-13b-v2
      - claude-2
      - claude-2.0
      - claude-2.1
      - claude-3-5-haiku
      - claude-3-5-haiku-20241022
      - claude-3-5-haiku-20241022-v1
      - claude-3-5-haiku-latest
      - claude-3-5-sonnet
      - claude-3-5-sonnet-20240620
      - claude-3-5-sonnet-20240620-v1
      - claude-3-5-sonnet-20241022
      - claude-3-5-sonnet-20241022-v2
      - claude-3-5-sonnet-latest
      - claude-3-7-sonnet-20250219
      - claude-3-7-sonnet-20250219-v1
      - claude-3-7-sonnet-latest
      - claude-3-haiku
      - claude-3-haiku-20240307
      - claude-3-haiku-20240307-v1
      - claude-3-opus
      - claude-3-opus-20240229
      - claude-3-opus-20240229-v1
      - claude-3-opus-latest
      - claude-3-sonnet
      - claude-3-sonnet-20240229
      - claude-3-sonnet-20240229-v1
      - claude-3.5-haiku
      - claude-3.5-haiku-20241022
      - claude-3.5-sonnet
      - claude-3.5-sonnet-20240620
      - claude-3.7-sonnet
      - claude2
      - codestral-2501
      - codestral-mamba
      - command
      - command-light
      - command-light-text-v14
      - command-nightly
      - command-r
      - command-r-03-2024
      - command-r-08-2024
      - command-r-plus
      - command-r-plus-04-2024
      - command-r-plus-08-2024
      - command-r-plus-v1
      - command-r-v1
      - command-r7b-12-2024
      - command-text-v14
      - dbrx-instruct
      - deepseek-chat
      - deepseek-r1
      - deepseek-r1-distill-llama-70b
      - deepseek-r1-distill-llama-8b
      - deepseek-r1-distill-qwen-1.5b
      - deepseek-r1-distill-qwen-14b
      - deepseek-r1-distill-qwen-32b
      - dolphin-2.6-mixtral-8x7b
      - dolphin-mixtral-8x22b
      - dolphin-mixtral-8x7b
      - dolphin3.0-mistral-24b
      - dolphin3.0-r1-mistral-24b
      - eva-llama-3.33-70b
      - eva-qwen-2.5-32b
      - eva-qwen-2.5-72b
      - fimbulvetr-11b-v2
      - gemini-1.5-flash
      - gemini-1.5-flash-8b
      - gemini-1.5-flash-8b-latest
      - gemini-1.5-flash-latest
      - gemini-1.5-pro
      - gemini-1.5-pro-latest
      - gemini-2.0-flash
      - gemini-2.0-flash-001
      - gemini-2.0-flash-lite-001
      - gemini-2.0-flash-lite-preview-02-05
      - gemini-2.0-flash-thinking-exp-1219
      - gemini-2.0-pro-exp-02-05
      - gemini-flash
      - gemini-flash-1.5
      - gemini-flash-1.5-8b
      - gemini-pro
      - gemini-pro-1.5
      - gemini-pro-vision
      - gemma-1.1-7b-it
      - gemma-2-27b-it
      - gemma-2-9b-it
      - gemma-2b-it
      - gemma-7b-it
      - general
      - goliath-120b
      - gpt-3.5
      - gpt-3.5-turbo
      - gpt-3.5-turbo-0125
      - gpt-3.5-turbo-0613
      - gpt-3.5-turbo-1106
      - gpt-3.5-turbo-16k
      - gpt-3.5-turbo-instruct
      - gpt-4
      - gpt-4-0125-preview
      - gpt-4-0314
      - gpt-4-0613
      - gpt-4-1106-preview
      - gpt-4-1106-vision-preview
      - gpt-4-32k
      - gpt-4-32k-0314
      - gpt-4-turbo
      - gpt-4-turbo-2024-04-09
      - gpt-4-turbo-preview
      - gpt-4-vision-preview
      - gpt-4o
      - gpt-4o-2024-05-13
      - gpt-4o-2024-08-06
      - gpt-4o-2024-11-20
      - gpt-4o-audio-preview-2024-10-01
      - gpt-4o-audio-preview-2024-12-17
      - gpt-4o-mini
      - gpt-4o-mini-2024-07-18
      - gpt-4o-mini-audio-preview
      - gpt-4o-mini-audio-preview-2024-12-17
      - grok-2-1212
      - grok-2-vision-1212
      - grok-beta
      - grok-vision-beta
      - hermes-2-pro-llama-3-8b
      - hermes-3-llama-3.1-405b
      - hermes-3-llama-3.1-70b
      - inflection-3-pi
      - j2-grande-instruct
      - j2-jumbo-instruct
      - j2-mid
      - j2-mid-v1
      - j2-ultra
      - j2-ultra-v1
      - jamba-1-5-large
      - jamba-1-5-large-v1
      - jamba-1-5-mini
      - jamba-1-5-mini-v1
      - jamba-instruct
      - jamba-instruct-v1
      - l3-euryale-70b
      - l3-lunaris-8b
      - l3.1-70b-hanami-x1
      - l3.1-euryale-70b
      - l3.3-euryale-70b
      - lfm-3b
      - lfm-40b
      - lfm-7b
      - llama-2-13b-chat
      - llama-2-70b-chat
      - llama-3-70b-instruct
      - llama-3-8b-instruct
      - llama-3-lumimaid-70b
      - llama-3-lumimaid-8b
      - llama-3-sonar-large-32k-chat
      - llama-3.1-405b
      - llama-3.1-405b-instruct
      - llama-3.1-70b-instruct
      - llama-3.1-8b-instruct
      - llama-3.1-lumimaid-70b
      - llama-3.1-lumimaid-8b
      - llama-3.1-nemotron-70b-instruct
      - llama-3.1-sonar-huge-128k-online
      - llama-3.1-sonar-large-128k-chat
      - llama-3.1-sonar-large-128k-online
      - llama-3.1-sonar-small-128k-chat
      - llama-3.1-sonar-small-128k-online
      - llama-3.1-tulu-3-405b
      - llama-3.2-11b-vision-instruct
      - llama-3.2-1b-instruct
      - llama-3.2-3b-instruct
      - llama-3.2-90b-vision-instruct
      - llama-3.3-70b-instruct
      - llama-guard-2-8b
      - llama-guard-3-8b
      - llama2-13b-chat-v1
      - llama2-70b-chat-v1
      - llama3-1
      - llama3-1-405b-instruct-v1:0
      - llama3-1-70b-instruct-v1
      - llama3-1-70b-instruct-v1:0
      - llama3-1-8b-instruct-v1
      - llama3-1-8b-instruct-v1:0
      - llama3-2
      - llama3-2-11b-instruct-v1
      - llama3-2-1b-instruct-v1
      - llama3-2-3b-instruct-v1
      - llama3-2-90b-instruct-v1
      - llama3-3-70b-instruct-v1
      - llama3-70b-instruct-v1
      - llama3-8b-instruct-v1
      - magnum-72b
      - magnum-v2-72b
      - magnum-v4-72b
      - meta-llama-3.1-8b-instruct
      - midnight-rose-70b
      - minimax-01
      - ministral-3b
      - ministral-8b
      - mistral
      - mistral-7b-instruct
      - mistral-7b-instruct-v0
      - mistral-7b-instruct-v0.1
      - mistral-7b-instruct-v0.3
      - mistral-large
      - mistral-large-2402-v1
      - mistral-large-2407
      - mistral-large-2411
      - mistral-large-latest
      - mistral-medium
      - mistral-nemo
      - mistral-saba
      - mistral-small
      - mistral-small-2402-v1
      - mistral-small-24b-instruct-2501
      - mistral-small-latest
      - mistral-tiny
      - mixtral
      - mixtral-8x22b-instruct
      - mixtral-8x7b
      - mixtral-8x7b-instruct
      - mixtral-8x7b-instruct-v0
      - mn-celeste-12b
      - mn-inferor-12b
      - mn-starcannon-12b
      - mythalion-13b
      - mythomax-l2-13b
      - nai-meta-v1
      - noromaid-20b
      - nous-hermes-2-mixtral-8x7b-dpo
      - nous-hermes-2-vision-7b
      - nous-hermes-llama2-13b
      - nova-canvas-v1
      - nova-lite-v1
      - nova-micro-v1
      - nova-pro-v1
      - nova-reel-v1
      - o1
      - o1-2024-12-17
      - o1-mini
      - o1-mini-2024-09-12
      - o1-preview
      - o1-preview-2024-09-12
      - o3-mini
      - o3-mini-2025-01-31
      - o3-mini-high
      - olympus-premier-v1
      - online-llama
      - openchat-7b
      - openchat_3.5
      - openhermes-2.5-mistral-7b
      - palm-2-chat-bison
      - palm-2-chat-bison-32k
      - palm-2-codechat-bison
      - palm-2-codechat-bison-32k
      - phi-3-medium-128k-instruct
      - phi-3-mini-128k-instruct
      - phi-3.5-mini-128k-instruct
      - phi-4
      - pixtral-12b
      - pixtral-large-2411
      - pixtral-large-latest
      - qvq-72b-preview
      - qwen-2-72b-instruct
      - qwen-2-vl-72b-instruct
      - qwen-2-vl-7b-instruct
      - qwen-2.5-72b-instruct
      - qwen-2.5-7b-instruct
      - qwen-2.5-coder-32b-instruct
      - qwen-max
      - qwen-plus
      - qwen-turbo
      - qwen-vl-plus
      - qwen1-5
      - qwen2
      - qwen2.5-vl-72b-instruct
      - qwq-32b-preview
      - r1-1776
      - remm-slerp-l2-13b
      - rocinante-12b
      - rogue-rose-103b-v0.2
      - scb10x-llama3-typhoon-v1-5-8b-instruct
      - scb10x-llama3-typhoon-v1-5x-4f316
      - sonar
      - sonar-reasoning
      - sorcererlm-8x22b
      - titan
      - titan-text-express-v1
      - titan-text-lite-v1
      - titan-text-premier-v1
      - titan-tg1-large
      - toppy-m-7b
      - unslopnemo-12b
      - weaver
      - wizardlm-2-7b
      - wizardlm-2-8x22b
      - xwin-lm-70b
      - yi-large
      - yi-vision
      - zephyr-orpo-141b-A35b-v0.1
    fetch: false
  # Titles are generated with claude-3-haiku; summarization is disabled.
  titleConvo: true
  titleModel: "claude-3-haiku"
  summarize: false
  summaryModel: "claude-3-haiku"
  # Request parameters removed before the call is sent to this endpoint.
  dropParams:
    - "stream"
  modelDisplayLabel: "APIpie"
  iconURL: "https://raw.githubusercontent.com/fuegovic/lc-config-yaml/main/icons/APIpie.png"
# cohere
# Model list: https://dashboard.cohere.com/playground/chat
# Static model list (fetch: false).
- name: "cohere"
  apiKey: "${COHERE_API_KEY}"
  baseURL: "https://api.cohere.ai/v1"
  models:
    default:
      - c4ai-aya-expanse-32b
      - command
      - command-light-nightly
      - command-r
      - command-r-08-2024
      - command-r-plus
      - command-r-plus-08-2024
      - command-r7b-12-2024
    fetch: false
  modelDisplayLabel: "cohere"
  titleModel: "command"
  # Request parameters removed before the call is sent to this endpoint.
  dropParams:
    - "stop"
    - "user"
    - "frequency_penalty"
    - "presence_penalty"
    - "temperature"
    - "top_p"
# deepseek
# https://platform.deepseek.com/api_keys
# Model list: https://platform.deepseek.com/api-docs/pricing
# Static model list (fetch: false).
- name: "deepseek"
  apiKey: "${DEEPSEEK_API_KEY}"
  baseURL: "https://api.deepseek.com"
  models:
    default:
      - deepseek-chat
      - deepseek-reasoner
    fetch: false
  # Titles are generated with deepseek-chat; summarization is disabled.
  titleConvo: true
  titleModel: "deepseek-chat"
  summarize: false
  summaryModel: "deepseek-chat"
  modelDisplayLabel: "DeepSeek"
# Fireworks.ai
# Models: https://fireworks.ai/models?show=Serverless
# Static model list (fetch: false).
- name: "Fireworks"
  apiKey: "${FIREWORKS_API_KEY}"
  baseURL: "https://api.fireworks.ai/inference/v1"
  models:
    default:
      - accounts/fireworks/models/deepseek-r1
      - accounts/fireworks/models/deepseek-v3
      - accounts/fireworks/models/llama-guard-3-8b
      - accounts/fireworks/models/llama-v3-70b-instruct
      - accounts/fireworks/models/llama-v3-8b-instruct
      - accounts/fireworks/models/llama-v3-8b-instruct-hf
      - accounts/fireworks/models/llama-v3p1-405b-instruct
      - accounts/fireworks/models/llama-v3p1-405b-instruct-long
      - accounts/fireworks/models/llama-v3p1-70b-instruct
      - accounts/fireworks/models/llama-v3p1-8b-instruct
      - accounts/fireworks/models/llama-v3p2-11b-vision-instruct
      - accounts/fireworks/models/llama-v3p2-3b-instruct
      - accounts/fireworks/models/llama-v3p2-90b-vision-instruct
      - accounts/fireworks/models/llama-v3p3-70b-instruct
      - accounts/fireworks/models/mistral-small-24b-instruct-2501
      - accounts/fireworks/models/mixtral-8x22b-instruct
      - accounts/fireworks/models/mixtral-8x7b-instruct
      - accounts/fireworks/models/mythomax-l2-13b
      - accounts/fireworks/models/phi-3-vision-128k-instruct
      - accounts/fireworks/models/qwen-qwq-32b-preview
      - accounts/fireworks/models/qwen2-vl-72b-instruct
      - accounts/fireworks/models/qwen2p5-72b-instruct
      - accounts/fireworks/models/qwen2p5-coder-32b-instruct
      - accounts/mels-e0299e/models/aiderlm-v0
      - accounts/perplexity/models/r1-1776
      - accounts/sentientfoundation/models/dobby-mini-leashed-llama-3-1-8b
      - accounts/sentientfoundation/models/dobby-mini-unhinged-llama-3-1-8b
      - accounts/sentientfoundation/models/dobby-unhinged-llama-3-3-70b-new
      - accounts/yi-01-ai/models/yi-large
    fetch: false
  # Title/summary model must be one this endpoint actually lists. The previous
  # value (llama-v2-7b-chat) is absent from the list above, so a small listed
  # model is used instead.
  titleConvo: true
  titleModel: "accounts/fireworks/models/llama-v3p1-8b-instruct"
  summarize: false
  summaryModel: "accounts/fireworks/models/llama-v3p1-8b-instruct"
  forcePrompt: false
  modelDisplayLabel: "Fireworks"
  # Request parameters removed before the call is sent to this endpoint.
  dropParams:
    - "user"
# GitHub
# Models served through GitHub's inference endpoint; authenticated with GITHUB_TOKEN.
- name: "Github Models"
  iconURL: "https://github.githubassets.com/assets/GitHub-Mark-ea2971cee799.png"
  apiKey: "${GITHUB_TOKEN}"
  baseURL: "https://models.inference.ai.azure.com"
  models:
    default:
      - AI21-Jamba-Instruct
      - Cohere-command-r
      - Cohere-command-r-plus
      - Cohere-embed-v3-english
      - Cohere-embed-v3-multilingual
      - Meta-Llama-3-70B-Instruct
      - Meta-Llama-3-8B-Instruct
      - Meta-Llama-3.1-405B-Instruct
      - Meta-Llama-3.1-70B-Instruct
      - Meta-Llama-3.1-8B-Instruct
      - Mistral-Nemo
      - Mistral-large
      - Mistral-large-2407
      - Mistral-small
      - Phi-3-medium-128k-instruct
      - Phi-3-medium-4k-instruct
      - Phi-3-mini-128k-instruct
      - Phi-3-mini-4k-instruct
      - Phi-3-small-128k-instruct
      - Phi-3-small-8k-instruct
      - Phi-3.5-mini-instruct
      - gpt-4o
      - gpt-4o-mini
      - text-embedding-3-large
      - text-embedding-3-small
    fetch: false
  # Titles are generated with gpt-4o-mini.
  titleConvo: true
  titleModel: "gpt-4o-mini"
# groq
# Model list: https://console.groq.com/settings/limits
# Static model list (fetch: false).
- name: "groq"
  apiKey: "${GROQ_API_KEY}"
  baseURL: "https://api.groq.com/openai/v1/"
  models:
    default:
      - deepseek-r1-distill-llama-70b
      - deepseek-r1-distill-qwen-32b
      - gemma2-9b-it
      - llama-3.1-8b-instant
      - llama-3.2-11b-vision-preview
      - llama-3.2-1b-preview
      - llama-3.2-3b-preview
      - llama-3.2-90b-vision-preview
      - llama-3.3-70b-specdec
      - llama-3.3-70b-versatile
      - llama-guard-3-8b
      - llama3-70b-8192
      - llama3-8b-8192
      - mistral-saba-24b
      - mixtral-8x7b-32768
      - qwen-2.5-32b
      - qwen-2.5-coder-32b
    fetch: false
  # Titles are generated with mixtral-8x7b-32768.
  titleConvo: true
  titleModel: "mixtral-8x7b-32768"
  modelDisplayLabel: "groq"
# HuggingFace
# https://huggingface.co/settings/tokens
# Static model list (fetch: false).
- name: "HuggingFace"
  apiKey: "${HUGGINGFACE_TOKEN}"
  baseURL: "https://api-inference.huggingface.co/v1"
  models:
    default:
      - AIDC-AI/Marco-o1
      - BioMistral/BioMistral-7B
      - CohereForAI/c4ai-command-r-plus
      - CohereForAI/c4ai-command-r-v01
      - HuggingFaceH4/zephyr-7b-alpha
      - HuggingFaceH4/zephyr-7b-beta
      - HuggingFaceTB/SmolLM2-1.7B-Instruct
      - Intel/neural-chat-7b-v3-1
      - MiniMaxAI/MiniMax-Text-01
      - NexaAIDev/Octopus-v2
      - NousResearch/Hermes-2-Pro-Mistral-7B
      - NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO
      - NovaSky-AI/Sky-T1-32B-Preview
      - Open-Orca/Mistral-7B-OpenOrca
      - PygmalionAI/pygmalion-6b
      - Qwen/QwQ-32B-Preview
      - Qwen/Qwen2-72B-Instruct
      - Qwen/Qwen2-7B-Instruct
      - Qwen/Qwen2.5-72B-Instruct
      - Qwen/Qwen2.5-7B-Instruct
      - Qwen/Qwen2.5-Coder-32B-Instruct
      - Qwen/Qwen2.5-Coder-7B-Instruct
      - TheBloke/Mistral-7B-Instruct-v0.2-GGUF
      - TinyLlama/TinyLlama-1.1B-Chat-v1.0
      - berkeley-nest/Starling-LM-7B-alpha
      - cognitivecomputations/dolphin-2.5-mixtral-8x7b
      - cognitivecomputations/dolphin-2.9-llama3-8b
      - databricks/dbrx-base
      - databricks/dbrx-instruct
      - deepseek-ai/DeepSeek-Coder-V2-Instruct
      - deepseek-ai/DeepSeek-R1
      - deepseek-ai/DeepSeek-R1-Distill-Llama-70B
      - deepseek-ai/DeepSeek-R1-Distill-Llama-8B
      - deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B
      - deepseek-ai/DeepSeek-R1-Distill-Qwen-14B
      - deepseek-ai/DeepSeek-R1-Distill-Qwen-32B
      - deepseek-ai/DeepSeek-R1-Distill-Qwen-7B
      - deepseek-ai/DeepSeek-R1-Zero
      - deepseek-ai/DeepSeek-V2-Chat
      - deepseek-ai/DeepSeek-V2.5
      - deepseek-ai/DeepSeek-V3
      - deepseek-ai/deepseek-coder-33b-instruct
      - google/gemma-2-27b-it
      - google/gemma-2-2b-it
      - google/gemma-2-9b-it
      - google/gemma-2b-it
      - google/gemma-7b-it
      - gradientai/Llama-3-8B-Instruct-Gradient-1048k
      - jinaai/ReaderLM-v2
      - jinaai/reader-lm-1.5b
      - mattshumer/Reflection-Llama-3.1-70B
      - meta-llama/Llama-2-13b-chat-hf
      - meta-llama/Llama-2-70b-chat-hf
      - meta-llama/Llama-2-7b-chat-hf
      - meta-llama/Llama-3.1-405B-Instruct
      - meta-llama/Llama-3.1-70B-Instruct
      - meta-llama/Llama-3.1-8B-Instruct
      - meta-llama/Llama-3.2-1B-Instruct
      - meta-llama/Llama-3.2-3B-Instruct
      - meta-llama/Llama-3.3-70B-Instruct
      - meta-llama/Meta-Llama-3-70B-Instruct
      - meta-llama/Meta-Llama-3-8B-Instruct
      - microsoft/Phi-3-mini-128k-instruct
      - microsoft/Phi-3-mini-4k-instruct
      - microsoft/Phi-3-vision-128k-instruct
      - microsoft/Phi-3.5-MoE-instruct
      - microsoft/Phi-3.5-mini-instruct
      - microsoft/phi-4
      - mistralai/Codestral-22B-v0.1
      - mistralai/Mistral-7B-Instruct-v0.1
      - mistralai/Mistral-7B-Instruct-v0.2
      - mistralai/Mistral-7B-Instruct-v0.3
      - mistralai/Mistral-Nemo-Instruct-2407
      - mistralai/Mistral-Small-24B-Instruct-2501
      - mistralai/Mixtral-8x22B-Instruct-v0.1
      - mistralai/Mixtral-8x7B-Instruct-v0.1
      - nvidia/Llama-3.1-Nemotron-70B-Instruct-HF
      - nvidia/Llama3-ChatQA-1.5-8B
      - openchat/openchat_3.5
      - shenzhi-wang/Llama3-8B-Chinese-Chat
      - teknium/OpenHermes-2.5-Mistral-7B
      - tiiuae/falcon-180B-chat
      - tiiuae/falcon-7b-instruct
      - unsloth/DeepSeek-R1-GGUF
      - upstage/SOLAR-10.7B-Instruct-v1.0
      - upstage/solar-pro-preview-instruct
    fetch: false
  # Titles are generated with Nous-Hermes-2-Mixtral-8x7B-DPO.
  titleConvo: true
  titleModel: "NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO"
  # Request parameters removed before the call is sent to this endpoint.
  dropParams:
    - "top_p"
# Hyperbolic
# https://app.hyperbolic.xyz/models
# Static model list (fetch: false).
- name: "Hyperbolic"
  apiKey: "${HYPERBOLIC_API_KEY}"
  baseURL: "https://api.hyperbolic.xyz/v1/"
  models:
    default:
      - NousResearch/Hermes-3-Llama-3.1-70B
      - Qwen/QwQ-32B-Preview
      - Qwen/Qwen2-VL-72B-Instruct
      - Qwen/Qwen2-VL-7B-Instruct
      - Qwen/Qwen2.5-72B-Instruct
      - Qwen/Qwen2.5-Coder-32B-Instruct
      - deepseek-ai/DeepSeek-R1
      - deepseek-ai/DeepSeek-V3
      - meta-llama/Llama-3.2-3B-Instruct
      - meta-llama/Llama-3.3-70B-Instruct
      - meta-llama/Meta-Llama-3-70B-Instruct
      - meta-llama/Meta-Llama-3.1-405B
      - meta-llama/Meta-Llama-3.1-405B-FP8
      - meta-llama/Meta-Llama-3.1-405B-Instruct
      - meta-llama/Meta-Llama-3.1-405B-Instruct-Virtuals
      - meta-llama/Meta-Llama-3.1-70B-Instruct
      - meta-llama/Meta-Llama-3.1-8B-Instruct
      - mistralai/Pixtral-12B-2409
    fetch: false
  # Titles are generated with Meta-Llama-3.1-8B-Instruct.
  titleConvo: true
  titleModel: "meta-llama/Meta-Llama-3.1-8B-Instruct"
  modelDisplayLabel: "Hyperbolic"
  iconURL: "https://app.hyperbolic.xyz/icon.svg"
# kluster.ai
# https://platform.kluster.ai/apikeys
# Static model list (fetch: false).
- name: "Kluster"
  apiKey: "${KLUSTER_API_KEY}"
  baseURL: "https://api.kluster.ai/v1/"
  models:
    default:
      - deepseek-ai/DeepSeek-R1
      - klusterai/Meta-Llama-3.1-405B-Instruct-Turbo
      - klusterai/Meta-Llama-3.1-8B-Instruct-Turbo
      - klusterai/Meta-Llama-3.3-70B-Instruct-Turbo
    fetch: false
  # Titles are generated with the 8B Turbo model.
  titleConvo: true
  titleModel: "klusterai/Meta-Llama-3.1-8B-Instruct-Turbo"
  modelDisplayLabel: "Kluster"
  iconURL: "https://platform.kluster.ai/cropped-fav-1-144x144.png"
# Mistral AI API
# Model list: https://docs.mistral.ai/getting-started/models/
# Static model list (fetch: false).
- name: "Mistral"
  apiKey: "${MISTRAL_API_KEY}"
  baseURL: "https://api.mistral.ai/v1"
  models:
    default:
      - codestral-2405
      - codestral-2411-rc5
      - codestral-2412
      - codestral-2501
      - codestral-latest
      - codestral-mamba-2407
      - codestral-mamba-latest
      - ministral-3b-2410
      - ministral-3b-latest
      - ministral-8b-2410
      - ministral-8b-latest
      - mistral-embed
      - mistral-large-2402
      - mistral-large-2407
      - mistral-large-2411
      - mistral-large-latest
      - mistral-large-pixtral-2411
      - mistral-medium
      - mistral-medium-2312
      - mistral-medium-latest
      - mistral-moderation-2411
      - mistral-moderation-latest
      - mistral-saba-2502
      - mistral-saba-latest
      - mistral-small
      - mistral-small-2312
      - mistral-small-2402
      - mistral-small-2409
      - mistral-small-2501
      - mistral-small-latest
      - mistral-tiny
      - mistral-tiny-2312
      - mistral-tiny-2407
      - mistral-tiny-latest
      - open-codestral-mamba
      - open-mistral-7b
      - open-mistral-nemo
      - open-mistral-nemo-2407
      - open-mixtral-8x22b
      - open-mixtral-8x22b-2404
      - open-mixtral-8x7b
      - pixtral-12b
      - pixtral-12b-2409
      - pixtral-12b-latest
      - pixtral-large-2411
      - pixtral-large-latest
    fetch: false
  # Titles are generated with mistral-tiny via the "completion" title method;
  # summarization is disabled.
  titleConvo: true
  titleMethod: "completion"
  titleModel: "mistral-tiny"
  summarize: false
  summaryModel: "mistral-tiny"
  forcePrompt: false
  modelDisplayLabel: "Mistral"
  # Request parameters removed before the call is sent to this endpoint.
  dropParams:
    - "stop"
    - "user"
    - "frequency_penalty"
    - "presence_penalty"
# NanoGPT
# https://nano-gpt.com/api
# Model list: https://nano-gpt.com/api/models
# Static model list (fetch: false). Each model ID appears once.
- name: "NanoGPT"
  iconURL: "https://nano-gpt.com/logo.png"
  apiKey: "${NANOGPT_API_KEY}"
  baseURL: "https://nano-gpt.com/api/v1/"
  models:
    default:
      - EVA-UNIT-01/EVA-LLaMA-3.33-70B-v0.0
      - EVA-UNIT-01/EVA-LLaMA-3.33-70B-v0.1
      - EVA-UNIT-01/EVA-Qwen2.5-32B-v0.2
      - EVA-UNIT-01/EVA-Qwen2.5-72B-v0.2
      - Envoid/Llama-3.05-NT-Storybreaker-Ministral-70B
      - Envoid/Llama-3.05-Nemotron-Tenyxchat-Storybreaker-70B
      - GalrionSoftworks/MN-LooseCannon-12B-v1
      - Gryphe/MythoMax-L2-13b
      - Infermatic/MN-12B-Inferor-v0.0
      - LatitudeGames/Wayfarer-Large-70B-Llama-3.3
      - Llama-3.1-Tulu-3-405B
      - Llama-3.3+3.1-70B-ArliAI-RPMax-v1.3
      - Llama-3.3-70B-MiraiFanfare
      - MarinaraSpaghetti/NemoMix-Unleashed-12B
      - Meta-Llama-3-1-405B-Instruct-FP8
      - Meta-Llama-3-1-8B-Instruct-FP8
      - Mistral-Nemo-12B-ArliAI-RPMax-v1.2
      - Mistral-Nemo-12B-Wayfarer
      - NeverSleep/Llama-3-Lumimaid-70B-v0.1
      - NeverSleep/Lumimaid-v0.2-70B
      - Nexusflow/Athene-V2-Chat
      - Qwen/QwQ-32B-Preview
      - Qwen/Qwen2.5-Coder-32B-Instruct
      - Qwen2.5-32B-Dazzling-Star-Aurora-32b-v0.0
      - Qwen2.5-32B-EVA-v0.2
      - Sao10K/L3.1-70B-Euryale-v2.2
      - Sao10K/L3.1-70B-Hanami-x1
      - Sao10K/L3.3-70B-Euryale-v2.3
      - Steelskull/L3.3-Damascus-R1
      - Steelskull/L3.3-MS-Evalebis-70b
      - Steelskull/L3.3-MS-Evayale-70B
      - TheDrummer/Anubis-70B-v1
      - TheDrummer/Cydonia-24B-v2
      - TheDrummer/Rocinante-12B-v1.1
      - TheDrummer/UnslopNemo-12B-v4.1
      - VongolaChouko/Starcannon-Unleashed-12B-v1.0
      - abacusai/Dracarys-72B-Instruct
      - aion-labs/aion-1.0
      - aion-labs/aion-1.0-mini
      - aion-labs/aion-rp-llama-3.1-8b
      - amazon/nova-lite-v1
      - amazon/nova-micro-v1
      - amazon/nova-pro-v1
      - anthracite-org/magnum-v2-72b
      - anthracite-org/magnum-v4-72b
      - azure-gpt-4-turbo
      - azure-gpt-4o
      - azure-gpt-4o-mini
      - azure-o1
      - azure-o3-mini
      - chatgpt-4o-latest
      - claude-3-5-haiku-20241022
      - claude-3-5-sonnet-20240620
      - claude-3-5-sonnet-20241022
      - claude-3-7-sonnet-20250219
      - claude-3-7-sonnet-thinking
      - claude-3-7-sonnet-thinking:1024
      - claude-3-7-sonnet-thinking:128000
      - claude-3-7-sonnet-thinking:32768
      - claude-3-7-sonnet-thinking:8192
      - claude-3-opus-20240229
      - cognitivecomputations/dolphin-mixtral-8x22b
      - cohere/command-r
      - cohere/command-r-plus-08-2024
      - deep-research
      - deepclaude
      - deepseek-ai/DeepSeek-R1-Zero
      - deepseek-chat
      - deepseek-chat-cheaper
      - deepseek-r1-llama-70b
      - deepseek-r1-nano
      - deepseek-r1-sambanova
      - deepseek-reasoner
      - deepseek-reasoner-cheaper
      - dolphin-2.9.2-qwen2-72b
      - doubao-1.5-pro-256k
      - doubao-1.5-pro-32k
      - doubao-1.5-vision-pro-32k
      - eva-unit-01/eva-qwen-2.5-72b
      - failspy/Meta-Llama-3-70B-Instruct-abliterated-v3.5
      - free-model
      - gemini-2.0-flash-001
      - gemini-2.0-flash-exp-search
      - gemini-2.0-flash-lite
      - gemini-2.0-flash-thinking-exp-01-21
      - gemini-2.0-flash-thinking-exp-1219
      - gemini-2.0-pro-exp-02-05
      - gemini-exp-1206
      - glm-4
      - glm-4-air
      - glm-4-air-0111
      - glm-4-airx
      - glm-4-flash
      - glm-4-long
      - glm-4-plus
      - glm-4-plus-0111
      - glm-zero-preview
      - google/gemini-flash-1.5
      - gpt-3.5-turbo
      - gpt-4-turbo-preview
      - gpt-4o
      - gpt-4o-2024-08-06
      - gpt-4o-2024-11-20
      - gpt-4o-mini
      - grok-2-1212
      - grok-2-vision-1212
      - grok-3
      - grok-3-deepsearch
      - grok-3-reasoner
      - grok-beta
      - huihui-ai/DeepSeek-R1-Distill-Llama-70B-abliterated
      - huihui-ai/DeepSeek-R1-Distill-Qwen-32B-abliterated
      - huihui-ai/Llama-3.1-Nemotron-70B-Instruct-HF-abliterated
      - huihui-ai/Llama-3.3-70B-Instruct-abliterated
      - inflatebot/MN-12B-Mag-Mell-R1
      - inflection/inflection-3-pi
      - inflection/inflection-3-productivity
      - kimi-k1.5-preview
      - kimi-latest
      - learnlm-1.5-pro-experimental
      - llama-3.3-70b
      - meta-llama/llama-3.1-8b-instruct
      - meta-llama/llama-3.2-3b-instruct
      - meta-llama/llama-3.2-90b-vision-instruct
      - microsoft/wizardlm-2-7b
      - microsoft/wizardlm-2-8x22b
      - minimax/minimax-01
      - mistralai/Mistral-Nemo-Instruct-2407
      - mistralai/mistral-7b-instruct
      - mistralai/mistral-large
      - mistralai/mistral-saba
      - mistralai/mistral-tiny
      - mlabonne/NeuralDaredevil-8B-abliterated
      - model-selector
      - nothingiisreal/L3.1-70B-Celeste-V0.1-BF16
      - nousresearch/hermes-3-llama-3.1-405b
      - nvidia/Llama-3.1-Nemotron-70B-Instruct-HF
      - o1
      - o1-plus
      - o1-preview
      - o3-mini
      - o3-mini-high
      - o3-mini-low
      - qwen-long
      - qwen-max
      - qwen-plus
      - qwen-turbo
      - qwen/qwen-2.5-72b-instruct
      - r1-1776
      - raifle/sorcererlm-8x22b
      - recommended-model
      - sonar
      - sonar-deep-research
      - sonar-pro
      - sonar-reasoning
      - sonar-reasoning-pro
      - step-2-16k
      - step-2-16k-exp
      - step-2-mini
      - undi95/remm-slerp-l2-13b
      - yi-34b-chat-0205
      - yi-34b-chat-200k
      - yi-large
      - yi-large-turbo
      - yi-lightning
      - yi-medium-200k
    fetch: false
  # "current_model" is a LibreChat keyword: titles are generated with whichever
  # model the conversation itself is using.
  titleConvo: true
  titleModel: "current_model"
  modelDisplayLabel: "NanoGPT"
# NVIDIA
# https://build.nvidia.com/explore/discover
# Static model list (fetch: false).
- name: "Nvidia"
  apiKey: "${NVIDIA_API_KEY}"
  baseURL: "https://integrate.api.nvidia.com/v1/"
  models:
    default:
      - 01-ai/yi-large
      - abacusai/dracarys-llama-3.1-70b-instruct
      - adept/fuyu-8b
      - ai21labs/jamba-1.5-large-instruct
      - ai21labs/jamba-1.5-mini-instruct
      - aisingapore/sea-lion-7b-instruct
      - baai/bge-m3
      - baichuan-inc/baichuan2-13b-chat
      - bigcode/starcoder2-15b
      - bigcode/starcoder2-7b
      - databricks/dbrx-instruct
      - deepseek-ai/deepseek-coder-6.7b-instruct
      - deepseek-ai/deepseek-r1
      - google/codegemma-1.1-7b
      - google/codegemma-7b
      - google/deplot
      - google/gemma-2-27b-it
      - google/gemma-2-2b-it
      - google/gemma-2-9b-it
      - google/gemma-2b
      - google/gemma-7b
      - google/paligemma
      - google/recurrentgemma-2b
      - google/shieldgemma-9b
      - ibm/granite-3.0-3b-a800m-instruct
      - ibm/granite-3.0-8b-instruct
      - ibm/granite-34b-code-instruct
      - ibm/granite-8b-code-instruct
      - ibm/granite-guardian-3.0-8b
      - igenius/colosseum_355b_instruct_16k
      - igenius/italia_10b_instruct_16k
      - institute-of-science-tokyo/llama-3.1-swallow-70b-instruct-v0.1
      - institute-of-science-tokyo/llama-3.1-swallow-8b-instruct-v0.1
      - mediatek/breeze-7b-instruct
      - meta/codellama-70b
      - meta/llama-3.1-405b-instruct
      - meta/llama-3.1-70b-instruct
      - meta/llama-3.1-8b-instruct
      - meta/llama-3.2-1b-instruct
      - meta/llama-3.2-3b-instruct
      - meta/llama-3.3-70b-instruct
      - meta/llama2-70b
      - meta/llama3-70b-instruct
      - meta/llama3-8b-instruct
      - microsoft/kosmos-2
      - microsoft/phi-3-medium-128k-instruct
      - microsoft/phi-3-medium-4k-instruct
      - microsoft/phi-3-mini-128k-instruct
      - microsoft/phi-3-mini-4k-instruct
      - microsoft/phi-3-small-128k-instruct
      - microsoft/phi-3-small-8k-instruct
      - microsoft/phi-3-vision-128k-instruct
      - microsoft/phi-3.5-mini-instruct
      - microsoft/phi-3.5-moe-instruct
      - microsoft/phi-3.5-vision-instruct
      - microsoft/phi-4-mini-instruct
      - mistralai/codestral-22b-instruct-v0.1
      - mistralai/mamba-codestral-7b-v0.1
      - mistralai/mathstral-7b-v0.1
      - mistralai/mistral-7b-instruct-v0.2
      - mistralai/mistral-7b-instruct-v0.3
      - mistralai/mistral-large
      - mistralai/mistral-large-2-instruct
      - mistralai/mistral-small-24b-instruct
      - mistralai/mixtral-8x22b-instruct-v0.1
      - mistralai/mixtral-8x22b-v0.1
      - mistralai/mixtral-8x7b-instruct-v0.1
      - nv-mistralai/mistral-nemo-12b-instruct
      - nvidia/embed-qa-4
      - nvidia/llama-3.1-nemoguard-8b-content-safety
      - nvidia/llama-3.1-nemoguard-8b-topic-control
      - nvidia/llama-3.1-nemotron-51b-instruct
      - nvidia/llama-3.1-nemotron-70b-instruct
      - nvidia/llama-3.1-nemotron-70b-reward
      - nvidia/llama-3.2-nv-embedqa-1b-v1
      - nvidia/llama-3.2-nv-embedqa-1b-v2
      - nvidia/llama3-chatqa-1.5-70b
      - nvidia/llama3-chatqa-1.5-8b
      - nvidia/mistral-nemo-minitron-8b-8k-instruct
      - nvidia/mistral-nemo-minitron-8b-base
      - nvidia/nemotron-4-340b-instruct
      - nvidia/nemotron-4-340b-reward
      - nvidia/nemotron-4-mini-hindi-4b-instruct
      - nvidia/nemotron-mini-4b-instruct
      - nvidia/neva-22b
      - nvidia/nv-embed-v1
      - nvidia/nv-embedqa-e5-v5
      - nvidia/nv-embedqa-mistral-7b-v2
      - nvidia/nvclip
      - nvidia/usdcode-llama-3.1-70b-instruct
      - nvidia/vila
      - qwen/qwen2-7b-instruct
      - qwen/qwen2.5-7b-instruct
      - qwen/qwen2.5-coder-32b-instruct
      - qwen/qwen2.5-coder-7b-instruct
      - rakuten/rakutenai-7b-chat
      - rakuten/rakutenai-7b-instruct
      - snowflake/arctic-embed-l
      - thudm/chatglm3-6b
      - tiiuae/falcon3-7b-instruct
      - tokyotech-llm/llama-3-swallow-70b-instruct-v0.1
      - upstage/solar-10.7b-instruct
      - writer/palmyra-creative-122b
      - writer/palmyra-fin-70b-32k
      - writer/palmyra-med-70b
      - writer/palmyra-med-70b-32k
      - yentinglin/llama-3-taiwan-70b-instruct
      - zyphra/zamba2-7b-instruct
    fetch: false
  # Titles are generated with nemotron-mini-4b-instruct.
  titleConvo: true
  titleModel: "nvidia/nemotron-mini-4b-instruct"
  modelDisplayLabel: "Nvidia"
  iconURL: "https://raw.githubusercontent.com/LibreChat-AI/librechat-config-yaml/refs/heads/main/icons/nvidia.png"
# OpenRouter.ai
# Model list: https://openrouter.ai/models
# Script to fetch models: https://github.com/LibreChat-AI/librechat-config-yaml/blob/main/scripts/openrouter.py
- name: "OpenRouter"
apiKey: "${OPENROUTER_KEY}"
baseURL: "https://openrouter.ai/api/v1"
models:
default:
- openrouter/auto
- '---FREE---'
- cognitivecomputations/dolphin3.0-mistral-24b:free
- cognitivecomputations/dolphin3.0-r1-mistral-24b:free
- deepseek/deepseek-chat:free
- deepseek/deepseek-r1-distill-llama-70b:free
- deepseek/deepseek-r1:free
- google/gemini-2.0-flash-exp:free
- google/gemini-2.0-flash-lite-preview-02-05:free
- google/gemini-2.0-flash-thinking-exp-1219:free
- google/gemini-2.0-flash-thinking-exp:free
- google/gemini-2.0-pro-exp-02-05:free
- google/gemini-exp-1206:free
- google/gemma-2-9b-it:free
- google/learnlm-1.5-pro-experimental:free
- gryphe/mythomax-l2-13b:free
- huggingfaceh4/zephyr-7b-beta:free
- meta-llama/llama-3-8b-instruct:free
- meta-llama/llama-3.1-8b-instruct:free
- meta-llama/llama-3.2-11b-vision-instruct:free
- meta-llama/llama-3.2-1b-instruct:free
- meta-llama/llama-3.3-70b-instruct:free
- microsoft/phi-3-medium-128k-instruct:free
- microsoft/phi-3-mini-128k-instruct:free
- mistralai/mistral-7b-instruct:free
- mistralai/mistral-nemo:free
- mistralai/mistral-small-24b-instruct-2501:free
- nvidia/llama-3.1-nemotron-70b-instruct:free
- openchat/openchat-7b:free
- qwen/qwen-vl-plus:free
- qwen/qwen2.5-vl-72b-instruct:free
- sophosympatheia/rogue-rose-103b-v0.2:free
- undi95/toppy-m-7b:free
- '---BETA---'
- anthropic/claude-2.0:beta
- anthropic/claude-2.1:beta
- anthropic/claude-2:beta
- anthropic/claude-3-haiku:beta
- anthropic/claude-3-opus:beta
- anthropic/claude-3-sonnet:beta
- anthropic/claude-3.5-haiku-20241022:beta
- anthropic/claude-3.5-haiku:beta
- anthropic/claude-3.5-sonnet-20240620:beta
- anthropic/claude-3.5-sonnet:beta
- anthropic/claude-3.7-sonnet:beta
- '---EXTENDED---'
- neversleep/llama-3-lumimaid-8b:extended
- openai/gpt-4o:extended
- '---AI21---'
- ai21/jamba-1-5-large
- ai21/jamba-1-5-mini
- ai21/jamba-instruct
- '---AION-LABS---'
- aion-labs/aion-1.0
- aion-labs/aion-1.0-mini
- aion-labs/aion-rp-llama-3.1-8b
- '---AMAZON---'
- amazon/nova-lite-v1
- amazon/nova-micro-v1
- amazon/nova-pro-v1
- '---ANTHROPIC---'
- anthropic/claude-2
- anthropic/claude-2.0
- anthropic/claude-2.1
- anthropic/claude-3-7-sonnet
- anthropic/claude-3-haiku
- anthropic/claude-3-opus
- anthropic/claude-3-sonnet
- anthropic/claude-3.5-haiku
- anthropic/claude-3.5-haiku-20241022
- anthropic/claude-3.5-sonnet
- anthropic/claude-3.5-sonnet-20240620
- anthropic/claude-3.7-sonnet
- anthropic/claude-3.7-sonnet:thinking
- '---COHERE---'
- cohere/command
- cohere/command-r
- cohere/command-r-03-2024
- cohere/command-r-08-2024
- cohere/command-r-plus
- cohere/command-r-plus-04-2024
- cohere/command-r-plus-08-2024
- cohere/command-r7b-12-2024
- '---DEEPSEEK---'
- deepseek/deepseek-chat
- deepseek/deepseek-chat-v2.5
- deepseek/deepseek-r1
- deepseek/deepseek-r1-distill-llama-70b
- deepseek/deepseek-r1-distill-llama-8b
- deepseek/deepseek-r1-distill-qwen-1.5b
- deepseek/deepseek-r1-distill-qwen-14b
- deepseek/deepseek-r1-distill-qwen-32b
- '---EVA-UNIT-01---'
- eva-unit-01/eva-llama-3.33-70b
- eva-unit-01/eva-qwen-2.5-32b
- eva-unit-01/eva-qwen-2.5-72b
- '---GOOGLE---'
- google/gemini-2.0-flash-001
- google/gemini-2.0-flash-lite-001
- google/gemini-flash-1.5
- google/gemini-flash-1.5-8b
- google/gemini-flash-1.5-8b-exp
- google/gemini-pro
- google/gemini-pro-1.5
- google/gemini-pro-vision
- google/gemma-2-27b-it
- google/gemma-2-9b-it
- google/gemma-7b-it
- google/palm-2-chat-bison
- google/palm-2-chat-bison-32k
- google/palm-2-codechat-bison
- google/palm-2-codechat-bison-32k
- '---LIQUID---'
- liquid/lfm-3b
- liquid/lfm-40b
- liquid/lfm-7b
- '---META-LLAMA---'
- meta-llama/llama-2-13b-chat
- meta-llama/llama-2-70b-chat
- meta-llama/llama-3-70b-instruct
- meta-llama/llama-3-8b-instruct
- meta-llama/llama-3.1-405b
- meta-llama/llama-3.1-405b-instruct
- meta-llama/llama-3.1-70b-instruct
- meta-llama/llama-3.1-8b-instruct
- meta-llama/llama-3.2-11b-vision-instruct
- meta-llama/llama-3.2-1b-instruct
- meta-llama/llama-3.2-3b-instruct
- meta-llama/llama-3.2-90b-vision-instruct
- meta-llama/llama-3.3-70b-instruct
- meta-llama/llama-guard-2-8b
- meta-llama/llama-guard-3-8b
- '---MICROSOFT---'
- microsoft/phi-3-medium-128k-instruct
- microsoft/phi-3-mini-128k-instruct
- microsoft/phi-3.5-mini-128k-instruct
- microsoft/phi-4
- microsoft/wizardlm-2-7b
- microsoft/wizardlm-2-8x22b
- '---MISTRALAI---'
- mistralai/codestral-2501
- mistralai/codestral-mamba
- mistralai/ministral-3b
- mistralai/ministral-8b
- mistralai/mistral-7b-instruct
- mistralai/mistral-7b-instruct-v0.1
- mistralai/mistral-7b-instruct-v0.3
- mistralai/mistral-large
- mistralai/mistral-large-2407
- mistralai/mistral-large-2411
- mistralai/mistral-medium
- mistralai/mistral-nemo
- mistralai/mistral-saba
- mistralai/mistral-small
- mistralai/mistral-small-24b-instruct-2501
- mistralai/mistral-tiny
- mistralai/mixtral-8x22b-instruct
- mistralai/mixtral-8x7b
- mistralai/mixtral-8x7b-instruct
- mistralai/pixtral-12b
- mistralai/pixtral-large-2411
- '---NEVERSLEEP---'
- neversleep/llama-3-lumimaid-70b
- neversleep/llama-3-lumimaid-8b
- neversleep/llama-3.1-lumimaid-70b
- neversleep/llama-3.1-lumimaid-8b
- neversleep/noromaid-20b
- '---NOUSRESEARCH---'
- nousresearch/hermes-2-pro-llama-3-8b
- nousresearch/hermes-3-llama-3.1-405b
- nousresearch/hermes-3-llama-3.1-70b
- nousresearch/nous-hermes-2-mixtral-8x7b-dpo
- nousresearch/nous-hermes-llama2-13b
- '---OPENAI---'
- openai/chatgpt-4o-latest
- openai/gpt-3.5-turbo
- openai/gpt-3.5-turbo-0125
- openai/gpt-3.5-turbo-0613
- openai/gpt-3.5-turbo-1106
- openai/gpt-3.5-turbo-16k
- openai/gpt-3.5-turbo-instruct
- openai/gpt-4
- openai/gpt-4-0314
- openai/gpt-4-1106-preview
- openai/gpt-4-32k
- openai/gpt-4-32k-0314
- openai/gpt-4-turbo
- openai/gpt-4-turbo-preview
- openai/gpt-4o
- openai/gpt-4o-2024-05-13
- openai/gpt-4o-2024-08-06
- openai/gpt-4o-2024-11-20
- openai/gpt-4o-mini
- openai/gpt-4o-mini-2024-07-18
- openai/o1
- openai/o1-mini
- openai/o1-mini-2024-09-12
- openai/o1-preview
- openai/o1-preview-2024-09-12
- openai/o3-mini
- openai/o3-mini-high
- '---PERPLEXITY---'
- perplexity/llama-3.1-sonar-huge-128k-online
- perplexity/llama-3.1-sonar-large-128k-chat
- perplexity/llama-3.1-sonar-large-128k-online
- perplexity/llama-3.1-sonar-small-128k-chat
- perplexity/llama-3.1-sonar-small-128k-online
- perplexity/r1-1776
- perplexity/sonar
- perplexity/sonar-reasoning
- '---QWEN---'
- qwen/qvq-72b-preview
- qwen/qwen-2-72b-instruct
- qwen/qwen-2-vl-72b-instruct
- qwen/qwen-2-vl-7b-instruct
- qwen/qwen-2.5-72b-instruct
- qwen/qwen-2.5-7b-instruct
- qwen/qwen-2.5-coder-32b-instruct
- qwen/qwen-max
- qwen/qwen-plus
- qwen/qwen-turbo
- qwen/qwq-32b-preview
- '---SAO10K---'
- sao10k/fimbulvetr-11b-v2
- sao10k/l3-euryale-70b
- sao10k/l3-lunaris-8b
- sao10k/l3.1-70b-hanami-x1
- sao10k/l3.1-euryale-70b
- sao10k/l3.3-euryale-70b
- '---X-AI---'
- x-ai/grok-2-1212
- x-ai/grok-2-vision-1212
- x-ai/grok-beta
- x-ai/grok-vision-beta
- '---OTHERS---'
- 01-ai/yi-large
- aetherwiing/mn-starcannon-12b
- allenai/llama-3.1-tulu-3-405b
- alpindale/goliath-120b
- alpindale/magnum-72b
- anthracite-org/magnum-v2-72b
- anthracite-org/magnum-v4-72b
- cognitivecomputations/dolphin-mixtral-8x22b
- cognitivecomputations/dolphin-mixtral-8x7b
- databricks/dbrx-instruct
- gryphe/mythomax-l2-13b
- infermatic/mn-inferor-12b
- inflatebot/mn-mag-mell-r1
- inflection/inflection-3-pi
- inflection/inflection-3-productivity
- jondurbin/airoboros-l2-70b
- mancer/weaver
- minimax/minimax-01
- nothingiisreal/mn-celeste-12b
- nvidia/llama-3.1-nemotron-70b-instruct
- openchat/openchat-7b
- pygmalionai/mythalion-13b
- raifle/sorcererlm-8x22b
- sophosympatheia/midnight-rose-70b
- teknium/openhermes-2.5-mistral-7b
- thedrummer/rocinante-12b
- thedrummer/unslopnemo-12b
- undi95/remm-slerp-l2-13b
- undi95/toppy-m-7b
- xwin-lm/xwin-lm-70b
fetch: false
dropParams:
- "stop"
titleConvo: true
titleModel: "openai/gpt-4o-mini"
summarize: false
summaryModel: "openai/gpt-4o-mini"
forcePrompt: false
modelDisplayLabel: "OpenRouter"
# Perplexity
# Model list: https://docs.perplexity.ai/docs/model-cards
- name: "Perplexity"
  # Key is injected through the PERPLEXITY_API_KEY placeholder.
  apiKey: "${PERPLEXITY_API_KEY}"
  baseURL: "https://api.perplexity.ai/"
  models:
    # Static model list offered for this endpoint.
    default:
      - r1-1776
      - sonar
      - sonar-deep-research
      - sonar-pro
      - sonar-reasoning
      - sonar-reasoning-pro
    fetch: false  # fetching list of models is not supported
  titleConvo: true
  # The title/summary model has to be one this endpoint actually serves.
  # The former "llama-3.1-sonar-small-128k-chat" is not in the list above,
  # so both settings point at the listed base "sonar" model instead.
  titleModel: "sonar"
  summarize: false
  summaryModel: "sonar"
  forcePrompt: false
  # Request parameters removed before the call is sent to this endpoint.
  dropParams:
    - "stop"
    - "frequency_penalty"
  modelDisplayLabel: "Perplexity"
# SambaNova
# https://cloud.sambanova.ai/apis
- name: "SambaNova"
  # Presentation: label and icon for this endpoint.
  modelDisplayLabel: "SambaNova"
  iconURL: "https://sambanova.ai/hubfs/logotype_sambanova_orange.png"
  # Connection: key comes from the SAMBANOVA_API_KEY placeholder.
  baseURL: "https://api.sambanova.ai/v1/"
  apiKey: "${SAMBANOVA_API_KEY}"
  # Conversation titles are generated with a model from the list below.
  titleConvo: true
  titleModel: "Meta-Llama-3.1-8B-Instruct"
  models:
    # Use the static list below rather than fetching one from the API.
    fetch: false
    default:
      - DeepSeek-R1
      - DeepSeek-R1-Distill-Llama-70B
      - Llama-3.1-Tulu-3-405B
      - Llama-3.2-11B-Vision-Instruct
      - Llama-3.2-90B-Vision-Instruct
      - Meta-Llama-3.1-405B-Instruct
      - Meta-Llama-3.1-70B-Instruct
      - Meta-Llama-3.1-8B-Instruct
      - Meta-Llama-3.2-1B-Instruct
      - Meta-Llama-3.2-3B-Instruct
      - Meta-Llama-3.3-70B-Instruct
      - Meta-Llama-Guard-3-8B
      - QwQ-32B-Preview
      - Qwen2-Audio-7B-Instruct
      - Qwen2.5-72B-Instruct
      - Qwen2.5-Coder-32B-Instruct
# together.ai
# https://api.together.ai/settings/api-keys
# Model list: https://docs.together.ai/docs/inference-models
- name: "together.ai"
  # Key is injected through the TOGETHERAI_API_KEY placeholder.
  apiKey: "${TOGETHERAI_API_KEY}"
  baseURL: "https://api.together.xyz"
  models:
    # Static model list offered for this endpoint.
    default:
      - Gryphe/MythoMax-L2-13b
      - Gryphe/MythoMax-L2-13b-Lite
      - NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO
      - Qwen/QwQ-32B-Preview
      - Qwen/Qwen2-72B-Instruct
      - Qwen/Qwen2-VL-72B-Instruct
      - Qwen/Qwen2.5-72B-Instruct-Turbo
      - Qwen/Qwen2.5-7B-Instruct-Turbo
      - Qwen/Qwen2.5-Coder-32B-Instruct
      - databricks/dbrx-instruct
      - deepseek-ai/DeepSeek-R1
      - deepseek-ai/DeepSeek-R1-Distill-Llama-70B
      - deepseek-ai/DeepSeek-R1-Distill-Llama-70B-free
      - deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B
      - deepseek-ai/DeepSeek-R1-Distill-Qwen-14B
      - deepseek-ai/DeepSeek-V3
      - google/gemma-2-27b-it
      - google/gemma-2-9b-it
      - google/gemma-2b-it
      - meta-llama/Llama-2-13b-chat-hf
      - meta-llama/Llama-2-7b-chat-hf
      - meta-llama/Llama-3-70b-chat-hf
      - meta-llama/Llama-3-8b-chat-hf
      - meta-llama/Llama-3.2-11B-Vision-Instruct-Turbo
      - meta-llama/Llama-3.2-3B-Instruct-Turbo
      - meta-llama/Llama-3.2-90B-Vision-Instruct-Turbo
      - meta-llama/Llama-3.3-70B-Instruct-Turbo
      - meta-llama/Llama-3.3-70B-Instruct-Turbo-Free
      - meta-llama/Llama-Vision-Free
      - meta-llama/Meta-Llama-3-70B-Instruct-Lite
      - meta-llama/Meta-Llama-3-70B-Instruct-Turbo
      - meta-llama/Meta-Llama-3-8B-Instruct-Lite
      - meta-llama/Meta-Llama-3-8B-Instruct-Turbo
      - meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo
      - meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo
      - meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo
      - meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo-128K
      - meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo-classifier
      - microsoft/WizardLM-2-8x22B
      - mistralai/Mistral-7B-Instruct-v0.1
      - mistralai/Mistral-7B-Instruct-v0.2
      - mistralai/Mistral-7B-Instruct-v0.3
      - mistralai/Mistral-Small-24B-Instruct-2501
      - mistralai/Mixtral-8x22B-Instruct-v0.1
      - mistralai/Mixtral-8x7B-Instruct-v0.1
      - nvidia/Llama-3.1-Nemotron-70B-Instruct-HF
      - scb10x/scb10x-llama3-1-typhoon2-60256
      - scb10x/scb10x-llama3-typhoon-v1-5-8b-instruct
      - scb10x/scb10x-llama3-typhoon-v1-5x-4f316
      - togethercomputer/MoA-1
      - togethercomputer/MoA-1-Turbo
      - upstage/SOLAR-10.7B-Instruct-v1.0
    # Use the static list above rather than fetching one from the API.
    fetch: false
  titleConvo: true
  # The title/summary model has to be one this endpoint actually serves.
  # The former "togethercomputer/llama-2-7b-chat" is not in the list above,
  # so both settings point at a small instruct model that is listed.
  titleModel: "meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo"
  summarize: false
  summaryModel: "meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo"
  forcePrompt: false
  modelDisplayLabel: "together.ai"
# Unify
# Model list: https://unify.ai/chat
- name: "Unify"
  # Connection: key comes from the UNIFY_API_KEY placeholder.
  baseURL: "https://api.unify.ai/v0/"
  apiKey: "${UNIFY_API_KEY}"
  # Conversation titles are generated with a model from the list below.
  titleConvo: true
  titleModel: "gpt-4o-mini@openai"
  # Request parameters removed before the call is sent to this endpoint.
  dropParams:
    - "stop"
    - "user"
    - "frequency_penalty"
    - "presence_penalty"
  models:
    # Use the static list below rather than fetching one from the API.
    fetch: false
    # Ids follow the "<model>@<provider>" pattern.
    default:
      - chatgpt-4o-latest@openai
      - claude-3-haiku@anthropic
      - claude-3-haiku@aws-bedrock
      - claude-3-haiku@vertex-ai
      - claude-3-opus@anthropic
      - claude-3-opus@aws-bedrock
      - claude-3-opus@vertex-ai
      - claude-3-sonnet@anthropic
      - claude-3-sonnet@aws-bedrock
      - claude-3.5-haiku@anthropic
      - claude-3.5-haiku@aws-bedrock
      - claude-3.5-haiku@replicate
      - claude-3.5-haiku@vertex-ai
      - claude-3.5-sonnet-20240620@anthropic
      - claude-3.5-sonnet-20240620@aws-bedrock
      - claude-3.5-sonnet-20240620@vertex-ai
      - claude-3.5-sonnet@anthropic
      - claude-3.5-sonnet@aws-bedrock
      - claude-3.5-sonnet@replicate
      - claude-3.5-sonnet@vertex-ai
      - claude-3.7-sonnet@anthropic
      - claude-3.7-sonnet@aws-bedrock
      - claude-3.7-sonnet@vertex-ai
      - command-r-plus@aws-bedrock
      - deepseek-r1@deepinfra
      - deepseek-r1@deepseek
      - deepseek-r1@fireworks-ai
      - deepseek-r1@replicate
      - deepseek-r1@together-ai
      - deepseek-v3@deepinfra
      - deepseek-v3@deepseek
      - deepseek-v3@fireworks-ai
      - deepseek-v3@together-ai
      - gemini-1.0-pro-001@vertex-ai
      - gemini-1.0-pro-002@vertex-ai
      - gemini-1.0-pro@vertex-ai
      - gemini-1.5-flash-001@vertex-ai
      - gemini-1.5-flash-002@vertex-ai
      - gemini-1.5-flash@vertex-ai
      - gemini-1.5-pro-001@vertex-ai
      - gemini-1.5-pro-002@vertex-ai
      - gemini-1.5-pro@vertex-ai
      - gemini-2.0-flash-lite@vertex-ai
      - gemini-2.0-flash@vertex-ai
      - gemma-2-27b-it@deepinfra
      - gemma-2-27b-it@together-ai
      - gemma-2-9b-it@deepinfra
      - gemma-2-9b-it@groq
      - gemma-2-9b-it@lepton-ai
      - gemma-2-9b-it@together-ai
      - gpt-3.5-turbo@openai
      - gpt-4-turbo@openai
      - gpt-4@openai
      - gpt-4o-2024-05-13@openai
      - gpt-4o-2024-08-06@openai
      - gpt-4o-2024-11-20@openai
      - gpt-4o-mini@openai
      - gpt-4o@openai
      - grok-2-vision@xai
      - grok-2@xai
      - llama-3-70b-chat@aws-bedrock
      - llama-3-70b-chat@deepinfra
      - llama-3-70b-chat@fireworks-ai
      - llama-3-70b-chat@groq
      - llama-3-70b-chat@replicate
      - llama-3-70b-chat@together-ai
      - llama-3-8b-chat@aws-bedrock
      - llama-3-8b-chat@deepinfra
      - llama-3-8b-chat@fireworks-ai
      - llama-3-8b-chat@groq
      - llama-3-8b-chat@replicate
      - llama-3-8b-chat@together-ai
      - llama-3.1-405b-chat@aws-bedrock
      - llama-3.1-405b-chat@deepinfra
      - llama-3.1-405b-chat@fireworks-ai
      - llama-3.1-405b-chat@replicate
      - llama-3.1-405b-chat@together-ai
      - llama-3.1-405b-chat@vertex-ai
      - llama-3.1-70b-chat@aws-bedrock
      - llama-3.1-70b-chat@deepinfra
      - llama-3.1-70b-chat@fireworks-ai
      - llama-3.1-70b-chat@together-ai
      - llama-3.1-70b-chat@vertex-ai
      - llama-3.1-8b-chat@aws-bedrock
      - llama-3.1-8b-chat@deepinfra
      - llama-3.1-8b-chat@fireworks-ai
      - llama-3.1-8b-chat@groq
      - llama-3.1-8b-chat@lepton-ai
      - llama-3.1-8b-chat@together-ai
      - llama-3.1-8b-chat@vertex-ai
      - llama-3.1-nemotron-70b-chat@deepinfra
      - llama-3.2-11b-chat@deepinfra
      - llama-3.2-11b-chat@fireworks-ai
      - llama-3.2-11b-chat@groq
      - llama-3.2-11b-chat@together-ai
      - llama-3.2-11b-chat@vertex-ai
      - llama-3.2-1b-chat@aws-bedrock
      - llama-3.2-1b-chat@deepinfra
      - llama-3.2-1b-chat@groq
      - llama-3.2-1b-chat@lepton-ai
      - llama-3.2-3b-chat@aws-bedrock
      - llama-3.2-3b-chat@deepinfra
      - llama-3.2-3b-chat@fireworks-ai
      - llama-3.2-3b-chat@groq
      - llama-3.2-3b-chat@lepton-ai
      - llama-3.2-3b-chat@together-ai
      - llama-3.2-90b-chat@deepinfra
      - llama-3.2-90b-chat@fireworks-ai
      - llama-3.2-90b-chat@groq
      - llama-3.2-90b-chat@together-ai
      - llama-3.2-90b-chat@vertex-ai
      - llama-3.3-70b-chat@aws-bedrock
      - llama-3.3-70b-chat@deepinfra
      - llama-3.3-70b-chat@fireworks-ai
      - llama-3.3-70b-chat@groq
      - llama-3.3-70b-chat@lepton-ai
      - llama-3.3-70b-chat@together-ai
      - ministral-3b@mistral-ai
      - ministral-8b@mistral-ai
      - mistral-7b-instruct-v0.2@aws-bedrock
      - mistral-7b-instruct-v0.3@deepinfra
      - mistral-7b-instruct-v0.3@lepton-ai
      - mistral-7b-instruct-v0.3@mistral-ai
      - mistral-7b-instruct-v0.3@together-ai
      - mistral-large@aws-bedrock
      - mistral-large@mistral-ai
      - mistral-large@vertex-ai
      - mistral-nemo@deepinfra
      - mistral-nemo@lepton-ai
      - mistral-nemo@mistral-ai
      - mistral-nemo@vertex-ai
      - mistral-small@deepinfra
      - mistral-small@fireworks-ai
      - mistral-small@mistral-ai
      - mistral-small@together-ai
      - mixtral-8x22b-instruct-v0.1@fireworks-ai
      - mixtral-8x22b-instruct-v0.1@mistral-ai
      - mixtral-8x22b-instruct-v0.1@together-ai
      - mixtral-8x7b-instruct-v0.1@aws-bedrock
      - mixtral-8x7b-instruct-v0.1@deepinfra
      - mixtral-8x7b-instruct-v0.1@fireworks-ai
      - mixtral-8x7b-instruct-v0.1@groq
      - mixtral-8x7b-instruct-v0.1@lepton-ai
      - mixtral-8x7b-instruct-v0.1@mistral-ai
      - mixtral-8x7b-instruct-v0.1@together-ai
      - o1-mini@openai
      - o1@openai
      - o3-mini@openai
      - qwen-2-72b-instruct@together-ai
      - qwen-2.5-72b-instruct@deepinfra
      - qwen-2.5-72b-instruct@fireworks-ai
      - qwen-2.5-72b-instruct@together-ai
      - qwen-2.5-7b-instruct@deepinfra
      - qwen-2.5-7b-instruct@together-ai
      - qwen-2.5-coder-32b-instruct@deepinfra
      - qwen-2.5-coder-32b-instruct@fireworks-ai
      - qwen-2.5-coder-32b-instruct@groq
      - qwen-2.5-coder-32b-instruct@together-ai
      - qwen-qwq-32b-preview@fireworks-ai
      - qwen-qwq-32b-preview@together-ai
# xAI
# https://x.ai/api
- name: "xai"
  # Presentation: label for this endpoint.
  modelDisplayLabel: "Grok"
  # Connection: key comes from the XAI_API_KEY placeholder.
  baseURL: "https://api.x.ai/v1"
  apiKey: "${XAI_API_KEY}"
  # Title and summary settings; both name the single model listed below.
  titleConvo: true
  titleMethod: "completion"
  titleModel: "grok-beta"
  summarize: false
  summaryModel: "grok-beta"
  forcePrompt: false
  models:
    # Use the static list below rather than fetching one from the API.
    fetch: false
    default:
      - "grok-beta"