Models

All models available

zai-org/GLM-4.6V-Flash

zai-org/GLM-4.6V-Flash

-

zai-org/GLM-4.6V

zai-org/GLM-4.6V

-

ServiceNow-AI/Apriel-1.6-15b-Thinker

ServiceNow-AI/Apriel-1.6-15b-Thinker

-

EssentialAI/rnj-1-instruct

EssentialAI/rnj-1-instruct

-

deepseek-ai/DeepSeek-V3.2

deepseek-ai/DeepSeek-V3.2

-

zai-org/AutoGLM-Phone-9B-Multilingual

zai-org/AutoGLM-Phone-9B-Multilingual

-

meta-llama/Llama-3.1-8B-Instruct

meta-llama/Llama-3.1-8B-Instruct

-

openai/gpt-oss-20b

openai/gpt-oss-20b

-

zai-org/GLM-4.6

zai-org/GLM-4.6

-

Qwen/Qwen3-4B-Instruct-2507

Qwen/Qwen3-4B-Instruct-2507

-

Qwen/Qwen3-VL-8B-Instruct

Qwen/Qwen3-VL-8B-Instruct

-

moonshotai/Kimi-K2-Thinking

moonshotai/Kimi-K2-Thinking

-

openai/gpt-oss-120b

openai/gpt-oss-120b

-

zai-org/GLM-4.6V-FP8

zai-org/GLM-4.6V-FP8

-

MiniMaxAI/MiniMax-M2

MiniMaxAI/MiniMax-M2

-

meta-llama/Llama-3.2-1B-Instruct

meta-llama/Llama-3.2-1B-Instruct

-

deepseek-ai/DeepSeek-V3.2-Exp

deepseek-ai/DeepSeek-V3.2-Exp

-

Qwen/Qwen3-VL-30B-A3B-Instruct

Qwen/Qwen3-VL-30B-A3B-Instruct

-

Qwen/Qwen3-30B-A3B-Instruct-2507

Qwen/Qwen3-30B-A3B-Instruct-2507

-

Qwen/Qwen2.5-VL-7B-Instruct

Qwen/Qwen2.5-VL-7B-Instruct

-

Qwen/Qwen3-Coder-30B-A3B-Instruct

Qwen/Qwen3-Coder-30B-A3B-Instruct

-

Qwen/Qwen2.5-7B-Instruct

Qwen/Qwen2.5-7B-Instruct

-

Qwen/Qwen3-8B

Qwen/Qwen3-8B

-

google/gemma-3-27b-it

google/gemma-3-27b-it

-

meta-llama/Llama-3.3-70B-Instruct

meta-llama/Llama-3.3-70B-Instruct

-

meta-llama/Llama-3.2-3B-Instruct

meta-llama/Llama-3.2-3B-Instruct

-

Qwen/Qwen3-4B-Thinking-2507

Qwen/Qwen3-4B-Thinking-2507

-

Qwen/Qwen3-Next-80B-A3B-Instruct

Qwen/Qwen3-Next-80B-A3B-Instruct

-

meta-llama/Meta-Llama-3-8B-Instruct

meta-llama/Meta-Llama-3-8B-Instruct

-

zai-org/GLM-4.6-FP8

zai-org/GLM-4.6-FP8

-

Qwen/Qwen3-VL-235B-A22B-Instruct

Qwen/Qwen3-VL-235B-A22B-Instruct

-

moonshotai/Kimi-K2-Instruct-0905

moonshotai/Kimi-K2-Instruct-0905

-

moonshotai/Kimi-K2-Instruct

moonshotai/Kimi-K2-Instruct

-

allenai/Olmo-3-7B-Instruct

allenai/Olmo-3-7B-Instruct

-

HuggingFaceTB/SmolLM3-3B

HuggingFaceTB/SmolLM3-3B

-

deepseek-ai/DeepSeek-R1

deepseek-ai/DeepSeek-R1

-

Qwen/Qwen3-14B

Qwen/Qwen3-14B

-

google/gemma-2-2b-it

google/gemma-2-2b-it

-

swiss-ai/Apertus-8B-Instruct-2509

swiss-ai/Apertus-8B-Instruct-2509

-

Qwen/Qwen3-30B-A3B

Qwen/Qwen3-30B-A3B

-

zai-org/GLM-4.5-Air

zai-org/GLM-4.5-Air

-

Qwen/Qwen3-VL-235B-A22B-Thinking

Qwen/Qwen3-VL-235B-A22B-Thinking

-

deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B

deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B

-

Sao10K/L3-8B-Stheno-v3.2

Sao10K/L3-8B-Stheno-v3.2

-

Qwen/Qwen3-VL-32B-Instruct

Qwen/Qwen3-VL-32B-Instruct

-

Qwen/Qwen2.5-VL-72B-Instruct

Qwen/Qwen2.5-VL-72B-Instruct

-

zai-org/GLM-4.5V

zai-org/GLM-4.5V

-

deepseek-ai/DeepSeek-R1-Distill-Qwen-14B

deepseek-ai/DeepSeek-R1-Distill-Qwen-14B

-

deepseek-ai/DeepSeek-R1-0528-Qwen3-8B

deepseek-ai/DeepSeek-R1-0528-Qwen3-8B

-

nvidia/NVIDIA-Nemotron-Nano-12B-v2

nvidia/NVIDIA-Nemotron-Nano-12B-v2

-

Qwen/Qwen3-235B-A22B-Instruct-2507

Qwen/Qwen3-235B-A22B-Instruct-2507

-

Qwen/Qwen3-235B-A22B

Qwen/Qwen3-235B-A22B

-

deepseek-ai/DeepSeek-V3.1-Terminus

deepseek-ai/DeepSeek-V3.1-Terminus

-

Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8

Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8

-

openai/gpt-oss-safeguard-20b

openai/gpt-oss-safeguard-20b

-

Qwen/Qwen3-235B-A22B-Thinking-2507

Qwen/Qwen3-235B-A22B-Thinking-2507

-

deepseek-ai/DeepSeek-V3

deepseek-ai/DeepSeek-V3

-

Qwen/Qwen3-30B-A3B-Thinking-2507

Qwen/Qwen3-30B-A3B-Thinking-2507

-

Qwen/Qwen2.5-Coder-7B-Instruct

Qwen/Qwen2.5-Coder-7B-Instruct

-

Qwen/Qwen3-32B

Qwen/Qwen3-32B

-

Qwen/Qwen2.5-Coder-32B-Instruct

Qwen/Qwen2.5-Coder-32B-Instruct

-

Qwen/Qwen2.5-72B-Instruct

Qwen/Qwen2.5-72B-Instruct

-

Qwen/QwQ-32B

Qwen/QwQ-32B

-

allenai/Olmo-3-7B-Think

allenai/Olmo-3-7B-Think

-

zai-org/GLM-4.1V-9B-Thinking

zai-org/GLM-4.1V-9B-Thinking

-

deepseek-ai/DeepSeek-V3.1

deepseek-ai/DeepSeek-V3.1

-

Qwen/Qwen3-Next-80B-A3B-Thinking

Qwen/Qwen3-Next-80B-A3B-Thinking

-

deepseek-ai/DeepSeek-R1-Distill-Qwen-7B

deepseek-ai/DeepSeek-R1-Distill-Qwen-7B

-

deepseek-ai/DeepSeek-R1-Distill-Llama-70B

deepseek-ai/DeepSeek-R1-Distill-Llama-70B

-

Qwen/Qwen3-Coder-480B-A35B-Instruct

Qwen/Qwen3-Coder-480B-A35B-Instruct

-

deepseek-ai/DeepSeek-R1-Distill-Qwen-32B

deepseek-ai/DeepSeek-R1-Distill-Qwen-32B

-

google/gemma-2-9b-it

google/gemma-2-9b-it

-

katanemo/Arch-Router-1.5B

katanemo/Arch-Router-1.5B

-

Qwen/Qwen2.5-Coder-7B

Qwen/Qwen2.5-Coder-7B

-

NousResearch/Hermes-4-405B

NousResearch/Hermes-4-405B

-

zai-org/GLM-4.5

zai-org/GLM-4.5

-

swiss-ai/Apertus-70B-Instruct-2509

swiss-ai/Apertus-70B-Instruct-2509

-

baidu/ERNIE-4.5-VL-28B-A3B-PT

baidu/ERNIE-4.5-VL-28B-A3B-PT

-

nvidia/Llama-3_1-Nemotron-Ultra-253B-v1

nvidia/Llama-3_1-Nemotron-Ultra-253B-v1

-

deepseek-ai/DeepSeek-V3-0324

deepseek-ai/DeepSeek-V3-0324

-

NousResearch/Hermes-4-70B

NousResearch/Hermes-4-70B

-

CohereLabs/c4ai-command-a-03-2025

CohereLabs/c4ai-command-a-03-2025

-

alpindale/WizardLM-2-8x22B

alpindale/WizardLM-2-8x22B

-

CohereLabs/command-a-reasoning-08-2025

CohereLabs/command-a-reasoning-08-2025

-

Sao10K/L3-70B-Euryale-v2.1

Sao10K/L3-70B-Euryale-v2.1

-

deepseek-ai/DeepSeek-R1-Distill-Llama-8B

deepseek-ai/DeepSeek-R1-Distill-Llama-8B

-

deepseek-ai/DeepSeek-Prover-V2-671B

deepseek-ai/DeepSeek-Prover-V2-671B

-

deepcogito/cogito-671b-v2.1-FP8

deepcogito/cogito-671b-v2.1-FP8

-

baidu/ERNIE-4.5-0.3B-PT

baidu/ERNIE-4.5-0.3B-PT

-

baidu/ERNIE-4.5-21B-A3B-PT

baidu/ERNIE-4.5-21B-A3B-PT

-

baichuan-inc/Baichuan-M2-32B

baichuan-inc/Baichuan-M2-32B

-

deepseek-ai/DeepSeek-R1-0528

deepseek-ai/DeepSeek-R1-0528

-

aisingapore/Gemma-SEA-LION-v4-27B-IT

aisingapore/Gemma-SEA-LION-v4-27B-IT

-

meta-llama/Meta-Llama-3-70B-Instruct

meta-llama/Meta-Llama-3-70B-Instruct

-

NousResearch/Hermes-2-Pro-Llama-3-8B

NousResearch/Hermes-2-Pro-Llama-3-8B

-

deepcogito/cogito-671b-v2.1

deepcogito/cogito-671b-v2.1

-

aisingapore/Qwen-SEA-LION-v4-32B-IT

aisingapore/Qwen-SEA-LION-v4-32B-IT

-

CohereLabs/aya-vision-32b

CohereLabs/aya-vision-32b

-

Sao10K/L3-8B-Lunaris-v1

Sao10K/L3-8B-Lunaris-v1

-

Qwen/Qwen2.5-Coder-3B-Instruct

Qwen/Qwen2.5-Coder-3B-Instruct

-

dicta-il/DictaLM-3.0-24B-Thinking

dicta-il/DictaLM-3.0-24B-Thinking

-

CohereLabs/command-a-vision-07-2025

CohereLabs/command-a-vision-07-2025

-

zai-org/GLM-4-32B-0414

zai-org/GLM-4-32B-0414

-

baidu/ERNIE-4.5-VL-424B-A47B-Base-PT

baidu/ERNIE-4.5-VL-424B-A47B-Base-PT

-

CohereLabs/c4ai-command-r-08-2024

CohereLabs/c4ai-command-r-08-2024

-

PrimeIntellect/INTELLECT-3-FP8

PrimeIntellect/INTELLECT-3-FP8

-

MiniMaxAI/MiniMax-M1-80k

MiniMaxAI/MiniMax-M1-80k

-

Qwen/Qwen3-VL-30B-A3B-Thinking

Qwen/Qwen3-VL-30B-A3B-Thinking

-

Qwen/Qwen3-235B-A22B-FP8

Qwen/Qwen3-235B-A22B-FP8

-

CohereLabs/aya-expanse-32b

CohereLabs/aya-expanse-32b

-

baidu/ERNIE-4.5-300B-A47B-Base-PT

baidu/ERNIE-4.5-300B-A47B-Base-PT

-

marin-community/marin-8b-instruct

marin-community/marin-8b-instruct

-

CohereLabs/c4ai-command-r7b-12-2024

CohereLabs/c4ai-command-r7b-12-2024

-

tokyotech-llm/Llama-3.3-Swallow-70B-Instruct-v0.4

tokyotech-llm/Llama-3.3-Swallow-70B-Instruct-v0.4

-

zai-org/GLM-4.5-Air-FP8

zai-org/GLM-4.5-Air-FP8

-

CohereLabs/c4ai-command-r7b-arabic-02-2025

CohereLabs/c4ai-command-r7b-arabic-02-2025

-

Qwen/Qwen2.5-VL-32B-Instruct

Qwen/Qwen2.5-VL-32B-Instruct

-

deepcogito/cogito-v2-preview-llama-70B

deepcogito/cogito-v2-preview-llama-70B

-

zai-org/GLM-4.5V-FP8

zai-org/GLM-4.5V-FP8

-

CohereLabs/command-a-translate-08-2025

CohereLabs/command-a-translate-08-2025

-

deepcogito/cogito-v2-preview-llama-405B

deepcogito/cogito-v2-preview-llama-405B

-