Extend Any Model to Unlimited Context
Supports all open-weight models, plus your own custom or self-trained GGUF models. To run a model: ./alphallama -m <model>.gguf --port 18080
175 models
Params
685B
Context
160K
Run
./alphallama -m deepseek-chat-v3-0324.gguf
Params
671B
Context
160K
Run
./alphallama -m deepseek-chat-v3.1.gguf
Params
671B
Context
160K
Run
./alphallama -m deepseek-r1-0528.gguf
Params
671B
Context
160K
Run
./alphallama -m deepseek-r1.gguf
Params
480B (35B active)
Context
977K
Run
./alphallama -m qwen3-coder-plus.gguf
Params
480B (35B active)
Context
1024K
Run
./alphallama -m qwen3-coder.gguf
Params
424B (47B active)
Context
128K
Run
./alphallama -m ernie-4.5-vl-424b-a47b.gguf
Params
405B
Context
128K
Run
./alphallama -m hermes-4-405b.gguf
Params
405B
Context
128K
Run
./alphallama -m hermes-3-llama-3.1-405b.gguf
Params
397B (17B active)
Context
256K
Run
./alphallama -m qwen3.5-397b-a17b.gguf
Params
397B (17B active)
Context
—
Run
./alphallama -m qwen3.5.gguf
Params
309B
Context
256K
Run
./alphallama -m mimo-v2-flash.gguf
Params
284B (13B active)
Context
1024K
Run
./alphallama -m deepseek-v4-flash.gguf
Params
235B (22B active)
Context
128K
Run
./alphallama -m qwen3-vl-235b-a22b-thinking.gguf
Params
235B (22B active)
Context
256K
Run
./alphallama -m qwen3-vl-235b-a22b-instruct.gguf
Params
235B (22B active)
Context
256K
Run
./alphallama -m qwen3-235b-a22b-thinking-2507.gguf
Params
235B (22B active)
Context
256K
Run
./alphallama -m qwen3-235b-a22b-2507.gguf
Params
235B (22B active)
Context
128K
Run
./alphallama -m qwen3-235b-a22b.gguf
Params
128B
Context
256K
Run
./alphallama -m mistral-medium-3-5.gguf
Params
123B
Context
256K
Run
./alphallama -m devstral-2512.gguf
Params
122B (10B active)
Context
256K
Run
./alphallama -m qwen3.5-122b-a10b.gguf
Params
122B (10B active)
Context
—
Run
./alphallama -m qwen3.5.gguf
Params
120B (12B active)
Context
977K
Run
./alphallama -m nemotron-3-super-120b-a12b.gguf
Params
106B
Context
128K
Run
./alphallama -m intellect-3.gguf
Params
106B
Context
64K
Run
./alphallama -m glm-4.5v.gguf
Params
104B
Context
256K
Run
./alphallama -m ling-2.6-flash.gguf
Params
102B
Context
125K
Run
./alphallama -m solar-pro-3.gguf
Params
80B
Context
256K
Run
./alphallama -m qwen3-coder-next.gguf
Params
80B (3B active)
Context
256K
Run
./alphallama -m qwen3-next-80b-a3b-thinking.gguf
Params
80B (3B active)
Context
256K
Run
./alphallama -m qwen3-next-80b-a3b-instruct.gguf
Params
72B
Context
977K
Run
./alphallama -m qwen3.6-plus.gguf
Params
72B
Context
128K
Run
./alphallama -m virtuoso-large.gguf
Params
72B
Context
128K
Run
./alphallama -m qwen2.5-vl-72b-instruct.gguf
Params
72B
Context
32K
Run
./alphallama -m magnum-v4-72b.gguf
Params
72B
Context
128K
Run
./alphallama -m qwen-2.5-72b-instruct.gguf
Params
70B
Context
128K
Run
./alphallama -m hermes-4-70b.gguf
Params
70B
Context
125K
Run
./alphallama -m deepseek-r1-distill-llama-70b.gguf
Params
70B
Context
16K
Run
./alphallama -m l3.1-70b-hanami-x1.gguf
Params
70B
Context
128K
Run
./alphallama -m l3.3-euryale-70b.gguf
Params
70B
Context
128K
Run
./alphallama -m llama-3.3-70b-instruct.gguf
Params
70B
Context
128K
Run
./alphallama -m l3.1-euryale-70b.gguf
Params
70B
Context
128K
Run
./alphallama -m hermes-3-llama-3.1-70b.gguf
Params
70B
Context
128K
Run
./alphallama -m llama-3.1-70b-instruct.gguf
Params
70B
Context
8K
Run
./alphallama -m llama-3-70b-instruct.gguf
Params
63B
Context
256K
Run
./alphallama -m ring-2.6-1t.gguf
Params
550B (55B active)
Context
977K
Run
./alphallama -m nemotron-3-ultra-550b-a55b.gguf
Params
49B
Context
1024K
Run
./alphallama -m deepseek-v4-pro.gguf
Params
49B
Context
128K
Run
./alphallama -m llama-3.3-nemotron-super-49b-v1.5.gguf
Params
41B
Context
256K
Run
./alphallama -m mistral-large-2512.gguf
Params
36B
Context
32K
Run
./alphallama -m skyfall-36b-v2.gguf
Params
35B (3B active)
Context
256K
Run
./alphallama -m qwen3.6-35b-a3b.gguf
Params
35B (3B active)
Context
256K
Run
./alphallama -m qwen3.5-35b-a3b.gguf
Params
35B (3B active)
Context
—
Run
./alphallama -m qwen3.5.gguf
Params
32B
Context
977K
Run
./alphallama -m qwen3.6-flash.gguf
Params
32B
Context
64K
Run
./alphallama -m olmo-3-32b-think.gguf
Params
32B
Context
256K
Run
./alphallama -m qwen3-vl-32b-instruct.gguf
Params
32B
Context
32K
Run
./alphallama -m coder-large.gguf
Params
32B
Context
128K
Run
./alphallama -m qwen3-32b.gguf
Params
32B
Context
128K
Run
./alphallama -m aion-1.0-mini.gguf
Params
32B
Context
125K
Run
./alphallama -m deepseek-r1-distill-qwen-32b.gguf
Params
32B
Context
125K
Run
./alphallama -m qwen-2.5-coder-32b-instruct.gguf
Params
32B
Context
—
Run
./alphallama -m qwen3.5.gguf
Params
31B
Context
256K
Run
./alphallama -m gemma-4-31b-it.gguf
Params
30B
Context
198K
Run
./alphallama -m glm-4.7-flash.gguf
Params
30B (3B active)
Context
256K
Run
./alphallama -m nemotron-3-nano-30b-a3b.gguf
Params
30B (3B active)
Context
128K
Run
./alphallama -m qwen3-vl-30b-a3b-thinking.gguf
Params
30B (3B active)
Context
256K
Run
./alphallama -m qwen3-vl-30b-a3b-instruct.gguf
Params
30B (3B active)
Context
128K
Run
./alphallama -m qwen3-30b-a3b-thinking-2507.gguf
Params
30B (3B active)
Context
156K
Run
./alphallama -m qwen3-coder-30b-a3b-instruct.gguf
Params
30B (3B active)
Context
128K
Run
./alphallama -m qwen3-30b-a3b-instruct-2507.gguf
Params
30B (3B active)
Context
128K
Run
./alphallama -m qwen3-30b-a3b.gguf
Params
27B
Context
256K
Run
./alphallama -m qwen3.6-27b.gguf
Params
27B
Context
256K
Run
./alphallama -m qwen3.5-27b.gguf
Params
27B
Context
128K
Run
./alphallama -m gemma-3-27b-it.gguf
Params
27B
Context
8K
Run
./alphallama -m gemma-2-27b-it.gguf
Params
27B
Context
—
Run
./alphallama -m qwen3.5.gguf
Params
26B (4B active)
Context
256K
Run
./alphallama -m gemma-4-26b-a4b-it.gguf
Params
26B
Context
128K
Run
./alphallama -m trinity-mini.gguf
Params
24B (2B active)
Context
125K
Run
./alphallama -m lfm-2-24b-a2b.gguf
Params
24B
Context
31K
Run
./alphallama -m voxtral-small-24b-2507.gguf
Params
24B
Context
128K
Run
./alphallama -m cydonia-24b-v4.1.gguf
Params
24B
Context
125K
Run
./alphallama -m mistral-small-3.2-24b-instruct.gguf
Params
24B
Context
125K
Run
./alphallama -m mistral-small-3.1-24b-instruct.gguf
Params
24B
Context
32K
Run
./alphallama -m mistral-saba.gguf
Params
24B
Context
32K
Run
./alphallama -m mistral-small-24b-instruct-2501.gguf
Params
22B
Context
64K
Run
./alphallama -m mixtral-8x22b-instruct.gguf
Params
22B
Context
64K
Run
./alphallama -m wizardlm-2-8x22b.gguf
Params
17B
Context
1024K
Run
./alphallama -m llama-4-maverick.gguf
Params
17B
Context
9766K
Run
./alphallama -m llama-4-scout.gguf
Params
14B
Context
256K
Run
./alphallama -m ministral-14b-2512.gguf
Params
14B
Context
129K
Run
./alphallama -m qwen3-14b.gguf
Params
13B
Context
128K
Run
./alphallama -m hunyuan-a13b-instruct.gguf
Params
13B
Context
6K
Run
./alphallama -m remm-slerp-l2-13b.gguf
Params
13B
Context
4K
Run
./alphallama -m mythomax-l2-13b.gguf
Params
12B
Context
160K
Run
./alphallama -m llama-guard-4-12b.gguf
Params
12B
Context
128K
Run
./alphallama -m gemma-3-12b-it.gguf
Params
12B
Context
32K
Run
./alphallama -m unslopnemo-12b.gguf
Params
12B
Context
32K
Run
./alphallama -m rocinante-12b.gguf
Params
12B
Context
128K
Run
./alphallama -m mistral-nemo.gguf
Params
11B
Context
128K
Run
./alphallama -m llama-3.2-11b-vision-instruct.gguf
Params
9B
Context
256K
Run
./alphallama -m qwen3.5-9b.gguf
Params
9B
Context
—
Run
./alphallama -m qwen3.5.gguf
Params
8B
Context
128K
Run
./alphallama -m granite-4.1-8b.gguf
Params
8B
Context
32K
Run
./alphallama -m rnj-1-instruct.gguf
Params
8B
Context
256K
Run
./alphallama -m ministral-8b-2512.gguf
Params
8B
Context
250K
Run
./alphallama -m qwen3-vl-8b-thinking.gguf
Params
8B
Context
250K
Run
./alphallama -m qwen3-vl-8b-instruct.gguf
Params
8B
Context
128K
Run
./alphallama -m qwen3-8b.gguf
Params
8B
Context
32K
Run
./alphallama -m aion-rp-llama-3.1-8b.gguf
Params
8B
Context
8K
Run
./alphallama -m l3-lunaris-8b.gguf
Params
8B
Context
128K
Run
./alphallama -m llama-3.1-8b-instruct.gguf
Params
8B
Context
8K
Run
./alphallama -m llama-3-8b-instruct.gguf
Params
7B
Context
16K
Run
./alphallama -m reka-edge.gguf
Params
7B
Context
128K
Run
./alphallama -m qwen-2.5-7b-instruct.gguf
Params
4B
Context
32K
Run
./alphallama -m gemma-3n-e4b-it.gguf
Params
4B
Context
128K
Run
./alphallama -m gemma-3-4b-it.gguf
Params
4B
Context
—
Run
./alphallama -m qwen3.5.gguf
Params
3B
Context
128K
Run
./alphallama -m ministral-3b-2512.gguf
Params
3B
Context
128K
Run
./alphallama -m granite-4.0-h-micro.gguf
Params
3B
Context
128K
Run
./alphallama -m llama-3.2-3b-instruct.gguf
Params
2B
Context
—
Run
./alphallama -m qwen3.5.gguf
Params
1B
Context
128K
Run
./alphallama -m llama-3.2-1b-instruct.gguf
Params
1B
Context
—
Run
./alphallama -m qwen3.5.gguf
Params
—
Context
977K
Run
./alphallama -m qwen3.7-plus.gguf
Params
—
Context
977K
Run
./alphallama -m qwen3.7-max.gguf
Params
—
Context
32K
Run
./alphallama -m perceptron-mk1.gguf
Params
—
Context
977K
Run
./alphallama -m qwen3.5-plus-20260420.gguf
Params
—
Context
256K
Run
./alphallama -m qwen3.6-max-preview.gguf
Params
—
Context
256K
Run
./alphallama -m ling-2.6-1t.gguf
Params
—
Context
256K
Run
./alphallama -m hy3-preview.gguf
Params
—
Context
1024K
Run
./alphallama -m mimo-v2.5-pro.gguf
Params
—
Context
1024K
Run
./alphallama -m mimo-v2.5.gguf
Params
—
Context
198K
Run
./alphallama -m glm-5.1.gguf
Params
—
Context
256K
Run
./alphallama -m trinity-large-thinking.gguf
Params
—
Context
250K
Run
./alphallama -m kat-coder-pro-v2.gguf
Params
—
Context
256K
Run
./alphallama -m mistral-small-2603.gguf
Params
—
Context
256K
Run
./alphallama -m glm-5-turbo.gguf
Params
—
Context
256K
Run
./alphallama -m seed-2.0-lite.gguf
Params
—
Context
125K
Run
./alphallama -m mercury-2.gguf
Params
—
Context
256K
Run
./alphallama -m seed-2.0-mini.gguf
Params
—
Context
977K
Run
./alphallama -m qwen3.5-flash-02-23.gguf
Params
—
Context
128K
Run
./alphallama -m aion-2.0.gguf
Params
—
Context
977K
Run
./alphallama -m qwen3.5-plus-02-15.gguf
Params
—
Context
198K
Run
./alphallama -m glm-5.gguf
Params
—
Context
256K
Run
./alphallama -m qwen3-max-thinking.gguf
Params
—
Context
1016K
Run
./alphallama -m palmyra-x5.gguf
Params
—
Context
256K
Run
./alphallama -m seed-1.6-flash.gguf
Params
—
Context
256K
Run
./alphallama -m seed-1.6.gguf
Params
—
Context
198K
Run
./alphallama -m glm-4.7.gguf
Params
—
Context
250K
Run
./alphallama -m relace-search.gguf
Params
—
Context
128K
Run
./alphallama -m glm-4.6v.gguf
Params
—
Context
128K
Run
./alphallama -m deepseek-v3.2.gguf
Params
—
Context
128K
Run
./alphallama -m phi-4-mini-instruct.gguf
Params
—
Context
198K
Run
./alphallama -m glm-4.6.gguf
Params
—
Context
160K
Run
./alphallama -m deepseek-v3.2-exp.gguf
Params
—
Context
250K
Run
./alphallama -m relace-apply-3.gguf
Params
—
Context
256K
Run
./alphallama -m qwen3-max.gguf
Params
—
Context
160K
Run
./alphallama -m deepseek-v3.1-terminus.gguf
Params
—
Context
977K
Run
./alphallama -m qwen3-coder-flash.gguf
Params
—
Context
977K
Run
./alphallama -m qwen-plus-2025-07-28.gguf
Params
—
Context
977K
Run
./alphallama -m qwen-plus-2025-07-28.gguf
Params
—
Context
128K
Run
./alphallama -m mistral-medium-3.1.gguf
Params
—
Context
250K
Run
./alphallama -m codestral-2508.gguf
Params
—
Context
128K
Run
./alphallama -m glm-4.5.gguf
Params
—
Context
128K
Run
./alphallama -m glm-4.5-air.gguf
Params
—
Context
128K
Run
./alphallama -m router.gguf
Params
—
Context
256K
Run
./alphallama -m morph-v3-large.gguf
Params
—
Context
80K
Run
./alphallama -m morph-v3-fast.gguf
Params
—
Context
128K
Run
./alphallama -m mistral-medium-3.gguf
Params
—
Context
64K
Run
./alphallama -m reka-flash-3.gguf
Params
—
Context
128K
Run
./alphallama -m aion-1.0.gguf
Params
—
Context
977K
Run
./alphallama -m qwen-plus.gguf
Params
—
Context
16K
Run
./alphallama -m phi-4.gguf
Params
—
Context
128K
Run
./alphallama -m deepseek-chat.gguf
Params
—
Context
8K
Run
./alphallama -m weaver.gguf
AlphaLlama downloads and optimizes models automatically.