Spaces:
Runtime error
Runtime error
add qwen3 32b awq
Browse files
app.py
CHANGED
|
@@ -39,6 +39,12 @@ MODELS = {
|
|
| 39 |
# ~235B total parameters (MoE: 22B activated) — included for reference if added later
|
| 40 |
# "Qwen3-235B-A22B-Thinking": { ... },
|
| 41 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 42 |
# 14.8B total parameters
|
| 43 |
"Qwen3-14B": {
|
| 44 |
"repo_id": "Qwen/Qwen3-14B",
|
|
|
|
| 39 |
# ~235B total parameters (MoE: 22B activated) — included for reference if added later
|
| 40 |
# "Qwen3-235B-A22B-Thinking": { ... },
|
| 41 |
|
| 42 |
+
# 32.8B total parameters
|
| 43 |
+
"Qwen3-32B-AWQ": {
|
| 44 |
+
"repo_id": "Qwen/Qwen3-32B-AWQ",
|
| 45 |
+
"description": "4-bit AWQ quantized dense causal language model with 32.8B total parameters (31.2B non-embedding), 64 layers, 64 query heads & 8 KV heads, native 32,768-token context (extendable to 131,072 via YaRN). Features seamless switching between thinking mode (for complex reasoning, math, coding) and non-thinking mode (for efficient dialogue), strong multilingual support (100+ languages), and leading open-source agent capabilities."
|
| 46 |
+
},
|
| 47 |
+
|
| 48 |
# 14.8B total parameters
|
| 49 |
"Qwen3-14B": {
|
| 50 |
"repo_id": "Qwen/Qwen3-14B",
|