Luigi committed on
Commit
b9efb74
·
verified ·
1 Parent(s): 5e03586

add qwen3 32b awq

Browse files
Files changed (1) hide show
  1. app.py +6 -0
app.py CHANGED
@@ -39,6 +39,12 @@ MODELS = {
39
  # ~235B total parameters (MoE: 22B activated) — included for reference if added later
40
  # "Qwen3-235B-A22B-Thinking": { ... },
41
 
 
 
 
 
 
 
42
  # 14.8B total parameters
43
  "Qwen3-14B": {
44
  "repo_id": "Qwen/Qwen3-14B",
 
39
  # ~235B total parameters (MoE: 22B activated) — included for reference if added later
40
  # "Qwen3-235B-A22B-Thinking": { ... },
41
 
42
+ # 32.8B total parameters
43
+ "Qwen3-32B-AWQ": {
44
+ "repo_id": "Qwen/Qwen3-32B-AWQ",
45
+ "description": "4-bit AWQ quantized dense causal language model with 32.8B total parameters (31.2B non-embedding), 64 layers, 64 query heads & 8 KV heads, native 32,768-token context (extendable to 131,072 via YaRN). Features seamless switching between thinking mode (for complex reasoning, math, coding) and non-thinking mode (for efficient dialogue), strong multilingual support (100+ languages), and leading open-source agent capabilities."
46
+ },
47
+
48
  # 14.8B total parameters
49
  "Qwen3-14B": {
50
  "repo_id": "Qwen/Qwen3-14B",