dacorvo HF Staff committed on
Commit
5e828c9
·
verified ·
1 Parent(s): 2fdfa36

Update inference-cache-config/qwen3-moe.json

Browse files
inference-cache-config/qwen3-moe.json CHANGED
@@ -9,13 +9,13 @@
9
  {
10
  "batch_size": 4,
11
  "sequence_length": 4096,
12
- "num_cores": 2,
13
  "auto_cast_type": "bf16"
14
  },
15
  {
16
  "batch_size": 8,
17
  "sequence_length": 4096,
18
- "num_cores": 2,
19
  "auto_cast_type": "bf16"
20
  }
21
  ]
 
9
  {
10
  "batch_size": 4,
11
  "sequence_length": 4096,
12
+ "num_cores": 8,
13
  "auto_cast_type": "bf16"
14
  },
15
  {
16
  "batch_size": 8,
17
  "sequence_length": 4096,
18
+ "num_cores": 8,
19
  "auto_cast_type": "bf16"
20
  }
21
  ]