dacorvo HF Staff committed on
Commit
28ae1e4
·
verified ·
1 Parent(s): b76c1a7

Update inference-cache-config/smollm3.json

Browse files
Files changed (1) hide show
  1. inference-cache-config/smollm3.json +3 -11
inference-cache-config/smollm3.json CHANGED
@@ -1,21 +1,13 @@
1
  {
2
- "HuggingFaceTB/SmolLM-360M-Instruct": [
3
- {
4
  "batch_size": 1,
5
  "sequence_length": 4096,
6
  "num_cores": 2,
7
  "auto_cast_type": "bf16"
8
  },
9
- {
10
- "batch_size": 4,
11
- "sequence_length": 4096,
12
- "num_cores": 2,
13
- "auto_cast_type": "bf16"
14
- }
15
- ],
16
- "HuggingFaceTB/SmolLM-3B-Instruct": [
17
  {
18
- "batch_size": 1,
19
  "sequence_length": 4096,
20
  "num_cores": 2,
21
  "auto_cast_type": "bf16"
 
1
  {
2
+ "HuggingFaceTB/SmolLM-3B-Instruct": [
3
+ {
4
  "batch_size": 1,
5
  "sequence_length": 4096,
6
  "num_cores": 2,
7
  "auto_cast_type": "bf16"
8
  },
 
 
 
 
 
 
 
 
9
  {
10
+ "batch_size": 4,
11
  "sequence_length": 4096,
12
  "num_cores": 2,
13
  "auto_cast_type": "bf16"