dacorvo HF Staff committed on
Commit
05a6e8d
·
verified ·
1 Parent(s): 1f93295

Create llama4.json

Browse files
Files changed (1) hide show
  1. inference-cache-config/llama4.json +18 -0
inference-cache-config/llama4.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "meta-llama/Llama-4-Scout-17B-16E-Instruct": [
3
+ {
4
+ "task": "text-generation",
5
+ "batch_size": 1,
6
+ "sequence_length": 4096,
7
+ "num_cores": 16,
8
+ "auto_cast_type": "bf16"
9
+ },
10
+ {
11
+ "task": "text-generation",
12
+ "batch_size": 4,
13
+ "sequence_length": 4096,
14
+ "num_cores": 16,
15
+ "auto_cast_type": "bf16"
16
+ }
17
+ ]
18
+ }