dacorvo HF staff committed on
Commit
f93cadb
1 Parent(s): f06a55a

Create llama3.json

Browse files
Files changed (1) hide show
  1. inference-cache-config/llama3.json +18 -0
inference-cache-config/llama3.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "meta-llama/Meta-Llama-3-8B": [
3
+ {
4
+ "batch_size": 1,
5
+ "sequence_length": 4096,
6
+ "num_cores": 8,
7
+ "auto_cast_type": "fp16"
8
+ }
9
+ ],
10
+ "meta-llama/Meta-Llama-3-70B": [
11
+ {
12
+ "batch_size": 1,
13
+ "sequence_length": 4096,
14
+ "num_cores": 24,
15
+ "auto_cast_type": "bf16"
16
+ }
17
+ ]
18
+ }