dacorvo HF Staff committed on
Commit
3551ea0
·
verified ·
1 Parent(s): 26418d4

Delete inference-cache-config/mistral-variants.json

Browse files
inference-cache-config/mistral-variants.json DELETED
@@ -1,54 +0,0 @@
1
- {
2
- "HuggingFaceH4/zephyr-7b-beta": [
3
- {
4
- "batch_size": 1,
5
- "sequence_length": 4096,
6
- "num_cores": 2,
7
- "auto_cast_type": "bf16"
8
- },
9
- {
10
- "batch_size": 1,
11
- "sequence_length": 4096,
12
- "num_cores": 8,
13
- "auto_cast_type": "bf16"
14
- },
15
- {
16
- "batch_size": 4,
17
- "sequence_length": 4096,
18
- "num_cores": 2,
19
- "auto_cast_type": "bf16"
20
- },
21
- {
22
- "batch_size": 4,
23
- "sequence_length": 4096,
24
- "num_cores": 8,
25
- "auto_cast_type": "bf16"
26
- },
27
- {
28
- "batch_size": 8,
29
- "sequence_length": 4096,
30
- "num_cores": 8,
31
- "auto_cast_type": "bf16"
32
- },
33
- {
34
- "batch_size": 16,
35
- "sequence_length": 4096,
36
- "num_cores": 8,
37
- "auto_cast_type": "bf16"
38
- }
39
- ],
40
- "Intel/neural-chat-7b-v3-3": [
41
- {
42
- "batch_size": 1,
43
- "sequence_length": 4096,
44
- "num_cores": 2,
45
- "auto_cast_type": "fp16"
46
- },
47
- {
48
- "batch_size": 4,
49
- "sequence_length": 4096,
50
- "num_cores": 2,
51
- "auto_cast_type": "bf16"
52
- }
53
- ]
54
- }