dacorvo HF staff committed on
Commit
545cd4d
1 Parent(s): ee458f5

Add more batch_size values for mistral on smaller instances

Browse files
Files changed (1) hide show
  1. inference-cache-config/mistral.json +12 -0
inference-cache-config/mistral.json CHANGED
@@ -6,6 +6,18 @@
6
  "num_cores": 2,
7
  "auto_cast_type": "fp16"
8
  },
 
 
 
 
 
 
 
 
 
 
 
 
9
  {
10
  "batch_size": 1,
11
  "sequence_length": 4096,
 
6
  "num_cores": 2,
7
  "auto_cast_type": "fp16"
8
  },
9
+ {
10
+ "batch_size": 4,
11
+ "sequence_length": 4096,
12
+ "num_cores": 4,
13
+ "auto_cast_type": "fp16"
14
+ },
15
+ {
16
+ "batch_size": 8,
17
+ "sequence_length": 4096,
18
+ "num_cores": 2,
19
+ "auto_cast_type": "fp16"
20
+ },
21
  {
22
  "batch_size": 1,
23
  "sequence_length": 4096,