Spaces:
Running on Zero
v1
Browse files
- meteor/load_meteor.py (+2 -2)
meteor/load_meteor.py
CHANGED
@@ -17,7 +17,7 @@ def load_meteor(link, bits):
|
|
17 |
huggingface_config.update(dict(
|
18 |
torch_dtype=torch.float16,
|
19 |
low_cpu_mem_usage=True,
|
20 |
-
|
21 |
quantization_config=BitsAndBytesConfig(
|
22 |
load_in_4bit=bits == 4,
|
23 |
load_in_8bit=bits == 8,
|
@@ -33,7 +33,7 @@ def load_meteor(link, bits):
|
|
33 |
huggingface_config.update(dict(
|
34 |
torch_dtype=torch.float16,
|
35 |
low_cpu_mem_usage=True,
|
36 |
-
|
37 |
))
|
38 |
|
39 |
# loading backbone model
|
|
|
17 |
huggingface_config.update(dict(
|
18 |
torch_dtype=torch.float16,
|
19 |
low_cpu_mem_usage=True,
|
20 |
+
attn_implementation="flash_attention_2",
|
21 |
quantization_config=BitsAndBytesConfig(
|
22 |
load_in_4bit=bits == 4,
|
23 |
load_in_8bit=bits == 8,
|
|
|
33 |
huggingface_config.update(dict(
|
34 |
torch_dtype=torch.float16,
|
35 |
low_cpu_mem_usage=True,
|
36 |
+
attn_implementation="flash_attention_2",
|
37 |
))
|
38 |
|
39 |
# loading backbone model
|