Tom Aarsen committed
Commit • abf58d4
Parent(s): 9a53e83
Add dwzhu/e5-base-4k as a pytorch_model.bin model with fp16
Files changed: utils/model_size.py (+6 -3)
utils/model_size.py CHANGED
@@ -5,8 +5,9 @@ from huggingface_hub import hf_hub_download
 
 # Map model IDs to the number of bytes used for one parameter. So, 4 bytes for fp32, 2 bytes for fp16, etc.
 # By default, we assume that the model is stored in fp32.
-KNOWN_BYTES_PER_PARAM = {
-}
+KNOWN_BYTES_PER_PARAM = {
+    "dwzhu/e5-base-4k": 2,
+}
 
 def get_model_parameters_memory(model_info: ModelInfo):
     '''Get the size of the model in million of parameters.'''
@@ -22,7 +23,9 @@ def get_model_parameters_memory(model_info: ModelInfo):
         url = hf_hub_url(model_info.id, filename="pytorch_model.bin")
         meta = get_hf_file_metadata(url)
         bytes_per_param = KNOWN_BYTES_PER_PARAM.get(model_info.id, 4)
-
+        num_params = round(meta.size / bytes_per_param / 1e6)
+        size_gb = round(meta.size * (4 / bytes_per_param) / 1024**3, 2)
+        return num_params, size_gb
 
     if "pytorch_model.bin.index.json" in filenames:
         index_path = hf_hub_download(model_info.id, filename="pytorch_model.bin.index.json")
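
For context, the added lines estimate a model's parameter count and its fp32-equivalent size directly from the on-disk size of pytorch_model.bin: the file size is divided by the assumed bytes per parameter (2 for the fp16 checkpoint of dwzhu/e5-base-4k, 4 otherwise), and the reported size is rescaled to what the weights would occupy in fp32 so fp16 and fp32 models stay comparable. Below is a minimal standalone sketch of the same arithmetic; the helper name estimate_size is hypothetical and the numbers in the comments are illustrative, not taken from the Space's code.

from huggingface_hub import get_hf_file_metadata, hf_hub_url

# Assumed bytes per parameter for known non-fp32 checkpoints (mirrors the entry added in this commit).
KNOWN_BYTES_PER_PARAM = {
    "dwzhu/e5-base-4k": 2,  # stored in fp16 -> 2 bytes per parameter
}

def estimate_size(model_id: str):
    # Hypothetical helper replicating the arithmetic of the added lines.
    url = hf_hub_url(model_id, filename="pytorch_model.bin")
    meta = get_hf_file_metadata(url)  # meta.size is the checkpoint size in bytes
    bytes_per_param = KNOWN_BYTES_PER_PARAM.get(model_id, 4)  # default: fp32
    num_params = round(meta.size / bytes_per_param / 1e6)  # millions of parameters
    # Rescale to fp32-equivalent gigabytes so fp16 and fp32 checkpoints are comparable.
    size_gb = round(meta.size * (4 / bytes_per_param) / 1024**3, 2)
    return num_params, size_gb

As an illustrative example, a 224 MB fp16 checkpoint works out to roughly 112 million parameters and about 0.42 GB in fp32 terms (224e6 / 2 / 1e6 = 112; 224e6 * 2 / 1024**3 ≈ 0.42).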