Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
alozowski
committed on
Commit
·
24c603a
1
Parent(s):
37e5956
Set unknown model size to -1 and improve logging
Browse files
src/submission/check_validity.py
CHANGED
@@ -1,6 +1,7 @@
|
|
1 |
import json
|
2 |
import os
|
3 |
import re
|
|
|
4 |
from collections import defaultdict
|
5 |
from datetime import datetime, timedelta, timezone
|
6 |
|
@@ -75,28 +76,33 @@ def is_model_on_hub(
|
|
75 |
return False, f"was not found or misconfigured on the hub! Error raised was {e.args[0]}", None
|
76 |
|
77 |
|
78 |
-
def get_model_size(model_info: ModelInfo, precision: str):
|
79 |
size_pattern = re.compile(r"(\d+\.)?\d+(b|m)")
|
80 |
safetensors = None
|
|
|
81 |
try:
|
82 |
safetensors = get_safetensors_metadata(model_info.id)
|
83 |
except Exception as e:
|
84 |
-
|
85 |
|
86 |
if safetensors is not None:
|
87 |
model_size = round(sum(safetensors.parameter_count.values()) / 1e9, 3)
|
88 |
else:
|
89 |
try:
|
90 |
size_match = re.search(size_pattern, model_info.id.lower())
|
91 |
-
|
92 |
-
|
|
|
|
|
|
|
93 |
except AttributeError:
|
94 |
-
|
|
|
95 |
|
96 |
size_factor = 8 if (precision == "GPTQ" or "gptq" in model_info.id.lower()) else 1
|
97 |
model_size = size_factor * model_size
|
98 |
-
return model_size
|
99 |
|
|
|
100 |
|
101 |
def get_model_arch(model_info: ModelInfo):
    """Return the ``"architectures"`` entry of the model's config.

    Falls back to the string ``"Unknown"`` when the config has no
    ``"architectures"`` key.
    """
    config = model_info.config
    return config.get("architectures", "Unknown")
|
|
|
1 |
import json
|
2 |
import os
|
3 |
import re
|
4 |
+
import logging
|
5 |
from collections import defaultdict
|
6 |
from datetime import datetime, timedelta, timezone
|
7 |
|
|
|
76 |
return False, f"was not found or misconfigured on the hub! Error raised was {e.args[0]}", None
|
77 |
|
78 |
|
79 |
+
def get_model_size(model_info: ModelInfo, precision: str) -> float:
    """Estimate a model's size in billions of parameters.

    The parameter count is taken from the model's safetensors metadata when
    it can be fetched. Otherwise the size is parsed from the first token in
    the lower-cased model ID that looks like ``7b``, ``1.5b`` or ``350m``
    (``m`` values are converted to billions).

    Args:
        model_info: Hub model description; only ``model_info.id`` is read here.
        precision: Precision label of the submission. ``"GPTQ"`` (or ``gptq``
            appearing in the model ID) multiplies the computed size by 8.

    Returns:
        The size in billions of parameters, or ``-1`` when neither the
        safetensors metadata nor the model ID yields a size.
    """
    size_pattern = re.compile(r"(\d+\.)?\d+(b|m)")
    safetensors = None

    # Best effort: any failure here just means we fall back to parsing the ID.
    try:
        safetensors = get_safetensors_metadata(model_info.id)
    except Exception as e:
        logging.error(f"Failed to get safetensors metadata for model {model_info.id}: {str(e)}")

    if safetensors is not None:
        model_size = round(sum(safetensors.parameter_count.values()) / 1e9, 3)
    else:
        # Keep the try body limited to the one call that can raise
        # AttributeError (a non-string ID has no ``.lower()``).
        try:
            size_match = re.search(size_pattern, model_info.id.lower())
        except AttributeError:
            size_match = None

        if size_match is None:
            # Log every unparsable ID, not only the AttributeError case, so an
            # unknown size is always traceable in the logs.
            logging.warning(f"Unable to parse model size from ID: {model_info.id}")
            return -1  # Unknown model size

        size_token = size_match.group(0)
        size_value = float(size_token[:-1])
        # A trailing "m" means millions; convert to billions.
        model_size = round(size_value if size_token[-1] == "b" else size_value / 1e3, 3)

    # NOTE(review): the x8 factor presumably compensates for packed GPTQ
    # weights being counted as fewer parameters; confirm against callers.
    size_factor = 8 if (precision == "GPTQ" or "gptq" in model_info.id.lower()) else 1
    model_size = size_factor * model_size

    return model_size
|
106 |
|
107 |
def get_model_arch(model_info: ModelInfo):
    """Return the ``"architectures"`` entry of the model's config.

    Falls back to the string ``"Unknown"`` when the config has no
    ``"architectures"`` key.
    """
    config = model_info.config
    return config.get("architectures", "Unknown")
|