Spaces:

Dovakiins
/

qwerrwe

Build error

Nanobit committed on May 7, 2024

Commit

8b9c15b

unverified ·

1 Parent(s): 9e1480e

feat: exclude mamba blocks for jamba (#1578)

Files changed (1) hide show

src/axolotl/utils/models.py CHANGED Viewed

@@ -1,4 +1,5 @@
 """Module for models and model loading"""
 # pylint: disable=too-many-lines
 import logging
@@ -504,6 +505,9 @@ def load_model(
         bnb_config = {
             "load_in_8bit": True,
         }
         model_kwargs["quantization_config"] = BitsAndBytesConfig(
             **bnb_config,
         )

 """Module for models and model loading"""
 # pylint: disable=too-many-lines
 import logging
         bnb_config = {
             "load_in_8bit": True,
         }
+        # Exclude mamba blocks from int8 quantization for jamba
+        if cfg.model_config_type == "jamba":
+            bnb_config["llm_int8_skip_modules"] = ["mamba"]
         model_kwargs["quantization_config"] = BitsAndBytesConfig(
             **bnb_config,
         )