Spaces:

Tonic
/

Native_1-bit_LLM

Running

App Files Files Community

AI-B committed on Apr 17

Commit

667f1e5

verified ·

1 Parent(s): 5760858

🔧🚀 Updated app.py: BitNet Model Repo Swap

Browse files

Swap out the dead “microsoft/bitnet-b1.58-2B-4T” identifier for the live “1bitLLM/bitnet_b1_58-large” repo, which actually carries the needed configuration_bitnet.py (and its tokenizer/model code).

Files changed (1) hide show

app.py +3 -8

app.py CHANGED Viewed

@@ -1,6 +1,6 @@
 import gradio as gr
 import torch
-from transformers import AutoModelForCausalLM, AutoTokenizer, AutoConfig
 # Singleton for model and tokenizer
 _model = None
@@ -9,18 +9,13 @@ _tokenizer = None
 def load_model():
     global _model, _tokenizer
     if _model is None or _tokenizer is None:
-        model_id = "microsoft/bitnet-b1.58-2B-4T"
         _tokenizer = AutoTokenizer.from_pretrained(
             model_id,
             trust_remote_code=True
         )
-        config = AutoConfig.from_pretrained(
-            model_id,
-            trust_remote_code=True
-        )
         _model = AutoModelForCausalLM.from_pretrained(
             model_id,
-            config=config,
             torch_dtype=torch.bfloat16,
             trust_remote_code=True
         )
@@ -157,4 +152,4 @@ with gr.Blocks(theme=gr.themes.Soft()) as demo:
 if __name__ == "__main__":
     # Preload model to avoid threading issues
     load_model()
-    demo.launch(ssr_mode=False, share=True)

 import gradio as gr
 import torch
+from transformers import AutoModelForCausalLM, AutoTokenizer
 # Singleton for model and tokenizer
 _model = None
 def load_model():
     global _model, _tokenizer
     if _model is None or _tokenizer is None:
+        model_id = "1bitLLM/bitnet_b1_58-large"  # patched from microsoft/bitnet‑b1.58‑2B‑4T
         _tokenizer = AutoTokenizer.from_pretrained(
             model_id,
             trust_remote_code=True
         )
         _model = AutoModelForCausalLM.from_pretrained(
             model_id,
             torch_dtype=torch.bfloat16,
             trust_remote_code=True
         )
 if __name__ == "__main__":
     # Preload model to avoid threading issues
     load_model()
+    demo.launch(ssr_mode=False, share=True)