danielhanchen committed
Commit: e24e953 • Parent: 2cd0ad1

Upload Qwen2ForCausalLM

Files changed: config.json (+2, -0) • generation_config.json (+2, -1)
config.json
CHANGED
@@ -16,6 +16,7 @@
   "num_attention_heads": 12,
   "num_hidden_layers": 28,
   "num_key_value_heads": 2,
+  "pad_token_id": 151665,
   "quantization_config": {
     "_load_in_4bit": true,
     "_load_in_8bit": false,
@@ -37,6 +38,7 @@
   "tie_word_embeddings": true,
   "torch_dtype": "bfloat16",
   "transformers_version": "4.44.2",
+  "unsloth_fixed": true,
   "use_cache": true,
   "use_sliding_window": false,
   "vocab_size": 151936
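(Not part of the commit itself: a minimal sketch of how the two added fields surface once this config is loaded with transformers. The repo id below is a placeholder, since this page does not name the repository; the printed values are taken from the diff above.)

from transformers import AutoConfig

# "your-org/your-qwen2-model" is a placeholder repo id, not the actual repository.
config = AutoConfig.from_pretrained("your-org/your-qwen2-model")

print(config.pad_token_id)         # 151665, added by this commit
print(config.unsloth_fixed)        # True; a non-standard key, kept as an extra config attribute
print(config.num_key_value_heads)  # 2 key/value heads vs. 12 query heads (grouped-query attention)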
generation_config.json
CHANGED
@@ -4,6 +4,7 @@
     151645,
     151643
   ],
-  "
+  "max_length": 4096,
+  "pad_token_id": 151665,
   "transformers_version": "4.44.2"
 }
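(Also not from the commit: a hedged sketch of why these generation defaults matter in practice. The repo id is again a placeholder, and the behavior shown is standard transformers generate() behavior rather than anything this repo documents.)

from transformers import AutoModelForCausalLM, AutoTokenizer

repo = "your-org/your-qwen2-model"  # placeholder repo id, not the actual repository
tok = AutoTokenizer.from_pretrained(repo)
model = AutoModelForCausalLM.from_pretrained(repo, device_map="auto")

# Batching unequal-length prompts requires a pad token; without pad_token_id in
# generation_config.json, generate() warns and falls back to eos_token_id.
batch = tok(["Hello", "A longer prompt"], padding=True, return_tensors="pt").to(model.device)

# max_new_tokens overrides the default cap here; if omitted, generation would
# instead stop at the max_length of 4096 set by this commit.
out = model.generate(**batch, max_new_tokens=32)
print(tok.batch_decode(out, skip_special_tokens=True))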