abhinavkulkarni
committed on
Commit
•
5da5f16
1
Parent(s):
6aa0aeb
Update README.md
Browse files
README.md
CHANGED
@@ -45,7 +45,7 @@ import torch
|
|
45 |
from awq.quantize.quantizer import real_quantize_model_weight
|
46 |
from transformers import AutoModelForCausalLM, AutoConfig, AutoTokenizer
|
47 |
from accelerate import init_empty_weights, load_checkpoint_and_dispatch
|
48 |
-
from huggingface_hub import
|
49 |
|
50 |
model_name = "psmathur/orca_mini_v2_13b"
|
51 |
|
@@ -62,7 +62,7 @@ q_config = {
|
|
62 |
"q_group_size": 128,
|
63 |
}
|
64 |
|
65 |
-
load_quant =
|
66 |
|
67 |
with init_empty_weights():
|
68 |
model = AutoModelForCausalLM.from_pretrained(model_name, config=config,
|
|
|
45 |
from awq.quantize.quantizer import real_quantize_model_weight
|
46 |
from transformers import AutoModelForCausalLM, AutoConfig, AutoTokenizer
|
47 |
from accelerate import init_empty_weights, load_checkpoint_and_dispatch
|
48 |
+
from huggingface_hub import snapshot_download
|
49 |
|
50 |
model_name = "psmathur/orca_mini_v2_13b"
|
51 |
|
|
|
62 |
"q_group_size": 128,
|
63 |
}
|
64 |
|
65 |
+
load_quant = snapshot_download('abhinavkulkarni/psmathur-orca_mini_v2_13b-w4-g128-awq')
|
66 |
|
67 |
with init_empty_weights():
|
68 |
model = AutoModelForCausalLM.from_pretrained(model_name, config=config,
|