Abhinav Kulkarni
committed on
Commit
·
846fb01
1
Parent(s):
5f1fe45
Updated README
Browse files
README.md
CHANGED
@@ -45,7 +45,7 @@ from transformers import AutoModelForCausalLM, AutoConfig, AutoTokenizer
|
|
45 |
from accelerate import init_empty_weights, load_checkpoint_and_dispatch
|
46 |
from huggingface_hub import snapshot_download
|
47 |
|
48 |
-
model_name = "mosaicml
|
49 |
|
50 |
# Config
|
51 |
config = AutoConfig.from_pretrained(model_name, trust_remote_code=True)
|
@@ -60,7 +60,7 @@ q_config = {
|
|
60 |
"q_group_size": 128,
|
61 |
}
|
62 |
|
63 |
-
load_quant = snapshot_download(
|
64 |
|
65 |
with init_empty_weights():
|
66 |
model = AutoModelForCausalLM.from_config(config=config,
|
|
|
45 |
from accelerate import init_empty_weights, load_checkpoint_and_dispatch
|
46 |
from huggingface_hub import snapshot_download
|
47 |
|
48 |
+
model_name = "abhinavkulkarni/mosaicml-mpt-30b-instruct-w4-g128-awq"
|
49 |
|
50 |
# Config
|
51 |
config = AutoConfig.from_pretrained(model_name, trust_remote_code=True)
|
|
|
60 |
"q_group_size": 128,
|
61 |
}
|
62 |
|
63 |
+
load_quant = snapshot_download(model_name)
|
64 |
|
65 |
with init_empty_weights():
|
66 |
model = AutoModelForCausalLM.from_config(config=config,
|