Update README.md
Browse files
README.md
CHANGED
@@ -291,11 +291,11 @@ for n, m in block.named_modules():
|
|
291 |
|
292 |
from auto_round import AutoRound
|
293 |
|
294 |
-
autoround = AutoRound(model=model, tokenizer=tokenizer, device_map=device_map,
|
295 |
batch_size=4, low_gpu_mem_usage=True, seqlen=2048,
|
296 |
)
|
297 |
autoround.quantize()
|
298 |
-
autoround.save_quantized(format="
|
299 |
|
300 |
~~~
|
301 |
|
|
|
291 |
|
292 |
from auto_round import AutoRound
|
293 |
|
294 |
+
autoround = AutoRound(model=model, tokenizer=tokenizer, device_map=device_map, nsamples=512,
|
295 |
batch_size=4, low_gpu_mem_usage=True, seqlen=2048,
|
296 |
)
|
297 |
autoround.quantize()
|
298 |
+
autoround.save_quantized(format="auto_awq", output_dir="tmp_autoround")
|
299 |
|
300 |
~~~
|
301 |
|