MultiVerse_70B_AWQ / quant_config.json
AlanRobotics's picture
Create quant_config.json
c22867e verified
raw
history blame
285 Bytes
{
"backend": "autoawq",
"bits": 4,
"do_fuse": false,
"exllama_config": null,
"fuse_max_seq_len": null,
"group_size": 128,
"modules_to_fuse": null,
"modules_to_not_convert": null,
"quant_method": "awq",
"version": "gemm",
"zero_point": true
}