# alexmarques's picture
# Upload folder using huggingface_hub
# 5a393d8 verified
# raw
# history blame
# 152 Bytes
# Quantization recipe: one stage (`quant_stage`) whose `quant_modifiers`
# mapping holds a single `QuantizationModifier` entry.
quant_stage:
  quant_modifiers:
    QuantizationModifier:
      # Entries left out of quantization. The `re:` prefix presumably marks
      # the entry as a regular expression for the consumer - TODO confirm.
      ignore: [lm_head, 're:.*block_sparse_moe.gate']
      # Quantization scheme name, passed through as a plain string.
      scheme: FP8
      # What the modifier is applied to (here the single value `Linear`).
      targets: Linear