File size: 152 Bytes
5a393d8 |
1 2 3 4 5 6 7 |
# Quantization recipe: one stage containing a single QuantizationModifier
# that applies the FP8 scheme to Linear targets.
# NOTE(review): the nesting below is reconstructed -- in the captured text
# every key sat at column 0, which YAML parses as six unrelated top-level
# keys (three of them null). Confirm against the original recipe file.
quant_stage:
  quant_modifiers:
    QuantizationModifier:
      # Entries excluded from quantization: the literal name `lm_head`, plus
      # a pattern entry carrying an `re:` prefix (presumably interpreted as a
      # regex over module names, here matching MoE router gates -- confirm).
      ignore: [lm_head, 're:.*block_sparse_moe.gate']
      scheme: FP8
      targets: Linear
|
5a393d8 |
1 2 3 4 5 6 7 |
# Quantization recipe: one stage containing a single QuantizationModifier
# that applies the FP8 scheme to Linear targets.
# NOTE(review): the nesting below is reconstructed -- in the captured text
# every key sat at column 0, which YAML parses as six unrelated top-level
# keys (three of them null). Confirm against the original recipe file.
quant_stage:
  quant_modifiers:
    QuantizationModifier:
      # Entries excluded from quantization: the literal name `lm_head`, plus
      # a pattern entry carrying an `re:` prefix (presumably interpreted as a
      # regex over module names, here matching MoE router gates -- confirm).
      ignore: [lm_head, 're:.*block_sparse_moe.gate']
      scheme: FP8
      targets: Linear
|