File size: 152 Bytes
5a393d8
 
 
 
 
 
1
2
3
4
5
6
7
# Quantization recipe with one stage containing a single QuantizationModifier.
# NOTE(review): the layout looks like an llm-compressor recipe; confirm
# against the tool that consumes this file.
quant_stage:
  quant_modifiers:
    QuantizationModifier:
      # Selector for what the modifier is applied to.
      targets: Linear
      # Name of the quantization scheme to apply.
      scheme: FP8
      # Entries excluded from quantization. The `re:` prefix presumably
      # marks the entry as a regular expression rather than an exact
      # name; verify against the consumer's matching rules.
      ignore:
        - lm_head
        - 're:.*block_sparse_moe.gate'