nm-testing
/

Meta-Llama-3-8B-Instruct-fp8-hf_compat

File size: 124 Bytes

14a1fe3

# Quantization recipe: one stage holding a single QuantizationModifier.
# NOTE(review): the layout looks like an llm-compressor / SparseML-style
# recipe - confirm against the tool that actually loads this file.
quant_stage:
  quant_modifiers:
    QuantizationModifier:
      # Names left out of this modifier (presumably the output head is
      # kept unquantized - verify with the consumer).
      ignore:
        - lm_head
      # Names this modifier is applied to (presumably a layer/module
      # type - verify with the consumer).
      targets:
        - Linear
      # Scheme identifier passed to the modifier.
      scheme: FP8