orpheus-sparse-fp8 / recipe.yaml
shadowlilac's picture
Upload folder using huggingface_hub
f57058f verified
# Compression recipe: one stage holding two modifiers.
# NOTE(review): the nesting below was reconstructed from a copy whose
# indentation had been flattened (which left two sibling `targets` keys in
# one mapping). Confirm it against the consuming tool's recipe schema.
default_stage:
  default_modifiers:
    # Pruning settings: sparsity ratio 0.5 with a '2:4' mask structure.
    SparseGPTModifier:
      sparsity: 0.5
      # Quoted so the value stays a string; a bare 2:4 can be read as a
      # sexagesimal integer by YAML 1.1 parsers.
      mask_structure: '2:4'
      sequential_update: true
      # The 're:' prefix presumably marks the entry as a regular expression
      # over module names - verify against the consumer. Single quotes keep
      # the backslash in \d literal.
      targets: ['re:model.layers.\d*$']
    # Quantization settings: targets Linear, lists lm_head under `ignore`,
    # and selects the FP8_DYNAMIC scheme.
    QuantizationModifier:
      targets: [Linear]
      ignore: [lm_head]
      scheme: FP8_DYNAMIC