reinforce20001
/

Sakura-GalTransl-14B-v3.8-NVFP4

8-bit precision

compressed-tensors

Model card | Files and versions

Sakura-GalTransl-14B-v3.8-NVFP4

File size: 204 Bytes

f2e269a

# Quantization recipe: one stage (`default_stage`) holding a single modifier.
# NOTE(review): presumably consumed by llm-compressor / compressed-tensors
# (the page tags mention compressed-tensors) — confirm against the tool.
default_stage:
  default_modifiers:
    QuantizationModifier:
      # Entries the modifier is applied to.
      targets:
        - Linear
      # Entries excluded from the modifier. The `re:` prefix presumably marks
      # the remainder as a regular expression matched against module names
      # — TODO confirm.
      # NOTE(review): the `.` inside `mlp.gate` / `mlp.shared_expert_gate` is
      # unescaped, so under regex semantics it matches any character, not only
      # a literal dot. Left byte-identical on purpose.
      ignore:
        - 're:.*lm_head'
        - 're:.*visual.*'
        - 're:.*mlp.gate$'
        - 're:.*mlp.shared_expert_gate$'
      # Name of the quantization scheme applied to the targets.
      scheme: NVFP4