# Qwen3-30B-A3B.w4a16 / recipe.yaml
# Uploaded by nytopop using huggingface_hub (commit 3c66597, verified).
# File size: 180 bytes.
# Quantization recipe: one stage (`default_stage`) whose modifier group
# (`default_modifiers`) contains a single QuantizationModifier.
default_stage:
  default_modifiers:
    QuantizationModifier:
      # Names excluded from quantization. Entries prefixed with `re:` look
      # like regular expressions (note the `$` anchors) - presumably matched
      # against module names; confirm against the consuming tool.
      # NOTE(review): the `.` in `mlp.gate` is unescaped, so as a regex it
      # matches any character; likely harmless here, left unchanged.
      ignore: [lm_head, 're:.*mlp.gate$', 're:.*mlp.shared_expert_gate$']
      # Layer type(s) the scheme below is applied to.
      targets: [Linear]
      # Preset scheme name - presumably 4-bit weights / 16-bit activations;
      # TODO confirm against the quantization library's preset list.
      scheme: W4A16