QwenLong-L1-32B-4bit-DWQ / conversion_script.py
Narutoouz's picture
Upload QwenLong-L1-32B-4bit-DWQ DWQ 4-bit quantized model with comprehensive documentation
478d3b0 verified
#!/usr/bin/env python3
"""
Conversion script used to create QwenLong-L1-32B-4bit-DWQ
"""
from mlx_lm import convert
import time
def convert_to_dwq():
    """Quantize WaveCut/QwenLong-L1-32B into a 4-bit MLX model directory.

    Calls ``mlx_lm.convert`` with quantization enabled (4 bits, group size
    128) and ``./QwenLong-L1-32B-4bit-DWQ/`` as the output path.
    """
    config = {
        "group_size": 128,
        "bits": 4,
        # NOTE(review): this entry is never read below -- the convert() call
        # receives no calibration argument. Kept as a record of the intended
        # setting; confirm where (or whether) calibration was applied.
        "calibration_samples": 50,
    }
    convert(
        # Passed positionally: convert() names this parameter ``hf_path``,
        # not ``path``, so a ``path=`` keyword would raise TypeError.
        "WaveCut/QwenLong-L1-32B",
        mlx_path="./QwenLong-L1-32B-4bit-DWQ/",
        quantize=True,
        q_group_size=config["group_size"],
        q_bits=config["bits"],
    )
# Run the conversion only when this file is executed as a script, so that
# importing the module has no side effects.
if __name__ == "__main__":
    convert_to_dwq()