{
  "model_config": {
    "name": "HunyuanDense",
    "model_path": "/",
    "trust_remote_code": true,
    "torch_dtype": "auto",
    "device_map": "cpu",
    "low_cpu_mem_usage": true,
    "use_cache": false
  },
  "compression_config": {
    "name": "PTQ",
    "quantization": {
      "name": "int4_awq",
      "bits": 4,
      "quant_method": {
        "weight": "per-group",
        "group_size": 128,
        "zero_point": true,
        "mse_range": false
      },
      "quant_helpers": [],
      "smooth_alpha": 0.5,
      "low_memory": false,
      "modules_to_quantize": [],
      "zero_point": true,
      "mse_range": false,
      "ignore_layers": [
        "lm_head",
        "model.embed_tokens"
      ],
      "quant_analyse": false
    }
  },
  "dataset_config": {
    "name": "TextDataset",
    "data_path": "./dataset/PTQ_data.jsonl",
    "max_seq_length": 4096,
    "num_samples": 128,
    "batch_size": 1,
    "shuffle": false
  },
  "global_config": {
    "save_path": "/",
    "max_seq_length": 4096,
    "hidden_size": 2048,
    "model_arch_type": "hunyuan_v1_dense",
    "deploy_backend": "vllm"
  },
  "debug_info": {
    "python": "3.10.14 (main, Mar 6 2025, 18:16:47) [GCC 11.4.0]",
    "angelslim": {
      "name": "angelslim",
      "version": "be35620eca8ad4e6bf8263e84cee69d90c7045a4",
      "source": "git"
    },
    "torch": {
      "name": "torch",
      "version": "2.7.0",
      "source": "pip"
    },
    "transformers": {
      "name": "transformers",
      "version": "4.52.4",
      "source": "pip"
    },
    "torch_cuda_version": "12.6"
  }
}