File size: 1,844 Bytes
b0eb9e7 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 |
{
"model_config": {
"name": "HunyuanDense",
"model_path": "/",
"trust_remote_code": true,
"torch_dtype": "auto",
"device_map": "auto",
"low_cpu_mem_usage": true,
"use_cache": false
},
"compression_config": {
"name": "PTQ",
"quantization": {
"name": "fp8_static",
"bits": 8,
"quant_method": {
"weight": "per-tensor",
"activation": "per-tensor"
},
"quant_helpers": [],
"smooth_alpha": 0.5,
"low_memory": false,
"modules_to_quantize": [],
"zero_point": true,
"mse_range": false,
"ignore_layers": [
"lm_head",
"model.embed_tokens"
],
"quant_analyse": false
}
},
"dataset_config": {
"name": "TextDataset",
"data_path": "./dataset/PTQ_data.jsonl",
"max_seq_length": 4096,
"num_samples": 512,
"batch_size": 1,
"shuffle": false
},
"global_config": {
"save_path": "/",
"max_seq_length": 4096,
"hidden_size": 2048,
"model_arch_type": "hunyuan_v1_dense",
"deploy_backend": "vllm"
},
"debug_info": {
"python": "3.10.14 (main, Mar 6 2025, 18:16:47) [GCC 11.4.0]",
"angelslim": {
"name": "angelslim",
"version": "be35620eca8ad4e6bf8263e84cee69d90c7045a4",
"source": "git"
},
"torch": {
"name": "torch",
"version": "2.7.0",
"source": "pip"
},
"transformers": {
"name": "transformers",
"version": "4.52.4",
"source": "pip"
},
"torch_cuda_version": "12.6"
}
}
|