File size: 1,903 Bytes
069aff8
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
{
    "model_config": {
        "name": "HunyuanDense",
        "model_path": "/",
        "trust_remote_code": true,
        "torch_dtype": "auto",
        "device_map": "cpu",
        "low_cpu_mem_usage": true,
        "use_cache": false
    },
    "compression_config": {
        "name": "PTQ",
        "quantization": {
            "name": "int4_awq",
            "bits": 4,
            "quant_method": {
                "weight": "per-group",
                "group_size": 128,
                "zero_point": true,
                "mse_range": false
            },
            "quant_helpers": [],
            "smooth_alpha": 0.5,
            "low_memory": false,
            "modules_to_quantize": [],
            "zero_point": true,
            "mse_range": false,
            "ignore_layers": [
                "lm_head",
                "model.embed_tokens"
            ],
            "quant_analyse": false
        }
    },
    "dataset_config": {
        "name": "TextDataset",
        "data_path": "./dataset/PTQ_data.jsonl",
        "max_seq_length": 4096,
        "num_samples": 128,
        "batch_size": 1,
        "shuffle": false
    },
    "global_config": {
        "save_path": "/",
        "max_seq_length": 4096,
        "hidden_size": 3072,
        "model_arch_type": "hunyuan_v1_dense",
        "deploy_backend": "vllm"
    },
    "debug_info": {
        "python": "3.10.14 (main, Mar  6 2025, 18:16:47) [GCC 11.4.0]",
        "angelslim": {
            "name": "angelslim",
            "version": "be35620eca8ad4e6bf8263e84cee69d90c7045a4",
            "source": "git"
        },
        "torch": {
            "name": "torch",
            "version": "2.7.0",
            "source": "pip"
        },
        "transformers": {
            "name": "transformers",
            "version": "4.52.4",
            "source": "pip"
        },
        "torch_cuda_version": "12.6"
    }
}