manaestras committed on
Commit
4a654bc
·
verified ·
1 Parent(s): 37e090c

Upload angelslim_config.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. angelslim_config.json +69 -0
angelslim_config.json ADDED
@@ -0,0 +1,69 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_config": {
3
+ "name": "HunyuanDense",
4
+ "model_path": "/",
5
+ "trust_remote_code": true,
6
+ "torch_dtype": "auto",
7
+ "device_map": "cpu",
8
+ "low_cpu_mem_usage": true,
9
+ "use_cache": false
10
+ },
11
+ "compression_config": {
12
+ "name": "PTQ",
13
+ "quantization": {
14
+ "name": "int4_awq",
15
+ "bits": 4,
16
+ "quant_method": {
17
+ "weight": "per-group",
18
+ "group_size": 128,
19
+ "zero_point": true,
20
+ "mse_range": false
21
+ },
22
+ "quant_helpers": [],
23
+ "smooth_alpha": 0.5,
24
+ "low_memory": false,
25
+ "modules_to_quantize": [],
26
+ "zero_point": true,
27
+ "mse_range": false,
28
+ "ignore_layers": [
29
+ "lm_head",
30
+ "model.embed_tokens"
31
+ ],
32
+ "quant_analyse": false
33
+ }
34
+ },
35
+ "dataset_config": {
36
+ "name": "TextDataset",
37
+ "data_path": "./dataset/PTQ_data.jsonl",
38
+ "max_seq_length": 4096,
39
+ "num_samples": 128,
40
+ "batch_size": 1,
41
+ "shuffle": false
42
+ },
43
+ "global_config": {
44
+ "save_path": "/",
45
+ "max_seq_length": 4096,
46
+ "hidden_size": 4096,
47
+ "model_arch_type": "hunyuan_v1_dense",
48
+ "deploy_backend": "vllm"
49
+ },
50
+ "debug_info": {
51
+ "python": "3.10.14 (main, Mar 6 2025, 18:16:47) [GCC 11.4.0]",
52
+ "angelslim": {
53
+ "name": "angelslim",
54
+ "version": "be35620eca8ad4e6bf8263e84cee69d90c7045a4",
55
+ "source": "git"
56
+ },
57
+ "torch": {
58
+ "name": "torch",
59
+ "version": "2.7.0",
60
+ "source": "pip"
61
+ },
62
+ "transformers": {
63
+ "name": "transformers",
64
+ "version": "4.52.4",
65
+ "source": "pip"
66
+ },
67
+ "torch_cuda_version": "12.6"
68
+ }
69
+ }