OPEA
/

Safetensors
mllama
4-bit precision
auto-round
cicdatopea committed on
Commit
6be8cdf
·
verified ·
1 Parent(s): 0c9b026

Update config.json

Browse files
Files changed (1) hide show
  1. config.json +1 -44
config.json CHANGED
@@ -26,50 +26,7 @@
26
  "scale_dtype": "torch.float16",
27
  "seqlen": 512,
28
  "sym": true,
29
- "to_quant_block_names": [
30
- [
31
- "language_model.model.layers.0",
32
- "language_model.model.layers.1",
33
- "language_model.model.layers.2",
34
- "language_model.model.layers.3",
35
- "language_model.model.layers.4",
36
- "language_model.model.layers.5",
37
- "language_model.model.layers.6",
38
- "language_model.model.layers.7",
39
- "language_model.model.layers.8",
40
- "language_model.model.layers.9",
41
- "language_model.model.layers.10",
42
- "language_model.model.layers.11",
43
- "language_model.model.layers.12",
44
- "language_model.model.layers.13",
45
- "language_model.model.layers.14",
46
- "language_model.model.layers.15",
47
- "language_model.model.layers.16",
48
- "language_model.model.layers.17",
49
- "language_model.model.layers.18",
50
- "language_model.model.layers.19",
51
- "language_model.model.layers.20",
52
- "language_model.model.layers.21",
53
- "language_model.model.layers.22",
54
- "language_model.model.layers.23",
55
- "language_model.model.layers.24",
56
- "language_model.model.layers.25",
57
- "language_model.model.layers.26",
58
- "language_model.model.layers.27",
59
- "language_model.model.layers.28",
60
- "language_model.model.layers.29",
61
- "language_model.model.layers.30",
62
- "language_model.model.layers.31",
63
- "language_model.model.layers.32",
64
- "language_model.model.layers.33",
65
- "language_model.model.layers.34",
66
- "language_model.model.layers.35",
67
- "language_model.model.layers.36",
68
- "language_model.model.layers.37",
69
- "language_model.model.layers.38",
70
- "language_model.model.layers.39"
71
- ]
72
- ]
73
  },
74
  "text_config": {
75
  "_attn_implementation_autoset": false,
 
26
  "scale_dtype": "torch.float16",
27
  "seqlen": 512,
28
  "sym": true,
29
+ "block_name_to_quantize":"language_model.model.layers"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
30
  },
31
  "text_config": {
32
  "_attn_implementation_autoset": false,