Upload model files
Browse files
- config.json +2 -2
- model.safetensors +2 -2
config.json
CHANGED
@@ -16,7 +16,7 @@
|
|
16 |
"model_type": "llama",
|
17 |
"num_attention_heads": 4,
|
18 |
"num_hidden_layers": 2,
|
19 |
-
"num_key_value_heads":
|
20 |
"pretraining_tp": 1,
|
21 |
"quantization_config": {
|
22 |
"algo_config": null,
|
@@ -36,7 +36,7 @@
|
|
36 |
"weight": {
|
37 |
"ch_axis": 1,
|
38 |
"dtype": "uint4",
|
39 |
-
"group_size":
|
40 |
"is_dynamic": false,
|
41 |
"observer_cls": "PerGroupMinMaxObserver",
|
42 |
"qscheme": "per_group",
|
|
|
16 |
"model_type": "llama",
|
17 |
"num_attention_heads": 4,
|
18 |
"num_hidden_layers": 2,
|
19 |
+
"num_key_value_heads": 2,
|
20 |
"pretraining_tp": 1,
|
21 |
"quantization_config": {
|
22 |
"algo_config": null,
|
|
|
36 |
"weight": {
|
37 |
"ch_axis": 1,
|
38 |
"dtype": "uint4",
|
39 |
+
"group_size": 32,
|
40 |
"is_dynamic": false,
|
41 |
"observer_cls": "PerGroupMinMaxObserver",
|
42 |
"qscheme": "per_group",
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6adccba13f3eb67040fc2deb588948bca63a605b4e4701354b2c9a31882d13cd
|
3 |
+
size 20086792
|