Shaun Prince
committed on
Commit
·
4cb4b07
1
Parent(s):
b080700
add quant config
Browse files
- README.md +1 -0
- quant_config.json +6 -0
README.md
CHANGED
@@ -1,3 +1,4 @@
|
|
1 |
---
|
2 |
license: apache-2.0
|
3 |
---
|
|
|
|
1 |
---
|
2 |
license: apache-2.0
|
3 |
---
|
4 |
+
# ResplendentAI/Persephone_7B AWQ
|
quant_config.json
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"zero_point": true,
|
3 |
+
"q_group_size": 128,
|
4 |
+
"w_bit": 4,
|
5 |
+
"version": "GEMM"
|
6 |
+
}
|