onebitquantized committed on
Commit 95535c9
1 Parent(s): 531288a

Upload of AutoGPTQ quantized model

config.json CHANGED
@@ -33,7 +33,7 @@
  "model_file_base_name": null,
  "model_name_or_path": null,
  "quant_method": "gptq",
- "shrink": 0.01,
+ "shrink": 0.0625,
  "static_groups": false,
  "sym": false,
  "true_sequential": true
gptq_model-4bit--1g.safetensors CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:64bdbc1b114418d222a7f4fd72557b09fda9f5d66c242ace7b0ff4a7f4c3970d
+ oid sha256:c63030276fa9b54a46f6d3f2fea35f7637289d24638dcefcda5ad5ec903b4cd2
  size 2990657120
quantize_config.json CHANGED
@@ -9,7 +9,7 @@
  "model_name_or_path": null,
  "model_file_base_name": null,
  "exponent_hinv": 4.0,
- "shrink": 0.01,
+ "shrink": 0.0625,
  "quant_method": "gptq",
  "checkpoint_format": "gptq"
  }
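
For reference, a minimal loading sketch for a checkpoint laid out like this one. The repo id and device are assumptions (not part of this commit), and the extra "shrink" / "exponent_hinv" fields are non-standard GPTQ config keys, so this assumes either a fork that understands them or a loader that ignores unknown keys; it is not the uploader's documented usage.

# Minimal sketch, assuming the repo id below (hypothetical) and a CUDA device.
from transformers import AutoTokenizer
from auto_gptq import AutoGPTQForCausalLM

repo_id = "onebitquantized/<model-name>"  # hypothetical placeholder, not from the diff

tokenizer = AutoTokenizer.from_pretrained(repo_id)
model = AutoGPTQForCausalLM.from_quantized(
    repo_id,
    device="cuda:0",
    use_safetensors=True,                 # matches gptq_model-4bit--1g.safetensors
    model_basename="gptq_model-4bit--1g",
)

# Quick smoke test of the quantized weights.
inputs = tokenizer("Hello", return_tensors="pt").to("cuda:0")
print(tokenizer.decode(model.generate(**inputs, max_new_tokens=16)[0]))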