manaestras committed on
Commit
25718c2
·
verified ·
1 Parent(s): e3acf0a

Upload hf_quant_config.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. hf_quant_config.json +10 -0
hf_quant_config.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "quantization": {
3
+ "exclude_modules": [
4
+ "lm_head",
5
+ "model.embed_tokens"
6
+ ],
7
+ "kv_cache_quant_algo": null,
8
+ "quant_algo": "FP8"
9
+ }
10
+ }