woodchen7 committed on
Commit 896d04a · verified · 1 Parent(s): e54ecbd

Upload config.json with huggingface_hub

Files changed (1):
  1. config.json +57 -36
config.json CHANGED
@@ -1,37 +1,58 @@
 {
-  "_attn_implementation_autoset": true,
-  "architectures": [
-    "Qwen2ForCausalLM"
-  ],
-  "attention_dropout": 0.0,
-  "bos_token_id": 151643,
-  "eos_token_id": 151645,
-  "hidden_act": "silu",
-  "hidden_size": 1536,
-  "initializer_range": 0.02,
-  "intermediate_size": 8960,
-  "max_position_embeddings": 32768,
-  "max_window_layers": 21,
-  "model_type": "qwen2",
-  "num_attention_heads": 12,
-  "num_hidden_layers": 28,
-  "num_key_value_heads": 2,
-  "quantization_config": {
-    "bits": 4,
-    "group_size": 128,
-    "modules_to_not_convert": null,
-    "quant_method": "awq",
-    "version": "gemm",
-    "zero_point": true
-  },
-  "rms_norm_eps": 1e-06,
-  "rope_scaling": null,
-  "rope_theta": 1000000.0,
-  "sliding_window": 32768,
-  "tie_word_embeddings": true,
-  "torch_dtype": "float16",
-  "transformers_version": "4.51.3",
-  "use_cache": false,
-  "use_sliding_window": false,
-  "vocab_size": 151936
-}
+  "architectures": [
+    "Qwen2ForCausalLM"
+  ],
+  "attention_dropout": 0.0,
+  "bos_token_id": 151643,
+  "eos_token_id": 151645,
+  "hidden_act": "silu",
+  "hidden_size": 1536,
+  "initializer_range": 0.02,
+  "intermediate_size": 8960,
+  "max_position_embeddings": 32768,
+  "max_window_layers": 21,
+  "model_type": "qwen2",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 28,
+  "num_key_value_heads": 2,
+  "quantization_config": {
+    "config_groups": {
+      "group_0": {
+        "input_activations": {
+          "dynamic": false,
+          "num_bits": 8,
+          "strategy": "tensor",
+          "type": "float"
+        },
+        "output_activations": null,
+        "targets": [
+          "Linear"
+        ],
+        "weights": {
+          "dynamic": false,
+          "num_bits": 8,
+          "strategy": "tensor",
+          "type": "float"
+        }
+      }
+    },
+    "format": "naive-quantized",
+    "kv_cache_scheme": null,
+    "quant_method": "compressed-tensors",
+    "quantization_status": "compressed",
+    "ignored_layers": [
+      "lm_head",
+      "model.embed_tokens"
+    ]
+  },
+  "rms_norm_eps": 1e-06,
+  "rope_scaling": null,
+  "rope_theta": 1000000.0,
+  "sliding_window": 32768,
+  "tie_word_embeddings": true,
+  "torch_dtype": "bfloat16",
+  "transformers_version": "4.51.3",
+  "use_cache": false,
+  "use_sliding_window": false,
+  "vocab_size": 151936
+}
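
In short, this commit replaces the 4-bit AWQ quantization_config with a static per-tensor FP8 scheme in the compressed-tensors format (8-bit float weights and input activations on every Linear layer, with lm_head and model.embed_tokens left unquantized) and switches torch_dtype from float16 to bfloat16. Below is a minimal loading sketch, assuming a transformers install recent enough to deserialize quant_method "compressed-tensors" (the config records 4.51.3) with the compressed-tensors package available; the repo id is a placeholder, not this model's actual repository.

from transformers import AutoModelForCausalLM, AutoTokenizer

# Placeholder repo id; substitute the repository this config.json belongs to.
REPO_ID = "your-org/your-qwen2-fp8-model"

# transformers reads quantization_config["quant_method"] == "compressed-tensors"
# from config.json and handles the FP8 Linear weights on load;
# torch_dtype="auto" picks up the bfloat16 recorded above.
model = AutoModelForCausalLM.from_pretrained(REPO_ID, torch_dtype="auto")
tokenizer = AutoTokenizer.from_pretrained(REPO_ID)

inputs = tokenizer("Hello", return_tensors="pt").to(model.device)
print(tokenizer.decode(model.generate(**inputs, max_new_tokens=20)[0]))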
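For context, configs of this shape are what llm-compressor emits for its static FP8 preset. The sketch below is an assumption-laden reconstruction, not the uploader's actual recipe: the base model id is a guess from the dimensions above (hidden_size 1536, 28 layers, 12 attention heads, 2 KV heads match the Qwen2/Qwen2.5 1.5B Instruct family), the calibration dataset choice is arbitrary, and the llmcompressor import paths may differ by version.

from llmcompressor.modifiers.quantization import QuantizationModifier
from llmcompressor.transformers import oneshot

# Assumption: a base checkpoint whose dimensions match this config.
MODEL_ID = "Qwen/Qwen2.5-1.5B-Instruct"

# The "FP8" preset applies static per-tensor float8 quantization to the
# weights and input activations of every Linear module, mirroring
# config_groups.group_0 above; lm_head and the embeddings are skipped,
# matching ignored_layers.
recipe = QuantizationModifier(
    targets="Linear",
    scheme="FP8",
    ignore=["lm_head", "model.embed_tokens"],
)

# Static (non-dynamic) activation scales need a small calibration pass.
oneshot(
    model=MODEL_ID,
    dataset="open_platypus",            # assumption: any small calibration set
    recipe=recipe,
    max_seq_length=2048,
    num_calibration_samples=512,
    output_dir="qwen2-1.5b-instruct-fp8",  # writes a config.json much like the one above
)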