diff --git a/config.json b/config.json index 2ac056bcf2c53a63450c40b5d553500182a58b65..100d719a00586c08671b85c3d72c2c816d003331 100644 --- a/config.json +++ b/config.json @@ -88,6 +88,15 @@ "model.layers.1.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.10.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.10.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.10.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.10.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -103,6 +112,15 @@ "model.layers.10.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.11.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.11.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.11.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.11.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -118,6 +136,15 @@ "model.layers.11.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.12.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.12.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.12.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.12.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -133,6 +160,15 @@ "model.layers.12.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.13.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.13.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.13.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.13.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -148,6 +184,15 @@ "model.layers.13.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.14.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.14.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.14.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.14.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -163,6 +208,15 @@ "model.layers.14.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.15.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.15.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.15.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.15.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -178,6 +232,15 @@ "model.layers.15.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.16.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.16.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.16.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.16.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -193,6 +256,15 @@ "model.layers.16.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.17.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.17.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.17.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.17.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -208,6 +280,15 @@ "model.layers.17.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.18.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.18.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.18.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.18.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -223,6 +304,15 @@ "model.layers.18.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.19.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.19.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.19.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.19.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -262,6 +352,15 @@ "model.layers.2.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.20.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.20.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.20.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.20.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -277,6 +376,15 @@ "model.layers.20.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.21.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.21.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.21.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.21.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -292,6 +400,15 @@ "model.layers.21.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.22.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.22.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.22.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.22.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -307,6 +424,15 @@ "model.layers.22.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.23.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.23.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.23.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.23.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -322,6 +448,15 @@ "model.layers.23.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.24.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.24.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.24.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.24.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -337,6 +472,15 @@ "model.layers.24.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.25.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.25.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.25.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.25.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -352,6 +496,15 @@ "model.layers.25.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.26.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.26.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.26.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.26.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -367,6 +520,15 @@ "model.layers.26.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.27.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.27.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.27.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.27.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -382,6 +544,15 @@ "model.layers.27.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.28.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.28.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.28.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.28.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -397,6 +568,15 @@ "model.layers.28.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.29.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.29.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.29.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.29.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -412,6 +592,15 @@ "model.layers.29.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.3.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.3.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.3.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.3.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -427,6 +616,15 @@ "model.layers.3.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.30.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.30.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.30.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.30.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -442,6 +640,15 @@ "model.layers.30.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.31.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.31.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.31.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.31.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -457,6 +664,15 @@ "model.layers.31.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.32.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.32.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.32.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.32.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -472,6 +688,15 @@ "model.layers.32.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.33.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.33.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.33.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.33.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -487,6 +712,15 @@ "model.layers.33.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.34.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.34.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.34.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.34.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -502,6 +736,15 @@ "model.layers.34.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.35.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.35.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.35.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.35.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -517,6 +760,15 @@ "model.layers.35.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.36.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.36.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.36.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.36.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -532,6 +784,15 @@ "model.layers.36.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.37.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.37.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.37.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.37.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -547,6 +808,15 @@ "model.layers.37.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.38.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.38.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.38.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.38.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -562,6 +832,15 @@ "model.layers.38.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.39.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.39.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.39.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.39.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -577,6 +856,15 @@ "model.layers.39.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.4.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.4.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.4.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.4.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -592,6 +880,15 @@ "model.layers.4.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.40.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.40.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.40.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.40.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -607,6 +904,15 @@ "model.layers.40.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.41.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.41.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.41.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.41.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -622,6 +928,15 @@ "model.layers.41.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.42.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.42.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.42.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.42.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -637,6 +952,15 @@ "model.layers.42.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.43.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.43.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.43.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.43.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -652,6 +976,15 @@ "model.layers.43.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.44.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.44.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.44.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.44.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -667,6 +1000,15 @@ "model.layers.44.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.45.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.45.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.45.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.45.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -682,6 +1024,15 @@ "model.layers.45.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.46.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.46.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.46.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.46.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -697,6 +1048,15 @@ "model.layers.46.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.47.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.47.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.47.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.47.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -712,6 +1072,15 @@ "model.layers.47.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.48.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.48.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.48.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.48.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -727,6 +1096,15 @@ "model.layers.48.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.49.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.49.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.49.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.49.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -742,6 +1120,15 @@ "model.layers.49.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.5.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.5.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.5.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.5.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -757,6 +1144,15 @@ "model.layers.5.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.50.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.50.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.50.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.50.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -772,6 +1168,15 @@ "model.layers.50.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.51.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.51.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.51.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.51.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -787,6 +1192,15 @@ "model.layers.51.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.52.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.52.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.52.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.52.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -802,6 +1216,15 @@ "model.layers.52.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.53.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.53.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.53.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.53.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -817,6 +1240,15 @@ "model.layers.53.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.54.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.54.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.54.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.54.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -832,6 +1264,15 @@ "model.layers.54.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.55.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.55.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.55.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.55.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -847,6 +1288,15 @@ "model.layers.55.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.56.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.56.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.56.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.56.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -862,6 +1312,15 @@ "model.layers.56.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.57.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.57.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.57.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.57.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -877,6 +1336,15 @@ "model.layers.57.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.58.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.58.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.58.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.58.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -892,6 +1360,15 @@ "model.layers.58.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.59.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.59.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.59.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.59.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -907,6 +1384,15 @@ "model.layers.59.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.6.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.6.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.6.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.6.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -922,6 +1408,15 @@ "model.layers.6.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.60.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.60.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.60.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.60.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -937,6 +1432,15 @@ "model.layers.60.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.7.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.7.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.7.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.7.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -952,6 +1456,15 @@ "model.layers.7.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.8.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.8.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.8.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.8.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, @@ -967,6 +1480,15 @@ "model.layers.8.self_attn.q_b_proj": { "bits": 8 }, + "model.layers.9.mlp.shared_experts.down_proj": { + "bits": 8 + }, + "model.layers.9.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.9.mlp.shared_experts.up_proj": { + "bits": 8 + }, "model.layers.9.self_attn.kv_a_proj_with_mqa": { "bits": 8 }, diff --git a/model-00002-of-00072.safetensors b/model-00002-of-00072.safetensors index 7c43e9a3e7f0a21cd117f9ceedd29b30df17a0b2..8b273605cecc45c3e69bdf180225c5257ec385d0 100644 --- a/model-00002-of-00072.safetensors +++ b/model-00002-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b5a5ba61ae9bf2b3907e48105177902846e063f40a76301c19907c68f47c95b1 -size 5000051392 +oid sha256:0462b3a214fa5ea5bad4b053f2a70b6d65919d962a0e1ac9f894161efbc496a7 +size 4999591680 diff --git a/model-00003-of-00072.safetensors b/model-00003-of-00072.safetensors index 38ca45e88d63c0bc0cdb6fba8a17a66ec5441436..fdd9aac8fde872c0e0d27e69b3b51b1f117c7dc1 100644 --- a/model-00003-of-00072.safetensors +++ b/model-00003-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b08a3f557e84a92e41f1e92f99f550cc0d8a8442f21b95eb3fa480703eecc1f8 -size 4995991608 +oid sha256:88b741b175aa1149079d35cc5bfb86bc16aa1e0e88f1e2ebf8831fafd427c63a +size 4995762096 diff --git a/model-00004-of-00072.safetensors b/model-00004-of-00072.safetensors index a6fc634a64b3f8efc2b91e2f42a42933a48a934e..b333c9a4056bce732d84413b4d3ba937410f409d 100644 --- a/model-00004-of-00072.safetensors +++ b/model-00004-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7020b0c09d1aca0b1a508d4d3039b3904dbd74953334cd8a2769ec3608b9108b -size 5000050912 +oid sha256:8f7d2a3285f7458d3e92649afdac0b9f973ab5a08167511e6f65b6e42253d2de +size 4999591192 diff --git a/model-00005-of-00072.safetensors b/model-00005-of-00072.safetensors index 24b36a045f01fec1d6abf8d2099edb3082ed7557..b3169eacef121fb31fc820c723b84dc8c668931a 100644 --- a/model-00005-of-00072.safetensors +++ b/model-00005-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:72f624ca05d3b54dfc34267ee659ba12d15d5b372db2feec13fe2b496a2d8211 -size 5000222944 +oid sha256:fd8e279298f6750bf7a9a6a9011e78a2d2558cc3478fe9aa0468ed5579dd1738 +size 4999591176 diff --git a/model-00006-of-00072.safetensors b/model-00006-of-00072.safetensors index 0b81da868750f62e580ef23b0a66494337189984..1b71c3e82bc8328f0c4ccc006128a25c589d2733 100644 --- a/model-00006-of-00072.safetensors +++ b/model-00006-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c3a0f1fb2164bab6a13fa7a54501d09996c34d7e41a6cb2d39d9d621e0410ad4 -size 4992940416 +oid sha256:525493633455c0f46e00b6bb06417ecc803a746b8848132d9c2a30f88b6f1087 +size 4999591384 diff --git a/model-00007-of-00072.safetensors b/model-00007-of-00072.safetensors index b944b3d8cf2acaf8283289bf543b87b1eaf62342..20977e8ca1beac28914ff104402d3664fb91530b 100644 --- a/model-00007-of-00072.safetensors +++ b/model-00007-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a4be835f87031118ce99f89b55553273a1956f44fb987f632e5bdc7374688407 -size 5000051336 +oid sha256:3aae5be40df7755d18385d1292b3ab4ca53f2897238760bdeca657d75181a48f +size 4999591608 diff --git a/model-00008-of-00072.safetensors b/model-00008-of-00072.safetensors index 87c7ff2541be836a0c9d21e536cbf23656053ec9..4f800ddaf05ec148794deb2de4d817058cd09991 100644 --- a/model-00008-of-00072.safetensors +++ b/model-00008-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f68acaf80fe8ed102b0a1f946c9fc49548de37d408c89460d8fd3a49d98f49dd -size 4995991936 +oid sha256:dfa4a06b23c694d9afe0b166d7bb9a2baf60eb2ff20eb34177e935e9a24411c3 +size 4995762400 diff --git a/model-00009-of-00072.safetensors b/model-00009-of-00072.safetensors index 09cef47077f8fcba4dc64deac8c90e4c5d5e8987..a40f4102f29ee9696bd2e12ebc6aebb6058684d3 100644 --- a/model-00009-of-00072.safetensors +++ b/model-00009-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:347da340973bc3c9e78814c9b0b37007d2342092961b2260ecb8360db190d912 -size 5000050912 +oid sha256:2c838136cccadf85d169666aca32792bd1cb29c2dc973c81946887c41e4d87fb +size 4999591192 diff --git a/model-00010-of-00072.safetensors b/model-00010-of-00072.safetensors index a9fc20777b07f008a24ef63e919909356efe86be..cd5610603a339f3b40d3dee1efe3deaa5606a0e6 100644 --- a/model-00010-of-00072.safetensors +++ b/model-00010-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f808ce67c8deee35f928cd4f507d0b7d91b9782752adce381940569cb390982f -size 5000224376 +oid sha256:370201acc095b9bed2173c26048e6e003c19bc62ed36958c35bf33687c3687b1 +size 4999592560 diff --git a/model-00011-of-00072.safetensors b/model-00011-of-00072.safetensors index ead1533dbd762cc0ca6e0f8d6b5e64f0dd0b4cb8..50acde506c2491d79ba6745ebc69d5c38838af89 100644 --- a/model-00011-of-00072.safetensors +++ b/model-00011-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c9c32b02f7fc2fbaa588c4a1a561c3c845b5cdcc97e4f9d4d990558d3db30414 -size 4992942152 +oid sha256:a40bc6754a40b1b52f337f904f10b0b7466e89e7d44a9a5267781b2ed6ff36e7 +size 4999593080 diff --git a/model-00012-of-00072.safetensors b/model-00012-of-00072.safetensors index b97d7c3e4c07464cce6f1a3bdc811d732ee1a72d..d759225a27ce53b240eefcc2c447a3fbc6c7c244 100644 --- a/model-00012-of-00072.safetensors +++ b/model-00012-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9112c487f3ecf185605d4cf4dac92138519dbe5ace64f3a9be1c9a04630eea4b -size 5000053152 +oid sha256:d06ca481c6a2acac2274992d5b0969d64b2e13de8bf2ae5455dfaea0fa0ee548 +size 4999593480 diff --git a/model-00013-of-00072.safetensors b/model-00013-of-00072.safetensors index d2a5627b139b920b1a1a3e41f0828ee268b01d67..b0be7952e2df001ad10ad9d6acac765221974919 100644 --- a/model-00013-of-00072.safetensors +++ b/model-00013-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c184fc0ee3bf5e33047f40f4c2855844c909040a4b95b2cff34bc99b018ff625 -size 5000225280 +oid sha256:5b486cbea28c5e55dd0c9c17257eac85a5f0f7744440e0acc6fe646e764aad94 +size 4999593536 diff --git a/model-00014-of-00072.safetensors b/model-00014-of-00072.safetensors index 65a72693e417de7b145349a766f9076f94fcdb0a..f316fce5f4ecf75cd47932cb0cb2f945931afe1f 100644 --- a/model-00014-of-00072.safetensors +++ b/model-00014-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9909ab2a8a7ce7bc5a7c5b19feeb2d9f3e060c4d0ca8179c58db9a738be83436 -size 4996051216 +oid sha256:ce5a242eb6094293854ffa84c07120c31a1be234b9778d6c3d3c8328fa35c106 +size 4995764144 diff --git a/model-00015-of-00072.safetensors b/model-00015-of-00072.safetensors index 70a14e2ced56d20684c8d89adb382a8abbdb7393..bbf14cf552edf799d017eb730d9dc843842d152d 100644 --- a/model-00015-of-00072.safetensors +++ b/model-00015-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:da31552606f00a3a21049637416f845c0f55cedc40e060f120114447503cf0d3 -size 5000052816 +oid sha256:af629bee2dc2c2b286e5249a4df175ded456fb124f4cd5ba956c24cc409b4644 +size 4999593096 diff --git a/model-00016-of-00072.safetensors b/model-00016-of-00072.safetensors index 9b75f63ae70967783e5dea033f10a1df94155eea..4f2c3ea14cf9a65d3143488ad741012cf8deace0 100644 --- a/model-00016-of-00072.safetensors +++ b/model-00016-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f0bc3bad1cac7808d24cd57b4cb3409052a9b06de766d9413fea2f8c868b6600 -size 5000224856 +oid sha256:204e129139fd8ea6951f2d6f171d7380b6a0edf4dddbb0a6bbd5a9f5567e01c7 +size 4999593080 diff --git a/model-00017-of-00072.safetensors b/model-00017-of-00072.safetensors index 871c5557faa0fc409e5791fa4e45817cd8d648d0..2108b3de5d93e03dcc837eea1beb7715daba2539 100644 --- a/model-00017-of-00072.safetensors +++ b/model-00017-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:17b5c9c247567c7624beea886458abeae76c9958aacf888925f01879dd5ac209 -size 4992942208 +oid sha256:0a05e3ae2f3998deb65c2a457e23ce91dabe6d91da413b29990dd44c02673804 +size 4999593248 diff --git a/model-00018-of-00072.safetensors b/model-00018-of-00072.safetensors index a337fc9e1b38046a5685310d6f26b5f14af92d57..fea1e64d3d72676032dea4e63bf87da80c427846 100644 --- a/model-00018-of-00072.safetensors +++ b/model-00018-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9c04f2c0095391732d42259480fda5d2219e457d01e0179e36e450ca078f4db3 -size 5000053248 +oid sha256:09edbe9a68debfa5c46ab73d29e69e98de50676e96c8be8f3f004e1abfc4e142 +size 4999593512 diff --git a/model-00019-of-00072.safetensors b/model-00019-of-00072.safetensors index 7ca1358945a21d895ca565a4a5ad85674b6cff29..1e6b8464c4c245d00fdeda43dfb1f6b058a2a897 100644 --- a/model-00019-of-00072.safetensors +++ b/model-00019-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a7aba70afcdf3ce089821a36d63c5dbfec323c4bac17c8354057770ecb9a11e3 -size 4887946080 +oid sha256:baa360db2d5af6ceca018b5c9dbf11341f4671f2eb6469d450cdbd95e69a2017 +size 4995764408 diff --git a/model-00020-of-00072.safetensors b/model-00020-of-00072.safetensors index d4f3a21dee6d77236eb662524b60d62d5407f524..97679ec0a9bbc9c852d7b7146e5a095d5bc0fdf3 100644 --- a/model-00020-of-00072.safetensors +++ b/model-00020-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:10a936066825e6e83310f5beda543af76caa7454c228261ccb6ebcecb388b5d9 -size 4993923416 +oid sha256:9426b4e92393fde4ae09268bd50dacaf35c2712534250a9f957198d4ff6ccaea +size 4999593096 diff --git a/model-00021-of-00072.safetensors b/model-00021-of-00072.safetensors index 8ba950db4933be48d6422fac2c20efed41bf109f..53e3e36d5b70834e61c9e22576c30052413b0477 100644 --- a/model-00021-of-00072.safetensors +++ b/model-00021-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:dbf954fdfee1482d82ae4b7dd3b81f3c96e94503c3cd0b879cd84d8601f39e6b -size 5000052816 +oid sha256:92a858c6b64bb5062e27e82fb71e29bc56acf0be7bc2ec690941de70f31ca4c8 +size 4999593080 diff --git a/model-00022-of-00072.safetensors b/model-00022-of-00072.safetensors index 42fd783b23324f236b700ff2206569e0fe1e34ad..bbd36005281622d909ec13df9dc13cf93677aedb 100644 --- a/model-00022-of-00072.safetensors +++ b/model-00022-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b1e391cdccc84a5b3ec1723c5f871e2070a0d521ff77c356bf36ae76f6878b03 -size 5000224856 +oid sha256:8964b092f1345171f6c942c2dc3c4643e80e26120160b562b22a62f907b62174 +size 4999593080 diff --git a/model-00023-of-00072.safetensors b/model-00023-of-00072.safetensors index f7170a015b9d2b921e73db345eeea2a5f8c51933..9e04e8e29b614116a28ec90aece508fde4f98217 100644 --- a/model-00023-of-00072.safetensors +++ b/model-00023-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:702015a7919d71819afb95f0c9e3cf74216fcf4596f9062189e73fcf569f9d39 -size 4992942408 +oid sha256:06df694bb89764e1845a26c86b71b9102a95c8deee7852cafcf605d2f9a9a64d +size 4999593440 diff --git a/model-00024-of-00072.safetensors b/model-00024-of-00072.safetensors index 9f5597153a90f651426f8a558b7f6e0c796fb292..df2a4f44a1b895bfce992fb9eb389a7a72d91243 100644 --- a/model-00024-of-00072.safetensors +++ b/model-00024-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:422dd7e4209744716eeaa76779f30457b7d1b2e6bf105d4947e671ce6921e523 -size 5000053248 +oid sha256:94ecaee51f1a488ab3626a2f9119b563cfeaa6433f89eb59cc416eadec984022 +size 4999593512 diff --git a/model-00025-of-00072.safetensors b/model-00025-of-00072.safetensors index 03c1f8bee6306f574cca1102c09773dedf628bda..be9d78946600ee8982a111b33e264866c3bdfef7 100644 --- a/model-00025-of-00072.safetensors +++ b/model-00025-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:476c13bc42d1fffcabcf1f83229aa435201c5a2f92e008305e3278d674fa792e -size 4995993824 +oid sha256:14c7cb322477eb98733db90c8b08b3e753e25fb61026c00684cf6da1804607ef +size 4995764216 diff --git a/model-00026-of-00072.safetensors b/model-00026-of-00072.safetensors index 46339a144b25a3477a40533e5109c4b8ab70fce1..433b6a8329379064df8f6c1f66b4d6de3ebd4abb 100644 --- a/model-00026-of-00072.safetensors +++ b/model-00026-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:441cf0656c2358e3e15a326b8f280de0ae09a4b7481e0752d85571a6e7ad76c1 -size 5000052816 +oid sha256:5ee4323ce69e1141320852699c39ccb8a7c29e9541af4a8d5ba8a384d7450430 +size 4999593096 diff --git a/model-00027-of-00072.safetensors b/model-00027-of-00072.safetensors index a4f52a15118774e0c55d02f101625b960b2ae428..f239d79841e1d3310dcf3018df265c311a2f2845 100644 --- a/model-00027-of-00072.safetensors +++ b/model-00027-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0c0eaca5ef29ed2e0b985af88687d13699f075332e45f006c66530e0c740985c -size 5000224856 +oid sha256:3586365b51e3ef370eb3d62a637013040b5fc558dd94ae9563698d9ea04d45bd +size 4999593080 diff --git a/model-00028-of-00072.safetensors b/model-00028-of-00072.safetensors index 7a9ab3e83ba67e3915bd024b4fdd9a23fa2d448a..99f06e7c0e7174eda81e67daa08ab491c31b99c9 100644 --- a/model-00028-of-00072.safetensors +++ b/model-00028-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4db427a1585b57fdd8fc3b84138c00548c9b310e0d5fb2fe3f69944eae6dc5d0 -size 4992942152 +oid sha256:0eea128b89640d9864d22ff5543adecc4200dba21cf272c3c2ade8341541a837 +size 4999593208 diff --git a/model-00029-of-00072.safetensors b/model-00029-of-00072.safetensors index 02bb046841aadf86cf1d004ecbd0c1764acc81fc..45a9159347b37032f7c412ac690b7f2fa550fbf4 100644 --- a/model-00029-of-00072.safetensors +++ b/model-00029-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e276ebe719c214518a53b38396ad526159d32071d8df3fbd99316e9add87be57 -size 5000053232 +oid sha256:61efba4225c03154ffd9ac51d9c05d195058986934fbdb175bfca9e9cf89df93 +size 4999593512 diff --git a/model-00030-of-00072.safetensors b/model-00030-of-00072.safetensors index 6b8733ed6ddc8d3971bebbe1ad9805efff00a44b..7a42700dd7304084b7c5be5d41bf108cdeb6d828 100644 --- a/model-00030-of-00072.safetensors +++ b/model-00030-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b9ae27cc538f8ab8da4ce267c76d7b0f4dc33bccaf5067a0b12ba5cf143a2e31 -size 5000225304 +oid sha256:8c0d0d0c31bee444b012680d07a2a3432474cfda0a71574dfcbceb3cfbd2f8fd +size 4999205472 diff --git a/model-00031-of-00072.safetensors b/model-00031-of-00072.safetensors index c43dd80b6f912a4321a8bce8e5e319032a86f08f..2face0ffef6b102b4a8025d40b48fda6a28afe8c 100644 --- a/model-00031-of-00072.safetensors +++ b/model-00031-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:983b30e8172ebda2b844d5287959e8c50d731fa3371a207257d680aa5b9121cb -size 4996051112 +oid sha256:3dc916619de62cd657edc348e89feae03adfefea7efb8feef09ec2927fd37bc3 +size 4996152080 diff --git a/model-00032-of-00072.safetensors b/model-00032-of-00072.safetensors index 53c7c40e7d3362d9a72455589b506330dcde3de3..5329d21612129bba31a74fa98e26b8fb4ad36485 100644 --- a/model-00032-of-00072.safetensors +++ b/model-00032-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8ee2587fcdbcb7966e2e46e557b9a86df222f86fc9ff3c78a37b08b45c1134b5 -size 5000052816 +oid sha256:e0f92fe783a8acc864054da76d0ca2d75d30c951b0bbffae1bac2340ceffd120 +size 4999593080 diff --git a/model-00033-of-00072.safetensors b/model-00033-of-00072.safetensors index 860de077aa1c90803a84718302658b95bf71f7ad..dcb3928b6a8486465fbcbbb876740bb1af104e0f 100644 --- a/model-00033-of-00072.safetensors +++ b/model-00033-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d3d88968cec7322b8b0559f518f0d2b3fab1adbbe1940a3e0078fdb810f4a040 -size 5000224856 +oid sha256:d398780f22d6402471e7220b0e29074f8d89675698197ac5d9ee441c06dcbac3 +size 4999593080 diff --git a/model-00034-of-00072.safetensors b/model-00034-of-00072.safetensors index 29624521b4cb6e68329a87866596f7c67c96fa71..a66d1a65836f4014a2a907cde06b652e8cbacf88 100644 --- a/model-00034-of-00072.safetensors +++ b/model-00034-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f0f2715617fe58702606a3891d3eff57ce5f6b402cbeeefacea858a64b3f0b01 -size 4992942288 +oid sha256:d7d991a04fd2d0341fcc2a25b8a177f945e2520a68622199f27a5c9dfafbbf51 +size 4999593400 diff --git a/model-00035-of-00072.safetensors b/model-00035-of-00072.safetensors index 9f53c7f9843aa197d93154f14b7a996154140c5f..7f466899e61d90204dc2da5ee8fc79ea3f825f50 100644 --- a/model-00035-of-00072.safetensors +++ b/model-00035-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:fa403dc7a766d421d56db4fab0e8144c33307cbface657e58ce08dd0723a21d7 -size 5000053248 +oid sha256:ba2bbff3643ddb289667d98511aa0df31893007fda01d413cea8bfad500ae95c +size 4999593512 diff --git a/model-00036-of-00072.safetensors b/model-00036-of-00072.safetensors index d1b947295fc216b42e6096251738b68cd399965b..2c5c4d80e93737be12a14f4da7b43e8d18ece471 100644 --- a/model-00036-of-00072.safetensors +++ b/model-00036-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3af20d5f58e03c46ebcb02a9127eb3a80cd96257e778c7000b2a28a609c1864f -size 4999664696 +oid sha256:c076d23a0c6bee26147aa7d18e4c54fe39a1e0bf15f389351a0ead3ccb13095c +size 4995764256 diff --git a/model-00037-of-00072.safetensors b/model-00037-of-00072.safetensors index 457ba7caf66aa16383a21c5276d491d2dee33166..a091f28dbfc00929cf6187d2afe4c4d6f0d37869 100644 --- a/model-00037-of-00072.safetensors +++ b/model-00037-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:74459e2953f3b36afa8426eab858336930b597ac3c652bb16e30ba4fb2f301db -size 4996611560 +oid sha256:bf065e01d8d893952a188ffe99a3a9b6303bebe80a310632ec5ad8f1a84e59f2 +size 4999593096 diff --git a/model-00038-of-00072.safetensors b/model-00038-of-00072.safetensors index 630695ef1878d97009803381afea0d5d58e1681b..11010d6ef8c1ad53806ebb1ac6d66fcd39a548ba 100644 --- a/model-00038-of-00072.safetensors +++ b/model-00038-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d3d06df18ed937935a1fbafb1d212ac8c0c5225f2a32285f8f364092586c45f5 -size 5000052816 +oid sha256:faebe749b3e0a34c2dd74c18c6194cf45c8c306310c8388b3e3f7a2cffaf4285 +size 4999593080 diff --git a/model-00039-of-00072.safetensors b/model-00039-of-00072.safetensors index cbdd743498d346f4897a16e20c76d10099642227..b9e9d9e4f867dafa29215a6caa2b71be8b9df6c5 100644 --- a/model-00039-of-00072.safetensors +++ b/model-00039-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8de186711e1ef31eea8eb178c4cb45f39130d77623617982726c2f73ec384667 -size 5000224856 +oid sha256:c2e7e686f371d25e83370114112e11a0b48bbf7d578741bbef4ed240dd28a4ee +size 4999593160 diff --git a/model-00040-of-00072.safetensors b/model-00040-of-00072.safetensors index e31b495c7b5fc321b75b567ed627556ecfa8ddcf..069010abbf27228bef6216c54bdd4e95a3768d51 100644 --- a/model-00040-of-00072.safetensors +++ b/model-00040-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f5ab209db638b7e349a3f8266abed57b7bcb84320b4e33aff59e8e2aff184f5b -size 4992942440 +oid sha256:ea1f8e8784ad460c66fb17164e34674b002e4bbb161f1c616a0897007183f4b2 +size 4999593512 diff --git a/model-00041-of-00072.safetensors b/model-00041-of-00072.safetensors index d1e519bc8b64d6646775e4c78370c0e739f6c7d6..c38bb0b28d94ab9fb84520fffdd9b83fe67da5d6 100644 --- a/model-00041-of-00072.safetensors +++ b/model-00041-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b52b41a366e94ca5c038940517cd4f594850c5bcc2cc65f27686e267e99b7675 -size 5000053248 +oid sha256:88c5b246725c00848b61517495f2006aa421c0dea9191ae62f65b8d92c64cc40 +size 4993807032 diff --git a/model-00042-of-00072.safetensors b/model-00042-of-00072.safetensors index 58afb6ec7af6308859f909ca14ed43886b51ff9a..4ccec909db897e15e1247799f1b39fde6ffc1efb 100644 --- a/model-00042-of-00072.safetensors +++ b/model-00042-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d4f148561dd6769a5ff5c8242aaea132cbe7c13031dc6af0f5b7a72bb5800d2a -size 4995993792 +oid sha256:5894290536addb4b108a7bd5597e32d036ccb0eee11834fd98ee188983724852 +size 4993923416 diff --git a/model-00043-of-00072.safetensors b/model-00043-of-00072.safetensors index df90e513fa1a029ccfaba7194f12f2d87a5d579f..04e9e2965efe7acb00eca015457d5174015d3ce6 100644 --- a/model-00043-of-00072.safetensors +++ b/model-00043-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b06564b3422d93e8d8a171ab270de1baff4e4aca1d997b06a496079b1078f78c -size 5000052816 +oid sha256:4659c84b744787225d253bc2774d9f2ef0af1117d379b7f726a67be479c825d8 +size 4999593096 diff --git a/model-00044-of-00072.safetensors b/model-00044-of-00072.safetensors index 557d11c13b2a4452509bd826959b2ff2903a09f7..a48ae29542237ded38f938805f61f8afcf292d4b 100644 --- a/model-00044-of-00072.safetensors +++ b/model-00044-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ff9c0c8c6a4aef00b34a1b2766ae347ab853629c7da6f9c48e942c65a55c381c -size 5000224856 +oid sha256:a3154593a83985f8cc0bbc80e79fa387ca5a077af6690ac9cc5201ae471399a6 +size 4999593080 diff --git a/model-00045-of-00072.safetensors b/model-00045-of-00072.safetensors index 8fa56761c53f7b0c1c4bff8be7e6eabe8449b16f..60cd070fa5396460d12830e302fff7ea0b688f05 100644 --- a/model-00045-of-00072.safetensors +++ b/model-00045-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1c4b7abd0c88a285639dcefe4ed905d0d0b31958c94ea3353df623737a0e3f27 -size 4992942176 +oid sha256:cdd23d19b26a6c8d381b3acc906c190f6ddb27724803a81d2ffd42cb9f785aee +size 4999593360 diff --git a/model-00046-of-00072.safetensors b/model-00046-of-00072.safetensors index da0fafacee33611992ec512083b78136c1ae2278..b88afa5619f760db28a97ea8b844971304a97ea5 100644 --- a/model-00046-of-00072.safetensors +++ b/model-00046-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2139f7b5a065a037e76b1d3a88e60f86157040fc93608e629c7fbc3d2390c289 -size 5000053248 +oid sha256:3bea09251968dc9ca17adc10092e10161e79e9858f4e7509d94cbb12486da76d +size 4999593512 diff --git a/model-00047-of-00072.safetensors b/model-00047-of-00072.safetensors index ffc3f0763dbae79fbfa1b78c190307ab8b98bb76..7a10f8ae8280f9a7a26254efee9e56c42eb65c17 100644 --- a/model-00047-of-00072.safetensors +++ b/model-00047-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:07bef778b2417fa450ee481f892353398c18abc875b238478112bc3677691e89 -size 5000225336 +oid sha256:207264998aad27b1f372140968aa40d061b6128f6db5d4cf57086a4240f99bf6 +size 4995764296 diff --git a/model-00048-of-00072.safetensors b/model-00048-of-00072.safetensors index 6408627be78376cd5a90f7eba3a387537c6424dd..efc84c6d74331053662815b4d044a4bb4bfa890e 100644 --- a/model-00048-of-00072.safetensors +++ b/model-00048-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c50b59bc6c2522e7bd5fc0ff827fd239a6cc8cbc3b0f6f9ee608a5eba8f294fe -size 4996051040 +oid sha256:799f9792c3a5025b0849b50976fa3250302b9e910504230317ffaa2576ae86c6 +size 4999593096 diff --git a/model-00049-of-00072.safetensors b/model-00049-of-00072.safetensors index f9e16352e3f0b9f0fd24d68330c158cd7e007c76..32bc05aa0e8af80f386b945f3bd34708f831dca7 100644 --- a/model-00049-of-00072.safetensors +++ b/model-00049-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8834e9c291ed773cbae76ff5f7b29df7641639d6dd3abcc03f0c9de82126a510 -size 5000052816 +oid sha256:bbe6bbd60af7680e0642aeba1bd9b1041ec9171cde7613530f9f03d5c83144d1 +size 4999593080 diff --git a/model-00050-of-00072.safetensors b/model-00050-of-00072.safetensors index 63c6739271c8d3d0e3f38f7ade7cdd58ae3ccd2f..e195e8da7bf867d0a194af4c4791d1fc44d9c47a 100644 --- a/model-00050-of-00072.safetensors +++ b/model-00050-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:51501512b569be6b1756375d1c980e6ac1884e479ef303345619cd78a7960105 -size 5000224856 +oid sha256:73cbdc09aefed8d32ddbe0f214e07f7c891c5a15c906c57d7253f32c54cec09a +size 4999593120 diff --git a/model-00051-of-00072.safetensors b/model-00051-of-00072.safetensors index 9179e581efb5f6fa5ccceeaa62afad733d11bd68..ac6f22e6163d9f58b53bffe62aa180813cd7d8b7 100644 --- a/model-00051-of-00072.safetensors +++ b/model-00051-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f9e61d7ea7b55ec136ab6d29e0a2592a1185fa8b60a0ce715f81154a864d7ced -size 4992942328 +oid sha256:878077cad9ba3cdf62d25b5774e773e1a6c402971e37147ad237a59fe2a8a035 +size 4999593512 diff --git a/model-00052-of-00072.safetensors b/model-00052-of-00072.safetensors index bcb7566c8b07a4a942d2abc57053a6bcf0768edf..b16d0414383321ce2c4db5243320e7cfb65bd662 100644 --- a/model-00052-of-00072.safetensors +++ b/model-00052-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:27e0bbb2c8172afd2a75548962cb59758b3f48f4e2a244fbbc5ff038b75a6120 -size 5000053248 +oid sha256:7d5fc30f5580673d5ef2523c8849032b6fe29df609c389b5fd06d2aa60527def +size 4894654464 diff --git a/model-00053-of-00072.safetensors b/model-00053-of-00072.safetensors index 6042bba88dc8e5d20bbfce3af88e4b068d008cb7..11c946768346d3f4e9a0c547ceaa0bf355606c2f 100644 --- a/model-00053-of-00072.safetensors +++ b/model-00053-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:56923823e881b37799d2c2c601eeb8278dc04b2b6640355d90d3d6c20fee5f64 -size 4995993904 +oid sha256:3a6d8411ef4808e03752e9cab24f824ba2f80505a99507273eeb66c5e9069aaf +size 4993923416 diff --git a/model-00054-of-00072.safetensors b/model-00054-of-00072.safetensors index 868a6d0e11683187ee54fc936a110a18b7500f95..1997430048233f236b923e1438e9322a561f19ae 100644 --- a/model-00054-of-00072.safetensors +++ b/model-00054-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3a7a3f224ed2d871cdca39c5577098ecd0b7568a2b423706a3e7697344a2c587 -size 5000052816 +oid sha256:beb3e1f7111ea8cd8c952f2c9d083ff71c0416cb46eae9013e5f1f82a5599b92 +size 4999593096 diff --git a/model-00055-of-00072.safetensors b/model-00055-of-00072.safetensors index 957f8594ddade708c03a460952b3b8a204fb7645..a48fabdb63d57f5c22abd025bffead1e2c1d4552 100644 --- a/model-00055-of-00072.safetensors +++ b/model-00055-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c3a4c0dbdf5f115159487fa50a33d23f50f458b7604836c9385f1745c8c213cc -size 5000224856 +oid sha256:b4036e8ebbcc0756607c62e75a5601bc188abe33c46adbe195f0eea2bfaaef5a +size 4999593080 diff --git a/model-00056-of-00072.safetensors b/model-00056-of-00072.safetensors index b6822f64e614d0dfea2cc100f2ccbc2f789bbc49..c949c5f02a8f389415c37799e160851c516ed280 100644 --- a/model-00056-of-00072.safetensors +++ b/model-00056-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f8c7064f55c72f3af78445384e87612fce6841d6f04f235024718904fce66054 -size 4992942152 +oid sha256:ddf1001f354502d4a4f072617c894a3a82b4131af228720dea4eb15b87f9667e +size 4999593360 diff --git a/model-00057-of-00072.safetensors b/model-00057-of-00072.safetensors index da6c1dff0842622213b4eef853f0fb61604c61a2..99eeaccd213531b17284183a940ced1a0cf2043f 100644 --- a/model-00057-of-00072.safetensors +++ b/model-00057-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:70f07d553599a2e087db1d6afd60fdf0fd90dcee32dcf5a44231f9968fcd534d -size 5000053152 +oid sha256:2e4caf9e755ecd9a13e1e298680383e2786585a265a82f7863a246798af9539e +size 4999593512 diff --git a/model-00058-of-00072.safetensors b/model-00058-of-00072.safetensors index 57584ba4179e7d297e4e08b6cdc8aaf72fbb8de4..d880697b3c66080bb49650e212f00e9f041dbeb0 100644 --- a/model-00058-of-00072.safetensors +++ b/model-00058-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4af06bb7aa0cd953cd20edb694a313d3ac9800f7cae77b1afd63682981b502f5 -size 5000225280 +oid sha256:e00aa2dabc8ac06ec43f4598ad21e0356ecf30f70a956cb13e423e196153e95e +size 4995764296 diff --git a/model-00059-of-00072.safetensors b/model-00059-of-00072.safetensors index e0f782127dfb00e3bcbee5c303caf8830f738d32..23fb13430995287255f8cfab7906811d3222e7bc 100644 --- a/model-00059-of-00072.safetensors +++ b/model-00059-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:de55ec7a12bc95b42cac774f81e8337c3890ffc43e40b0a11928011afaa30cdf -size 4996051216 +oid sha256:52b2e02edd4d33810875627c7b74ee3e9999d7564a4b20f5fdd557b28d7eb0a6 +size 4999593096 diff --git a/model-00060-of-00072.safetensors b/model-00060-of-00072.safetensors index 28dbb2bdb84bffb9cca355ba5b7a510e955c7d8d..7e721172fccbd57aa954fc1e7ea88e0f85090f39 100644 --- a/model-00060-of-00072.safetensors +++ b/model-00060-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4b6569fab736fe0dac1d9542b4fdbb548ea82e3e9c6d5c8242de1d9ea3115fbb -size 5000052816 +oid sha256:53f8d5a74e94840111a0e36646c930fe8f1b6cf2cb380edc320af49236e0bde0 +size 4999593080 diff --git a/model-00061-of-00072.safetensors b/model-00061-of-00072.safetensors index 4fe3a01626abf8415cb841f87a42f0f6373a84f7..f8c2db1b2998a901b2acff0ccbd7f77161450ff9 100644 --- a/model-00061-of-00072.safetensors +++ b/model-00061-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a5f24047192f5650937d48237c74590c0590702a783d9775851dd28a32375d88 -size 5000224856 +oid sha256:6eb278384b6f06a543b0619dbe873dca7701d54b7113a86c5a7455de3bd6a387 +size 4999593120 diff --git a/model-00062-of-00072.safetensors b/model-00062-of-00072.safetensors index 5eb42474f5ec7bc6e8dd9c747995ab5e2fb561f1..499f9ebeef468dc0e224f496ccdc5c3a2750881e 100644 --- a/model-00062-of-00072.safetensors +++ b/model-00062-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8ce6517451b886943d1e87dccb1bf8631f757ac5ac46e5a01e21cbae35fb608f -size 4992942208 +oid sha256:65907531aa536a677af3ca2981f82505b97278c6a5dfcd8c808ac903fe2a1d51 +size 4999593512 diff --git a/model-00063-of-00072.safetensors b/model-00063-of-00072.safetensors index e283b9115686ac31a1e0a9a916e72b6a64e5a1d7..111e4abe13f2e86818d8b020980a78714e863ec7 100644 --- a/model-00063-of-00072.safetensors +++ b/model-00063-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:48eda43b518c1fde298ec5fcfcb639db024c9f5afa901509bb8720f9b92c6437 -size 5000053248 +oid sha256:d9f7a06a906b81880289f409a2ec2627f0d0e531b56b9cbbc25052679b723367 +size 4894654464 diff --git a/model-00064-of-00072.safetensors b/model-00064-of-00072.safetensors index 2756a2fc70a20751f5dab81056673a6819472ba4..e65d08b8042843bab0be7552b6ff334eb76a5831 100644 --- a/model-00064-of-00072.safetensors +++ b/model-00064-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c2106f5686fbacb01dca47853c9f4ac958722806bcb2482cf18ad26fd0aa185a -size 4887946080 +oid sha256:f2831f7b05ba68b2e2ef423934c74d04a360fd54f5584dbdd19cc36ccf6d665d +size 4993923416 diff --git a/model-00065-of-00072.safetensors b/model-00065-of-00072.safetensors index 8699a49d4bb21e436c6bca8c333fe83d452499c0..d8af10c6b4fc78c8d4331b8930ddd9516f71a546 100644 --- a/model-00065-of-00072.safetensors +++ b/model-00065-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a68929f5379ce843f28b0a0bc73118946287a740781fad62ad7107b0c8e1c963 -size 4993923416 +oid sha256:7c208dfb7d822c1fbfe0621081b8caa0e3daf05178aaf6dfc55a2d4a7913fc1c +size 4999593096 diff --git a/model-00066-of-00072.safetensors b/model-00066-of-00072.safetensors index f9c753763f8ee15313888bf0b2a186ef13ca623c..6dfd54786e3f660633e579243cdb4817da899f4f 100644 --- a/model-00066-of-00072.safetensors +++ b/model-00066-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f569e1cebb5312de240677205d9a58214e41cfbd12d8c99b3b1310b9d5107d69 -size 5000052816 +oid sha256:b94088a188bfadcf10307d7fef9def1d0db5f467879c88ec4710ffa79ea64e26 +size 4999593080 diff --git a/model-00067-of-00072.safetensors b/model-00067-of-00072.safetensors index efdef3179ea884cb61748eeb8c6bf79bfc350d96..77f28c9de2958c0db5fb2d4ae91330c3d86b87b4 100644 --- a/model-00067-of-00072.safetensors +++ b/model-00067-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:47f0837193d404b6a90a23d6fbc6d2610da0ac12e48148733ee74e69ee36d7c8 -size 5000224856 +oid sha256:c9f523bf0aee2406fa678e2f16cdcb786cf609c574f1fc9735ddc4f0237f76ac +size 4999593360 diff --git a/model-00068-of-00072.safetensors b/model-00068-of-00072.safetensors index e0c014adf63e64842900075bc0b05925a54f258f..0b48f1c792071ce44d227e556aee338a1039eeee 100644 --- a/model-00068-of-00072.safetensors +++ b/model-00068-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6c2ab7695aea108755ccac8252ea8b2deb1ba98354c6e0e0a3300db59a2794a9 -size 4992942408 +oid sha256:3fcec2a8ab1417a4d49f4d2459afc166e40d8bdb6f5674ba8196927520dae8dc +size 4999593512 diff --git a/model-00069-of-00072.safetensors b/model-00069-of-00072.safetensors index 444892fdf32c2d2bc1c3d2d49896cfe742f73eec..bf07ede8d05feddb9de99e413b4abd26a877d6b9 100644 --- a/model-00069-of-00072.safetensors +++ b/model-00069-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:06e1452b7efb3a4812c2463751ac7fa37f1f2f5220d5c6f5288022687c8564bb -size 5000053248 +oid sha256:e3bcda3c330463c8ba9338f9639d5718a2156852f7fdb28dc12bb57dbd586f02 +size 4995764296 diff --git a/model-00070-of-00072.safetensors b/model-00070-of-00072.safetensors index 01c99f5201f6972899f9ee3ee3e2437a513d7cc4..14c50c2f2227cd25c751de2a1c525786e8badabb 100644 --- a/model-00070-of-00072.safetensors +++ b/model-00070-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d13a7640a21579ef46203ccb1d754b8f129edab66824203d5fd7fd7714d63685 -size 4995993824 +oid sha256:7d766d9efdccfe0827bfab3a57590f9f2daa5ddeca17123f5457c896d7ff5633 +size 4999593096 diff --git a/model-00071-of-00072.safetensors b/model-00071-of-00072.safetensors index 0aece903e9c02b3788da2f06f226acb56d53c06c..ce9259ece944b7349aa71a1e923d9d5450bae9c5 100644 --- a/model-00071-of-00072.safetensors +++ b/model-00071-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1aec8d173a17adb707bf722502152ed6c2e907a7d0b365a006fcaa4d4cf0b2d1 -size 5000052816 +oid sha256:1c008675706189e2947087cd15a95d0c3469607547a3b84205328f11cefdd88c +size 4999593080 diff --git a/model-00072-of-00072.safetensors b/model-00072-of-00072.safetensors index d64857d4465fd0ccc8593765bc9555983c38dcc1..29b4fd10e6cf26851a090b4713d25fb258d5b23d 100644 --- a/model-00072-of-00072.safetensors +++ b/model-00072-of-00072.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a510bead7d51875d9cf57dfc5106bc90de4895c07967201980186058658d6dd5 -size 3253064736 +oid sha256:15d6b75b8321597ea3222520fb78366da5c9709d4e3d8b1d43daf1077b32697a +size 4480112800 diff --git a/model.safetensors.index.json b/model.safetensors.index.json index efb6c941cb8f0d084458ede0f9612e518009d0d4..d2623326c2e06dd8f6571766ca3f2884c69f803a 100644 --- a/model.safetensors.index.json +++ b/model.safetensors.index.json @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3948d7fcfcea2b3b535767b2c177d6bdfb7c6a8852c506c3bdb63363fa731d76 +oid sha256:96cf82a8c3e119ada985720d07f0eb18b6d370c6a814933f6587ce6a5df2b055 size 12338633 diff --git a/quantization_config.json b/quantization_config.json index 174018cd9cf5827157b117beeb50a01a54bbae87..feb57e3092d165fbaf5eec9368dc637283054cd9 100644 --- a/quantization_config.json +++ b/quantization_config.json @@ -95,6 +95,15 @@ "model.layers.3.self_attn.o_proj": { "bits": 8 }, + "model.layers.3.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.3.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.3.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.4.self_attn.q_a_proj": { "bits": 8 }, @@ -110,6 +119,15 @@ "model.layers.4.self_attn.o_proj": { "bits": 8 }, + "model.layers.4.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.4.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.4.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.5.self_attn.q_a_proj": { "bits": 8 }, @@ -125,6 +143,15 @@ "model.layers.5.self_attn.o_proj": { "bits": 8 }, + "model.layers.5.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.5.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.5.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.6.self_attn.q_a_proj": { "bits": 8 }, @@ -140,6 +167,15 @@ "model.layers.6.self_attn.o_proj": { "bits": 8 }, + "model.layers.6.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.6.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.6.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.7.self_attn.q_a_proj": { "bits": 8 }, @@ -155,6 +191,15 @@ "model.layers.7.self_attn.o_proj": { "bits": 8 }, + "model.layers.7.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.7.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.7.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.8.self_attn.q_a_proj": { "bits": 8 }, @@ -170,6 +215,15 @@ "model.layers.8.self_attn.o_proj": { "bits": 8 }, + "model.layers.8.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.8.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.8.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.9.self_attn.q_a_proj": { "bits": 8 }, @@ -185,6 +239,15 @@ "model.layers.9.self_attn.o_proj": { "bits": 8 }, + "model.layers.9.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.9.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.9.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.10.self_attn.q_a_proj": { "bits": 8 }, @@ -200,6 +263,15 @@ "model.layers.10.self_attn.o_proj": { "bits": 8 }, + "model.layers.10.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.10.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.10.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.11.self_attn.q_a_proj": { "bits": 8 }, @@ -215,6 +287,15 @@ "model.layers.11.self_attn.o_proj": { "bits": 8 }, + "model.layers.11.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.11.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.11.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.12.self_attn.q_a_proj": { "bits": 8 }, @@ -230,6 +311,15 @@ "model.layers.12.self_attn.o_proj": { "bits": 8 }, + "model.layers.12.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.12.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.12.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.13.self_attn.q_a_proj": { "bits": 8 }, @@ -245,6 +335,15 @@ "model.layers.13.self_attn.o_proj": { "bits": 8 }, + "model.layers.13.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.13.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.13.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.14.self_attn.q_a_proj": { "bits": 8 }, @@ -260,6 +359,15 @@ "model.layers.14.self_attn.o_proj": { "bits": 8 }, + "model.layers.14.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.14.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.14.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.15.self_attn.q_a_proj": { "bits": 8 }, @@ -275,6 +383,15 @@ "model.layers.15.self_attn.o_proj": { "bits": 8 }, + "model.layers.15.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.15.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.15.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.16.self_attn.q_a_proj": { "bits": 8 }, @@ -290,6 +407,15 @@ "model.layers.16.self_attn.o_proj": { "bits": 8 }, + "model.layers.16.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.16.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.16.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.17.self_attn.q_a_proj": { "bits": 8 }, @@ -305,6 +431,15 @@ "model.layers.17.self_attn.o_proj": { "bits": 8 }, + "model.layers.17.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.17.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.17.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.18.self_attn.q_a_proj": { "bits": 8 }, @@ -320,6 +455,15 @@ "model.layers.18.self_attn.o_proj": { "bits": 8 }, + "model.layers.18.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.18.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.18.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.19.self_attn.q_a_proj": { "bits": 8 }, @@ -335,6 +479,15 @@ "model.layers.19.self_attn.o_proj": { "bits": 8 }, + "model.layers.19.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.19.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.19.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.20.self_attn.q_a_proj": { "bits": 8 }, @@ -350,6 +503,15 @@ "model.layers.20.self_attn.o_proj": { "bits": 8 }, + "model.layers.20.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.20.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.20.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.21.self_attn.q_a_proj": { "bits": 8 }, @@ -365,6 +527,15 @@ "model.layers.21.self_attn.o_proj": { "bits": 8 }, + "model.layers.21.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.21.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.21.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.22.self_attn.q_a_proj": { "bits": 8 }, @@ -380,6 +551,15 @@ "model.layers.22.self_attn.o_proj": { "bits": 8 }, + "model.layers.22.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.22.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.22.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.23.self_attn.q_a_proj": { "bits": 8 }, @@ -395,6 +575,15 @@ "model.layers.23.self_attn.o_proj": { "bits": 8 }, + "model.layers.23.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.23.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.23.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.24.self_attn.q_a_proj": { "bits": 8 }, @@ -410,6 +599,15 @@ "model.layers.24.self_attn.o_proj": { "bits": 8 }, + "model.layers.24.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.24.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.24.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.25.self_attn.q_a_proj": { "bits": 8 }, @@ -425,6 +623,15 @@ "model.layers.25.self_attn.o_proj": { "bits": 8 }, + "model.layers.25.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.25.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.25.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.26.self_attn.q_a_proj": { "bits": 8 }, @@ -440,6 +647,15 @@ "model.layers.26.self_attn.o_proj": { "bits": 8 }, + "model.layers.26.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.26.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.26.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.27.self_attn.q_a_proj": { "bits": 8 }, @@ -455,6 +671,15 @@ "model.layers.27.self_attn.o_proj": { "bits": 8 }, + "model.layers.27.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.27.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.27.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.28.self_attn.q_a_proj": { "bits": 8 }, @@ -470,6 +695,15 @@ "model.layers.28.self_attn.o_proj": { "bits": 8 }, + "model.layers.28.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.28.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.28.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.29.self_attn.q_a_proj": { "bits": 8 }, @@ -485,6 +719,15 @@ "model.layers.29.self_attn.o_proj": { "bits": 8 }, + "model.layers.29.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.29.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.29.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.30.self_attn.q_a_proj": { "bits": 8 }, @@ -500,6 +743,15 @@ "model.layers.30.self_attn.o_proj": { "bits": 8 }, + "model.layers.30.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.30.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.30.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.31.self_attn.q_a_proj": { "bits": 8 }, @@ -515,6 +767,15 @@ "model.layers.31.self_attn.o_proj": { "bits": 8 }, + "model.layers.31.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.31.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.31.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.32.self_attn.q_a_proj": { "bits": 8 }, @@ -530,6 +791,15 @@ "model.layers.32.self_attn.o_proj": { "bits": 8 }, + "model.layers.32.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.32.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.32.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.33.self_attn.q_a_proj": { "bits": 8 }, @@ -545,6 +815,15 @@ "model.layers.33.self_attn.o_proj": { "bits": 8 }, + "model.layers.33.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.33.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.33.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.34.self_attn.q_a_proj": { "bits": 8 }, @@ -560,6 +839,15 @@ "model.layers.34.self_attn.o_proj": { "bits": 8 }, + "model.layers.34.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.34.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.34.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.35.self_attn.q_a_proj": { "bits": 8 }, @@ -575,6 +863,15 @@ "model.layers.35.self_attn.o_proj": { "bits": 8 }, + "model.layers.35.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.35.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.35.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.36.self_attn.q_a_proj": { "bits": 8 }, @@ -590,6 +887,15 @@ "model.layers.36.self_attn.o_proj": { "bits": 8 }, + "model.layers.36.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.36.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.36.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.37.self_attn.q_a_proj": { "bits": 8 }, @@ -605,6 +911,15 @@ "model.layers.37.self_attn.o_proj": { "bits": 8 }, + "model.layers.37.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.37.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.37.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.38.self_attn.q_a_proj": { "bits": 8 }, @@ -620,6 +935,15 @@ "model.layers.38.self_attn.o_proj": { "bits": 8 }, + "model.layers.38.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.38.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.38.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.39.self_attn.q_a_proj": { "bits": 8 }, @@ -635,6 +959,15 @@ "model.layers.39.self_attn.o_proj": { "bits": 8 }, + "model.layers.39.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.39.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.39.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.40.self_attn.q_a_proj": { "bits": 8 }, @@ -650,6 +983,15 @@ "model.layers.40.self_attn.o_proj": { "bits": 8 }, + "model.layers.40.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.40.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.40.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.41.self_attn.q_a_proj": { "bits": 8 }, @@ -665,6 +1007,15 @@ "model.layers.41.self_attn.o_proj": { "bits": 8 }, + "model.layers.41.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.41.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.41.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.42.self_attn.q_a_proj": { "bits": 8 }, @@ -680,6 +1031,15 @@ "model.layers.42.self_attn.o_proj": { "bits": 8 }, + "model.layers.42.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.42.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.42.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.43.self_attn.q_a_proj": { "bits": 8 }, @@ -695,6 +1055,15 @@ "model.layers.43.self_attn.o_proj": { "bits": 8 }, + "model.layers.43.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.43.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.43.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.44.self_attn.q_a_proj": { "bits": 8 }, @@ -710,6 +1079,15 @@ "model.layers.44.self_attn.o_proj": { "bits": 8 }, + "model.layers.44.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.44.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.44.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.45.self_attn.q_a_proj": { "bits": 8 }, @@ -725,6 +1103,15 @@ "model.layers.45.self_attn.o_proj": { "bits": 8 }, + "model.layers.45.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.45.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.45.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.46.self_attn.q_a_proj": { "bits": 8 }, @@ -740,6 +1127,15 @@ "model.layers.46.self_attn.o_proj": { "bits": 8 }, + "model.layers.46.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.46.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.46.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.47.self_attn.q_a_proj": { "bits": 8 }, @@ -755,6 +1151,15 @@ "model.layers.47.self_attn.o_proj": { "bits": 8 }, + "model.layers.47.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.47.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.47.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.48.self_attn.q_a_proj": { "bits": 8 }, @@ -770,6 +1175,15 @@ "model.layers.48.self_attn.o_proj": { "bits": 8 }, + "model.layers.48.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.48.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.48.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.49.self_attn.q_a_proj": { "bits": 8 }, @@ -785,6 +1199,15 @@ "model.layers.49.self_attn.o_proj": { "bits": 8 }, + "model.layers.49.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.49.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.49.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.50.self_attn.q_a_proj": { "bits": 8 }, @@ -800,6 +1223,15 @@ "model.layers.50.self_attn.o_proj": { "bits": 8 }, + "model.layers.50.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.50.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.50.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.51.self_attn.q_a_proj": { "bits": 8 }, @@ -815,6 +1247,15 @@ "model.layers.51.self_attn.o_proj": { "bits": 8 }, + "model.layers.51.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.51.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.51.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.52.self_attn.q_a_proj": { "bits": 8 }, @@ -830,6 +1271,15 @@ "model.layers.52.self_attn.o_proj": { "bits": 8 }, + "model.layers.52.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.52.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.52.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.53.self_attn.q_a_proj": { "bits": 8 }, @@ -845,6 +1295,15 @@ "model.layers.53.self_attn.o_proj": { "bits": 8 }, + "model.layers.53.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.53.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.53.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.54.self_attn.q_a_proj": { "bits": 8 }, @@ -860,6 +1319,15 @@ "model.layers.54.self_attn.o_proj": { "bits": 8 }, + "model.layers.54.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.54.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.54.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.55.self_attn.q_a_proj": { "bits": 8 }, @@ -875,6 +1343,15 @@ "model.layers.55.self_attn.o_proj": { "bits": 8 }, + "model.layers.55.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.55.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.55.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.56.self_attn.q_a_proj": { "bits": 8 }, @@ -890,6 +1367,15 @@ "model.layers.56.self_attn.o_proj": { "bits": 8 }, + "model.layers.56.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.56.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.56.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.57.self_attn.q_a_proj": { "bits": 8 }, @@ -905,6 +1391,15 @@ "model.layers.57.self_attn.o_proj": { "bits": 8 }, + "model.layers.57.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.57.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.57.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.58.self_attn.q_a_proj": { "bits": 8 }, @@ -920,6 +1415,15 @@ "model.layers.58.self_attn.o_proj": { "bits": 8 }, + "model.layers.58.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.58.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.58.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.59.self_attn.q_a_proj": { "bits": 8 }, @@ -935,6 +1439,15 @@ "model.layers.59.self_attn.o_proj": { "bits": 8 }, + "model.layers.59.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.59.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.59.mlp.shared_experts.down_proj": { + "bits": 8 + }, "model.layers.60.self_attn.q_a_proj": { "bits": 8 }, @@ -949,6 +1462,15 @@ }, "model.layers.60.self_attn.o_proj": { "bits": 8 + }, + "model.layers.60.mlp.shared_experts.gate_proj": { + "bits": 8 + }, + "model.layers.60.mlp.shared_experts.up_proj": { + "bits": 8 + }, + "model.layers.60.mlp.shared_experts.down_proj": { + "bits": 8 } } } \ No newline at end of file