Update models
Browse files- .gitattributes +13 -0
- config.json +54 -0
- gemma-3-270m-it-Q2_K.gguf +3 -0
- gemma-3-270m-it-Q3_K_L.gguf +3 -0
- gemma-3-270m-it-Q3_K_M.gguf +3 -0
- gemma-3-270m-it-Q3_K_S.gguf +3 -0
- gemma-3-270m-it-Q4_0.gguf +3 -0
- gemma-3-270m-it-Q4_K_M.gguf +3 -0
- gemma-3-270m-it-Q4_K_S.gguf +3 -0
- gemma-3-270m-it-Q5_0.gguf +3 -0
- gemma-3-270m-it-Q5_K_M.gguf +3 -0
- gemma-3-270m-it-Q5_K_S.gguf +3 -0
- gemma-3-270m-it-Q6_K.gguf +3 -0
- gemma-3-270m-it-Q8_0.gguf +3 -0
- gemma-3-270m-it-f16.gguf +3 -0
.gitattributes
CHANGED
@@ -33,3 +33,16 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
gemma-3-270m-it-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text
|
37 |
+
gemma-3-270m-it-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
|
38 |
+
gemma-3-270m-it-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
39 |
+
gemma-3-270m-it-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
40 |
+
gemma-3-270m-it-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text
|
41 |
+
gemma-3-270m-it-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
42 |
+
gemma-3-270m-it-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
43 |
+
gemma-3-270m-it-Q5_0.gguf filter=lfs diff=lfs merge=lfs -text
|
44 |
+
gemma-3-270m-it-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
45 |
+
gemma-3-270m-it-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
46 |
+
gemma-3-270m-it-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
|
47 |
+
gemma-3-270m-it-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text
|
48 |
+
gemma-3-270m-it-f16.gguf filter=lfs diff=lfs merge=lfs -text
|
config.json
ADDED
@@ -0,0 +1,54 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_sliding_window_pattern": 6,
|
3 |
+
"architectures": [
|
4 |
+
"Gemma3ForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"attn_logit_softcapping": null,
|
9 |
+
"bos_token_id": 2,
|
10 |
+
"eos_token_id": 1,
|
11 |
+
"final_logit_softcapping": null,
|
12 |
+
"head_dim": 256,
|
13 |
+
"hidden_activation": "gelu_pytorch_tanh",
|
14 |
+
"hidden_size": 640,
|
15 |
+
"initializer_range": 0.02,
|
16 |
+
"intermediate_size": 2048,
|
17 |
+
"layer_types": [
|
18 |
+
"sliding_attention",
|
19 |
+
"sliding_attention",
|
20 |
+
"sliding_attention",
|
21 |
+
"sliding_attention",
|
22 |
+
"sliding_attention",
|
23 |
+
"full_attention",
|
24 |
+
"sliding_attention",
|
25 |
+
"sliding_attention",
|
26 |
+
"sliding_attention",
|
27 |
+
"sliding_attention",
|
28 |
+
"sliding_attention",
|
29 |
+
"full_attention",
|
30 |
+
"sliding_attention",
|
31 |
+
"sliding_attention",
|
32 |
+
"sliding_attention",
|
33 |
+
"sliding_attention",
|
34 |
+
"sliding_attention",
|
35 |
+
"full_attention"
|
36 |
+
],
|
37 |
+
"max_position_embeddings": 32768,
|
38 |
+
"model_type": "gemma3_text",
|
39 |
+
"num_attention_heads": 4,
|
40 |
+
"num_hidden_layers": 18,
|
41 |
+
"num_key_value_heads": 1,
|
42 |
+
"pad_token_id": 0,
|
43 |
+
"query_pre_attn_scalar": 256,
|
44 |
+
"rms_norm_eps": 1e-06,
|
45 |
+
"rope_local_base_freq": 10000.0,
|
46 |
+
"rope_scaling": null,
|
47 |
+
"rope_theta": 1000000.0,
|
48 |
+
"sliding_window": 512,
|
49 |
+
"torch_dtype": "bfloat16",
|
50 |
+
"transformers_version": "4.55.0.dev0",
|
51 |
+
"use_bidirectional_attention": false,
|
52 |
+
"use_cache": true,
|
53 |
+
"vocab_size": 262144
|
54 |
+
}
|
gemma-3-270m-it-Q2_K.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5abaaccdcd69192bb100a6f66146ad1e0e092b23d088d6d626cc15f8ad5af670
|
3 |
+
size 237079040
|
gemma-3-270m-it-Q3_K_L.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ae4f47ade6d03993a223fb372a46fb5f52fce72f49cc7f32c2b6fe37a3b1d8a2
|
3 |
+
size 246387200
|
gemma-3-270m-it-Q3_K_M.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:38022a57a75a63705db55b8f75b4f655fb2a1dc412ce2523451c4fa3c0640a72
|
3 |
+
size 241963520
|
gemma-3-270m-it-Q3_K_S.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e1ae7f5b09fb8dd5595e863f883e61570dab19fbe2b71c819603776a9c4cf990
|
3 |
+
size 236710400
|
gemma-3-270m-it-Q4_0.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:542c1a0aa267b9aad9bac7a285aa513f9a932346263bff6dd27e9ba3102b0e7d
|
3 |
+
size 241410560
|
gemma-3-270m-it-Q4_K_M.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:57bbce8f2095939bde118bafbb65279c6e36ee8bcb09ee258f7f5d6a7b8e7f39
|
3 |
+
size 253114880
|
gemma-3-270m-it-Q4_K_S.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:39cbb18495fb272f26738cae50454cb35b0fb9a5910d8dcea907664d134ed42b
|
3 |
+
size 249889280
|
gemma-3-270m-it-Q5_0.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d19335c73a3359d0f2643eb0efda378cd9fd9a3b0ddf96b113416463eaae8649
|
3 |
+
size 253944320
|
gemma-3-270m-it-Q5_K_M.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3bf42ab816603a57a54c280d26b64dbdc3ec34d76d404db676f31c4dffc77a95
|
3 |
+
size 260026880
|
gemma-3-270m-it-Q5_K_S.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b2dbfd9a04f767c7cfe83aaa7e2683c9611540092cf7d78633df80556662596d
|
3 |
+
size 257999360
|
gemma-3-270m-it-Q6_K.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7211704d68295495e756642a3097efb17ccb4b06964fccb49d57a891205e500a
|
3 |
+
size 282974720
|
gemma-3-270m-it-Q8_0.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ef57d2c838458a1952664260dcba38e5bdda37494f3af732f06e4add24068e3
|
3 |
+
size 291545600
|
gemma-3-270m-it-f16.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2f96c9a2740dc6eb5ca11c3ed19c97820259e1d1927ac959fd597735ab02c07
|
3 |
+
size 542835200
|