ctigges committed on
Commit
fccc682
·
verified ·
1 Parent(s): 6e8bb54

Upload 2 files

Browse files
tied-per-target-layerwise-token-topk/cfg.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "num_features": 32768,
3
+ "num_layers": 12,
4
+ "d_model": 768,
5
+ "activation_fn": "topk",
6
+ "topk_k": 16,
7
+ "topk_straight_through": true,
8
+ "topk_mode": "per_layer",
9
+ "decoder_tying": "per_target",
10
+ "enable_feature_offset": false,
11
+ "enable_feature_scale": false,
12
+ "skip_connection": false,
13
+ "normalization_method": "mean_std"
14
+ }
tied-per-target-layerwise-token-topk/clt_checkpoint_97689.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a78e598ec49dde9f7039786c97a9228defc8e1cac305f91accab4ba408d5908a
3
+ size 2417534048