TF-Keras
chrisdonahue-goog commited on
Commit
a221639
·
verified ·
1 Parent(s): 621b846

Add files using upload-large-folder tool

Browse files
Files changed (29) hide show
  1. .gitattributes +28 -0
  2. checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.self_attention.value.kernel/0.0 +3 -0
  3. checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_13.encoder_decoder_attention.query.kernel/0.0 +3 -0
  4. checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_14.mlp.wi_0.kernel/0.0 +3 -0
  5. checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_15.self_attention.out.kernel/0.0 +3 -0
  6. checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_16.encoder_decoder_attention.query.kernel/0.0 +3 -0
  7. checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_16.mlp.wi_0.kernel/0.0 +3 -0
  8. checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_16.self_attention.value.kernel/0.0 +3 -0
  9. checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_17.self_attention.key.kernel/0.0 +3 -0
  10. checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_17.self_attention.out.kernel/0.0 +3 -0
  11. checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_18.encoder_decoder_attention.query.kernel/0.0 +3 -0
  12. checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_18.mlp.wo.kernel/0.0 +3 -0
  13. checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_4.encoder_decoder_attention.value.kernel/0.0 +3 -0
  14. checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_5.encoder_decoder_attention.out.kernel/0.0 +3 -0
  15. checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_6.mlp.wo.kernel/0.0 +3 -0
  16. checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_9.self_attention.out.kernel/0.0 +3 -0
  17. checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_9.self_attention.value.kernel/0.0 +3 -0
  18. checkpoints/llm_base_x4286_c1860k/target.encoder.layers_0.attention.key.kernel/0.0 +3 -0
  19. checkpoints/llm_base_x4286_c1860k/target.encoder.layers_1.attention.value.kernel/0.0 +3 -0
  20. checkpoints/llm_base_x4286_c1860k/target.encoder.layers_1.mlp.wo.kernel/0.0 +3 -0
  21. checkpoints/llm_base_x4286_c1860k/target.encoder.layers_10.attention.key.kernel/0.0 +3 -0
  22. checkpoints/llm_base_x4286_c1860k/target.encoder.layers_11.attention.key.kernel/0.0 +3 -0
  23. checkpoints/llm_base_x4286_c1860k/target.encoder.layers_11.mlp.wo.kernel/0.0 +3 -0
  24. checkpoints/llm_base_x4286_c1860k/target.encoder.layers_3.attention.out.kernel/0.0 +3 -0
  25. checkpoints/llm_base_x4286_c1860k/target.encoder.layers_4.mlp.wi_1.kernel/0.0 +3 -0
  26. checkpoints/llm_base_x4286_c1860k/target.encoder.layers_7.attention.query.kernel/0.0 +3 -0
  27. checkpoints/llm_base_x4286_c1860k/target.encoder.layers_9.attention.key.kernel/0.0 +3 -0
  28. checkpoints/llm_base_x4286_c1860k/target.token_embedder.embedding/0.0 +3 -0
  29. checkpoints/llm_base_x4286_c1860k/target.token_embedder.embedding/1.0 +3 -0
.gitattributes CHANGED
@@ -1184,3 +1184,31 @@ checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers
1184
  checkpoints/llm_base_x4286_c1860k/target.encoder.layers_8.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
1185
  checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_1.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
1186
  checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.self_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1184
  checkpoints/llm_base_x4286_c1860k/target.encoder.layers_8.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
1185
  checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_1.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
1186
  checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.self_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
1187
+ checkpoints/llm_base_x4286_c1860k/target.encoder.layers_10.attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
1188
+ checkpoints/llm_base_x4286_c1860k/target.encoder.layers_11.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
1189
+ checkpoints/llm_base_x4286_c1860k/target.encoder.layers_9.attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
1190
+ checkpoints/llm_base_x4286_c1860k/target.encoder.layers_3.attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
1191
+ checkpoints/llm_base_x4286_c1860k/target.encoder.layers_0.attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
1192
+ checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.self_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
1193
+ checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_17.self_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
1194
+ checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_16.self_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
1195
+ checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_9.self_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
1196
+ checkpoints/llm_base_x4286_c1860k/target.encoder.layers_7.attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
1197
+ checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_5.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
1198
+ checkpoints/llm_base_x4286_c1860k/target.token_embedder.embedding/0.0 filter=lfs diff=lfs merge=lfs -text
1199
+ checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_17.self_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
1200
+ checkpoints/llm_base_x4286_c1860k/target.token_embedder.embedding/1.0 filter=lfs diff=lfs merge=lfs -text
1201
+ checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_13.encoder_decoder_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
1202
+ checkpoints/llm_base_x4286_c1860k/target.encoder.layers_11.attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
1203
+ checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_6.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
1204
+ checkpoints/llm_base_x4286_c1860k/target.encoder.layers_4.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
1205
+ checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_18.encoder_decoder_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
1206
+ checkpoints/llm_base_x4286_c1860k/target.encoder.layers_1.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
1207
+ checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_16.encoder_decoder_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
1208
+ checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_9.self_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
1209
+ checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_4.encoder_decoder_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
1210
+ checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_14.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
1211
+ checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_16.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
1212
+ checkpoints/llm_base_x4286_c1860k/target.encoder.layers_1.attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
1213
+ checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_15.self_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
1214
+ checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_18.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.self_attention.value.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36e02cb4148ca3896f5fb05963956db2341c49489bdb8d3b5e14e3198c8d0a24
3
+ size 2197975
checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_13.encoder_decoder_attention.query.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73f9b65fbcd4c045ec025389fa97171146b57243031f01443a928f7680d7559e
3
+ size 2193405
checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_14.mlp.wi_0.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11d12f5c7f6a63010373f61040dd5c52a8126a7752aac4968d9cd2775e9977fc
3
+ size 5867924
checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_15.self_attention.out.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f908133b6f3a4d6cbdc1fbed0207f0d1ebb36429dd91e2a3ecefad7b224399f
3
+ size 2199897
checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_16.encoder_decoder_attention.query.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa09a69aee80f5c7e83941df85c2e516a35894bf38f36de911b36a3f4751fb8a
3
+ size 2193362
checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_16.mlp.wi_0.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:381944b5686ab10fbb7fea75f5b69ab69bcf2e3b6d1f091668aa9994d7fe4b07
3
+ size 5867668
checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_16.self_attention.value.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5192ac33b8b4a6778767076a382907dba9715067f499a73e3c8cca54c480c7c7
3
+ size 2199819
checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_17.self_attention.key.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b9c48528a03b28362eb3b62a81fcc0a21ef0e2e793497a7948a2b09a7399e44
3
+ size 2199637
checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_17.self_attention.out.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57ca26ffdee13a17fd503335007a5694e9ced2d8ec907886d0b6ba7ddb2afea5
3
+ size 2200312
checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_18.encoder_decoder_attention.query.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39b54dc39ba87b2b0dfb6807762f2fbb6408e7d2f8bc8deb94caee7f2a32ff51
3
+ size 2193629
checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_18.mlp.wo.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee388de2ec18cc203acbbf113ffdbbfe89c6fca37b0278b84e2aa753aff45580
3
+ size 5872793
checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_4.encoder_decoder_attention.value.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dae84993077fc728bafea0b4e1097d0db67c57790c6e8f3f6e63aec86fe13cac
3
+ size 2196190
checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_5.encoder_decoder_attention.out.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa5ceee2116fe149fdf27b262d68e6669c71124e3c7419758118d0f95fa2b796
3
+ size 2195682
checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_6.mlp.wo.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:215f601d6c8c68364e21235569dd42af35642e836dd86bd4a305c7476dc63dae
3
+ size 5878898
checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_9.self_attention.out.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dbcd34a8c25944ada1cd4031fcdcf060a87021dacae8cda1a3343d79dd52fb11
3
+ size 2198712
checkpoints/llm_base_x4286_c1860k/target.decoder.decoder.temporal_decoder.layers_9.self_attention.value.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5cf8349618460ebbdf5cb44e2e8984a79da5a2836df05a8eece6a54ce215b1f3
3
+ size 2196894
checkpoints/llm_base_x4286_c1860k/target.encoder.layers_0.attention.key.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34f1de424e3484b31dc6558dbd12cb1455626878b86f47056888ceb25e195255
3
+ size 2201013
checkpoints/llm_base_x4286_c1860k/target.encoder.layers_1.attention.value.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb200c739fd407cb0b78c421f6f78ab54281cf5948c7c34513c5eba3265dee31
3
+ size 2200147
checkpoints/llm_base_x4286_c1860k/target.encoder.layers_1.mlp.wo.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1e1b2c4cd42036029f10b8f141afbebe96190fb281d6c48fe6431267538d3b1
3
+ size 5870960
checkpoints/llm_base_x4286_c1860k/target.encoder.layers_10.attention.key.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4df428d5978bd553b8c871ac8e76fc934143a03105cedd116987f43627001b9
3
+ size 2198723
checkpoints/llm_base_x4286_c1860k/target.encoder.layers_11.attention.key.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce5250412638529150256f828c5c7d6dd04172a3cfaa0870f2d7e913cbb326b3
3
+ size 2198631
checkpoints/llm_base_x4286_c1860k/target.encoder.layers_11.mlp.wo.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:067bad8b5db3acc70b57940160a79f62747f618efa8c894d151d3e4c1bf97130
3
+ size 5880527
checkpoints/llm_base_x4286_c1860k/target.encoder.layers_3.attention.out.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47b3077fdb4e2482a253dbef65bae774960f1ba4f4dbd9ded16fbd193d4a85f3
3
+ size 2199621
checkpoints/llm_base_x4286_c1860k/target.encoder.layers_4.mlp.wi_1.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48569f89c0a8b7bdf2f52e84aee93e4f330665a18a92c8cf802999066383ca86
3
+ size 5862866
checkpoints/llm_base_x4286_c1860k/target.encoder.layers_7.attention.query.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64cde5843072e77d758343f1e53e458d4bec25078caa77c9971e05b735b77afa
3
+ size 2193058
checkpoints/llm_base_x4286_c1860k/target.encoder.layers_9.attention.key.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2c60932cb91f96d313d8b11b0c299f92fc3ca979421b28ae2e0e02f11b75828
3
+ size 2198483
checkpoints/llm_base_x4286_c1860k/target.token_embedder.embedding/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7379a28c9e05a2407c43f538ba7c132a4f3f55cfe04b4a58369a62c3ac591485
3
+ size 42817251
checkpoints/llm_base_x4286_c1860k/target.token_embedder.embedding/1.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53ddfda9ffd2a7d48b60536b33b1d0ea9d15df1a6b8e967640871081d8b4668b
3
+ size 42672400