TF-Keras
chrisdonahue-goog commited on
Commit
6613f63
·
verified ·
1 Parent(s): 488cb7e

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +2 -0
  2. checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.depth_decoder.depth_layers_0.pre_self_attention_layer_norm.scale.v/.zarray +1 -0
  3. checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.depth_decoder.depth_layers_0.pre_self_attention_layer_norm.scale.v/0 +0 -0
  4. checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_11.pre_mlp_layer_norm.scale.v/.zarray +1 -0
  5. checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_11.pre_mlp_layer_norm.scale.v/0 +0 -0
  6. checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_15.pre_cross_attention_layer_norm.scale.v/.zarray +1 -0
  7. checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_15.pre_cross_attention_layer_norm.scale.v/0 +0 -0
  8. checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_3.pre_self_attention_layer_norm.scale.v/.zarray +1 -0
  9. checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_3.pre_self_attention_layer_norm.scale.v/0 +0 -0
  10. checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_6.pre_cross_attention_layer_norm.scale.v/.zarray +1 -0
  11. checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_6.pre_cross_attention_layer_norm.scale.v/0 +0 -0
  12. checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray +1 -0
  13. checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_1.pre_mlp_layer_norm.scale.v/0 +0 -0
  14. checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_15.pre_attention_layer_norm.scale.v/.zarray +1 -0
  15. checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_15.pre_attention_layer_norm.scale.v/0 +0 -0
  16. checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_15.pre_mlp_layer_norm.scale.v/.zarray +1 -0
  17. checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_15.pre_mlp_layer_norm.scale.v/0 +0 -0
  18. checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_22.pre_attention_layer_norm.scale.v/.zarray +1 -0
  19. checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_22.pre_attention_layer_norm.scale.v/0 +0 -0
  20. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_0.mlp.wi_0.kernel/.zarray +1 -0
  21. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.self_attention.key.kernel/.zarray +1 -0
  22. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.key.kernel/.zarray +1 -0
  23. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.query.kernel/.zarray +1 -0
  24. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_0.encoder_decoder_attention.value.kernel/0.0 +3 -0
  25. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_0.encoder_decoder_attention.value.kernel/0.1 +3 -0
  26. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_1.encoder_decoder_attention.key.kernel/.zarray +1 -0
  27. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_1.encoder_decoder_attention.query.kernel/.zarray +1 -0
  28. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_10.encoder_decoder_attention.out.kernel/.zarray +1 -0
  29. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_10.mlp.wo.kernel/.zarray +1 -0
  30. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_10.pre_mlp_layer_norm.scale/.zarray +1 -0
  31. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_10.pre_mlp_layer_norm.scale/0 +0 -0
  32. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_10.self_attention.out.kernel/.zarray +1 -0
  33. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_12.mlp.wi_0.kernel/.zarray +1 -0
  34. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_12.mlp.wi_1.kernel/.zarray +1 -0
  35. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_12.self_attention.key.kernel/.zarray +1 -0
  36. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_13.encoder_decoder_attention.value.kernel/.zarray +1 -0
  37. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_13.self_attention.query.kernel/.zarray +1 -0
  38. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_13.self_attention.value.kernel/.zarray +1 -0
  39. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_14.pre_self_attention_layer_norm.scale/.zarray +1 -0
  40. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_14.pre_self_attention_layer_norm.scale/0 +0 -0
  41. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_14.self_attention.out.kernel/.zarray +1 -0
  42. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_16.pre_self_attention_layer_norm.scale/.zarray +1 -0
  43. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_17.encoder_decoder_attention.query.kernel/.zarray +1 -0
  44. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_17.mlp.wi_0.kernel/.zarray +1 -0
  45. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_17.pre_mlp_layer_norm.scale/.zarray +1 -0
  46. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_17.pre_mlp_layer_norm.scale/0 +0 -0
  47. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_18.self_attention.out.kernel/.zarray +1 -0
  48. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_19.mlp.wi_0.kernel/.zarray +1 -0
  49. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_19.pre_mlp_layer_norm.scale/.zarray +1 -0
  50. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_19.pre_mlp_layer_norm.scale/0 +0 -0
.gitattributes CHANGED
@@ -33,3 +33,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_0.encoder_decoder_attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
37
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_0.encoder_decoder_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.depth_decoder.depth_layers_0.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.depth_decoder.depth_layers_0.pre_self_attention_layer_norm.scale.v/0 ADDED
Binary file (3.7 kB). View file
 
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_11.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_11.pre_mlp_layer_norm.scale.v/0 ADDED
Binary file (3.72 kB). View file
 
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_15.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_15.pre_cross_attention_layer_norm.scale.v/0 ADDED
Binary file (3.7 kB). View file
 
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_3.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_3.pre_self_attention_layer_norm.scale.v/0 ADDED
Binary file (3.8 kB). View file
 
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_6.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_6.pre_cross_attention_layer_norm.scale.v/0 ADDED
Binary file (3.73 kB). View file
 
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_1.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_1.pre_mlp_layer_norm.scale.v/0 ADDED
Binary file (3.72 kB). View file
 
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_15.pre_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_15.pre_attention_layer_norm.scale.v/0 ADDED
Binary file (3.73 kB). View file
 
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_15.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_15.pre_mlp_layer_norm.scale.v/0 ADDED
Binary file (3.76 kB). View file
 
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_22.pre_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_22.pre_attention_layer_norm.scale.v/0 ADDED
Binary file (3.72 kB). View file
 
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_0.mlp.wi_0.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024,1408],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024,2816],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.self_attention.key.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024,1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.key.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024,1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.query.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024,1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_0.encoder_decoder_attention.value.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:362a4551f684f50d275cfd52b94706c453921ed496636187314cb5351860fc2e
3
+ size 1954341
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_0.encoder_decoder_attention.value.kernel/0.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:95dc531f3af19c09d80d4bff8fae60cca272e9296a34258421b0c61335810f60
3
+ size 1953662
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_1.encoder_decoder_attention.key.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024,1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_1.encoder_decoder_attention.query.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024,1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_10.encoder_decoder_attention.out.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[512,1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024,1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_10.mlp.wo.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1408,1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[2816,1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_10.pre_mlp_layer_norm.scale/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_10.pre_mlp_layer_norm.scale/0 ADDED
Binary file (3.66 kB). View file
 
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_10.self_attention.out.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[512,1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024,1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_12.mlp.wi_0.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024,1408],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024,2816],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_12.mlp.wi_1.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024,1408],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024,2816],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_12.self_attention.key.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024,1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_13.encoder_decoder_attention.value.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024,1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_13.self_attention.query.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024,1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_13.self_attention.value.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024,1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_14.pre_self_attention_layer_norm.scale/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_14.pre_self_attention_layer_norm.scale/0 ADDED
Binary file (3.68 kB). View file
 
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_14.self_attention.out.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[512,1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024,1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_16.pre_self_attention_layer_norm.scale/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_17.encoder_decoder_attention.query.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024,1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_17.mlp.wi_0.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024,1408],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024,2816],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_17.pre_mlp_layer_norm.scale/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_17.pre_mlp_layer_norm.scale/0 ADDED
Binary file (3.65 kB). View file
 
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_18.self_attention.out.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[512,1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024,1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_19.mlp.wi_0.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024,1408],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024,2816],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_19.pre_mlp_layer_norm.scale/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_19.pre_mlp_layer_norm.scale/0 ADDED
Binary file (3.64 kB). View file