TF-Keras
chrisdonahue-goog committed on
Commit
d940c77
·
verified ·
1 Parent(s): 5908681

Add files using upload-large-folder tool

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +103 -0
  2. checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray +1 -0
  3. checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_0.pre_self_attention_layer_norm.scale.v/0 +0 -0
  4. checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_16.pre_mlp_layer_norm.scale.v/.zarray +1 -0
  5. checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_16.pre_mlp_layer_norm.scale.v/0 +0 -0
  6. checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_19.pre_cross_attention_layer_norm.scale.v/.zarray +1 -0
  7. checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_19.pre_cross_attention_layer_norm.scale.v/0 +0 -0
  8. checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_19.pre_mlp_layer_norm.scale.v/.zarray +1 -0
  9. checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_19.pre_mlp_layer_norm.scale.v/0 +0 -0
  10. checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_3.pre_mlp_layer_norm.scale.v/.zarray +1 -0
  11. checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_3.pre_mlp_layer_norm.scale.v/0 +0 -0
  12. checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_5.pre_cross_attention_layer_norm.scale.v/.zarray +1 -0
  13. checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_5.pre_mlp_layer_norm.scale.v/.zarray +1 -0
  14. checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_5.pre_mlp_layer_norm.scale.v/0 +0 -0
  15. checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_5.pre_self_attention_layer_norm.scale.v/.zarray +1 -0
  16. checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_5.pre_self_attention_layer_norm.scale.v/0 +0 -0
  17. checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_6.pre_mlp_layer_norm.scale.v/.zarray +1 -0
  18. checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_7.pre_mlp_layer_norm.scale.v/.zarray +1 -0
  19. checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_7.pre_mlp_layer_norm.scale.v/0 +0 -0
  20. checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_16.pre_attention_layer_norm.scale.v/.zarray +1 -0
  21. checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_16.pre_attention_layer_norm.scale.v/0 +0 -0
  22. checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_2.pre_attention_layer_norm.scale.v/.zarray +1 -0
  23. checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_2.pre_attention_layer_norm.scale.v/0 +0 -0
  24. checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_21.pre_attention_layer_norm.scale.v/.zarray +1 -0
  25. checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_21.pre_attention_layer_norm.scale.v/0 +0 -0
  26. checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_4.pre_mlp_layer_norm.scale.v/.zarray +1 -0
  27. checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_4.pre_mlp_layer_norm.scale.v/0 +0 -0
  28. checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_6.pre_attention_layer_norm.scale.v/.zarray +1 -0
  29. checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_6.pre_mlp_layer_norm.scale.v/.zarray +1 -0
  30. checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_6.pre_mlp_layer_norm.scale.v/0 +0 -0
  31. checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_9.pre_attention_layer_norm.scale.v/.zarray +1 -0
  32. checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_9.pre_attention_layer_norm.scale.v/0 +0 -0
  33. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_0.mlp.wi_0.kernel/0.0 +3 -0
  34. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_0.mlp.wi_0.kernel/0.1 +3 -0
  35. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.pre_self_attention_layer_norm.scale/.zarray +1 -0
  36. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.pre_self_attention_layer_norm.scale/0 +0 -0
  37. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.self_attention.key.kernel/0.0 +3 -0
  38. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.self_attention.key.kernel/0.1 +3 -0
  39. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.mlp.wi_1.kernel/.zarray +1 -0
  40. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.mlp.wi_1.kernel/0.0 +3 -0
  41. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.mlp.wi_1.kernel/0.1 +3 -0
  42. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.key.kernel/0.0 +3 -0
  43. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.key.kernel/0.1 +3 -0
  44. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.query.kernel/0.0 +3 -0
  45. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.query.kernel/0.1 +3 -0
  46. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.value.kernel/.zarray +1 -0
  47. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_0.pre_cross_attention_layer_norm.scale/.zarray +1 -0
  48. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_0.pre_cross_attention_layer_norm.scale/0 +0 -0
  49. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_1.encoder_decoder_attention.key.kernel/0.0 +3 -0
  50. checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_1.encoder_decoder_attention.key.kernel/0.1 +3 -0
.gitattributes CHANGED
@@ -151,3 +151,106 @@ savedmodels/ssv2_48k_stereo/encoder/variables/variables.data-00000-of-00001 filt
151
  checkpoints/llm_large_x3047_c1860k/target.encoder.layers_8.attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
152
  checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_2.encoder_decoder_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
153
  checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_10.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
151
  checkpoints/llm_large_x3047_c1860k/target.encoder.layers_8.attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
152
  checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_2.encoder_decoder_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
153
  checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_10.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
154
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_10.encoder_decoder_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
155
+ checkpoints/llm_large_x3047_c1860k/target.encoder.layers_19.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
156
+ checkpoints/llm_large_x3047_c1860k/target.encoder.layers_19.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
157
+ checkpoints/llm_large_x3047_c1860k/target.encoder.layers_12.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
158
+ checkpoints/llm_large_x3047_c1860k/target.encoder.layers_8.attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
159
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_2.encoder_decoder_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
160
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.self_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
161
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_6.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
162
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.self_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
163
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_6.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
164
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_10.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
165
+ checkpoints/llm_large_x3047_c1860k/target.encoder.layers_10.attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
166
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_3.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
167
+ checkpoints/llm_large_x3047_c1860k/target.encoder.layers_10.attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
168
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_10.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
169
+ checkpoints/llm_large_x3047_c1860k/target.encoder.layers_14.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
170
+ checkpoints/llm_large_x3047_c1860k/target.encoder.layers_9.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
171
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
172
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_12.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
173
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_12.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
174
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_3.self_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
175
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_3.self_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
176
+ checkpoints/llm_large_x3047_c1860k/target.encoder.layers_6.attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
177
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_1.encoder_decoder_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
178
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_1.encoder_decoder_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
179
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_7.encoder_decoder_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
180
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_3.encoder_decoder_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
181
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_7.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
182
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
183
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
184
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
185
+ checkpoints/llm_large_x3047_c1860k/target.encoder.layers_6.attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
186
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_13.encoder_decoder_attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
187
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_9.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
188
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_4.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
189
+ checkpoints/llm_large_x3047_c1860k/target.encoder.layers_1.attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
190
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_13.encoder_decoder_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
191
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_8.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
192
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_13.self_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
193
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_13.self_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
194
+ checkpoints/llm_large_x3047_c1860k/target.encoder.layers_1.attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
195
+ checkpoints/llm_large_x3047_c1860k/target.encoder.layers_9.attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
196
+ checkpoints/llm_large_x3047_c1860k/target.encoder.layers_20.attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
197
+ checkpoints/llm_large_x3047_c1860k/target.encoder.layers_9.attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
198
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_8.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
199
+ checkpoints/llm_large_x3047_c1860k/target.encoder.layers_20.attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
200
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_4.self_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
201
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_4.self_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
202
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_1.encoder_decoder_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
203
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_1.encoder_decoder_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
204
+ checkpoints/llm_large_x3047_c1860k/target.encoder.layers_11.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
205
+ checkpoints/llm_large_x3047_c1860k/target.encoder.layers_11.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
206
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_4.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
207
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_12.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
208
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_17.encoder_decoder_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
209
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_7.self_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
210
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_17.encoder_decoder_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
211
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_7.self_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
212
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_14.self_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
213
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_14.self_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
214
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_19.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
215
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_17.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
216
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_17.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
217
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_0.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
218
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_12.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
219
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_0.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
220
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_19.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
221
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_10.self_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
222
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_18.self_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
223
+ checkpoints/llm_large_x3047_c1860k/target.encoder.layers_5.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
224
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_12.self_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
225
+ checkpoints/llm_large_x3047_c1860k/target.encoder.layers_5.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
226
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_13.self_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
227
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_12.self_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
228
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_18.self_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
229
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_10.self_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
230
+ checkpoints/llm_large_x3047_c1860k/target.encoder.layers_5.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
231
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_13.self_attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
232
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_19.self_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
233
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_19.self_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
234
+ checkpoints/llm_large_x3047_c1860k/target.encoder.layers_11.attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
235
+ checkpoints/llm_large_x3047_c1860k/target.encoder.layers_5.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
236
+ checkpoints/llm_large_x3047_c1860k/target.encoder.layers_2.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
237
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_12.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
238
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_12.encoder_decoder_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
239
+ checkpoints/llm_large_x3047_c1860k/target.encoder.layers_15.attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
240
+ checkpoints/llm_large_x3047_c1860k/target.encoder.layers_2.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
241
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_3.encoder_decoder_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
242
+ checkpoints/llm_large_x3047_c1860k/target.encoder.layers_15.attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
243
+ savedmodels/ssv2_48k_stereo/quantizer/variables/variables.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
244
+ savedmodels/ssv2_48k_stereo/decoder/variables/variables.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
245
+ checkpoints/llm_large_x3047_c1860k/target.encoder.layers_9.attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
246
+ checkpoints/llm_large_x3047_c1860k/target.encoder.layers_11.attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
247
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_3.encoder_decoder_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
248
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_4.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
249
+ checkpoints/llm_large_x3047_c1860k/target.encoder.layers_17.attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
250
+ checkpoints/llm_large_x3047_c1860k/target.encoder.layers_9.attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
251
+ checkpoints/llm_large_x3047_c1860k/target.encoder.layers_17.attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
252
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_17.self_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
253
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_4.encoder_decoder_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
254
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
255
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
256
+ checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_12.self_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_0.pre_self_attention_layer_norm.scale.v/0 ADDED
Binary file (3.72 kB). View file
 
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_16.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_16.pre_mlp_layer_norm.scale.v/0 ADDED
Binary file (3.7 kB). View file
 
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_19.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_19.pre_cross_attention_layer_norm.scale.v/0 ADDED
Binary file (3.73 kB). View file
 
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_19.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_19.pre_mlp_layer_norm.scale.v/0 ADDED
Binary file (3.69 kB). View file
 
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_3.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_3.pre_mlp_layer_norm.scale.v/0 ADDED
Binary file (3.81 kB). View file
 
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_5.pre_cross_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_5.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_5.pre_mlp_layer_norm.scale.v/0 ADDED
Binary file (3.8 kB). View file
 
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_5.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_5.pre_self_attention_layer_norm.scale.v/0 ADDED
Binary file (3.8 kB). View file
 
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_6.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_7.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_7.pre_mlp_layer_norm.scale.v/0 ADDED
Binary file (3.78 kB). View file
 
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_16.pre_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_16.pre_attention_layer_norm.scale.v/0 ADDED
Binary file (3.75 kB). View file
 
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_2.pre_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_2.pre_attention_layer_norm.scale.v/0 ADDED
Binary file (3.73 kB). View file
 
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_21.pre_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_21.pre_attention_layer_norm.scale.v/0 ADDED
Binary file (3.72 kB). View file
 
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_4.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_4.pre_mlp_layer_norm.scale.v/0 ADDED
Binary file (3.76 kB). View file
 
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_6.pre_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_6.pre_mlp_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_6.pre_mlp_layer_norm.scale.v/0 ADDED
Binary file (3.72 kB). View file
 
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_9.pre_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_9.pre_attention_layer_norm.scale.v/0 ADDED
Binary file (3.76 kB). View file
 
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_0.mlp.wi_0.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3bc9789afff3d109c8cd02dfa39a113e5bb9dafab1869459850c38a3f85014eb
3
+ size 5375616
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_0.mlp.wi_0.kernel/0.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44613ec7f32c4b91b2441f34d7364f5f4ad890f427b83316432010098afcbc0c
3
+ size 5376204
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.pre_self_attention_layer_norm.scale/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.pre_self_attention_layer_norm.scale/0 ADDED
Binary file (3.63 kB). View file
 
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.self_attention.key.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a835b892ec73db060b5466c44cf49ba7deef452f8529cf7345e3bb469ae563d3
3
+ size 1951644
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.self_attention.key.kernel/0.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4246e371181134272185aabf24e806e1b4e5d6106d50e1607062e664a210752
3
+ size 1953408
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.mlp.wi_1.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024,1408],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024,2816],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.mlp.wi_1.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67f195eee82d215b60f7b036c8378d4485e16687df1f0fb44271356d98206e3f
3
+ size 5372139
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.mlp.wi_1.kernel/0.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d176b83c8a1727f1fc43be6dd2e0ecaf0ed82f6fe794d2fc4b30f37ee4f99240
3
+ size 5373342
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.key.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1702ddae7bc9f4d72f69ec33f7e4a81fcc65eac67de6a28d50299abb441d4270
3
+ size 1952734
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.key.kernel/0.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e7d24122091a487d923e2ea11abb3ef33a00e5b59b625102d5f00d3ec0e21da
3
+ size 1952226
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.query.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3bea8f1491535a5521aaaec8be459664fc002b2b0571d11c9bed8451cbb103ec
3
+ size 1955079
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.query.kernel/0.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46f820e55ca19a091ddaab6b54a6c91be76638edcda51bbb94bbb6047934299b
3
+ size 1954809
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.value.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024,1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_0.pre_cross_attention_layer_norm.scale/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_0.pre_cross_attention_layer_norm.scale/0 ADDED
Binary file (3.83 kB). View file
 
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_1.encoder_decoder_attention.key.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9504e6066f24c4f7a931fc42fb2e9cde65c486bc210467aef7fb02b7728701aa
3
+ size 1953829
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_1.encoder_decoder_attention.key.kernel/0.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8acfb3777db8e2713fc1fc8a8fd0453c2c2bbb04242ec0d30f98ab67051bf157
3
+ size 1953555