Add files using upload-large-folder tool
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +103 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_0.pre_self_attention_layer_norm.scale.v/0 +0 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_16.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_16.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_19.pre_cross_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_19.pre_cross_attention_layer_norm.scale.v/0 +0 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_19.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_19.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_3.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_3.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_5.pre_cross_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_5.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_5.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_5.pre_self_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_5.pre_self_attention_layer_norm.scale.v/0 +0 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_6.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_7.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_7.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_16.pre_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_16.pre_attention_layer_norm.scale.v/0 +0 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_2.pre_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_2.pre_attention_layer_norm.scale.v/0 +0 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_21.pre_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_21.pre_attention_layer_norm.scale.v/0 +0 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_4.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_4.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_6.pre_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_6.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_6.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_9.pre_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_9.pre_attention_layer_norm.scale.v/0 +0 -0
- checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_0.mlp.wi_0.kernel/0.0 +3 -0
- checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_0.mlp.wi_0.kernel/0.1 +3 -0
- checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.pre_self_attention_layer_norm.scale/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.pre_self_attention_layer_norm.scale/0 +0 -0
- checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.self_attention.key.kernel/0.0 +3 -0
- checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.self_attention.key.kernel/0.1 +3 -0
- checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.mlp.wi_1.kernel/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.mlp.wi_1.kernel/0.0 +3 -0
- checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.mlp.wi_1.kernel/0.1 +3 -0
- checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.key.kernel/0.0 +3 -0
- checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.key.kernel/0.1 +3 -0
- checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.query.kernel/0.0 +3 -0
- checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.query.kernel/0.1 +3 -0
- checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.value.kernel/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_0.pre_cross_attention_layer_norm.scale/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_0.pre_cross_attention_layer_norm.scale/0 +0 -0
- checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_1.encoder_decoder_attention.key.kernel/0.0 +3 -0
- checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_1.encoder_decoder_attention.key.kernel/0.1 +3 -0
.gitattributes
CHANGED
@@ -151,3 +151,106 @@ savedmodels/ssv2_48k_stereo/encoder/variables/variables.data-00000-of-00001 filt
|
|
151 |
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_8.attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
152 |
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_2.encoder_decoder_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
153 |
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_10.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
151 |
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_8.attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
152 |
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_2.encoder_decoder_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
153 |
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_10.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
154 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_10.encoder_decoder_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
155 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_19.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
156 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_19.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
157 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_12.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
158 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_8.attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
159 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_2.encoder_decoder_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
160 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.self_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
161 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_6.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
162 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.self_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
163 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_6.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
164 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_10.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
165 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_10.attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
166 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_3.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
167 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_10.attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
168 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_10.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
169 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_14.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
170 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_9.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
171 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
172 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_12.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
173 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_12.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
174 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_3.self_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
175 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_3.self_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
176 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_6.attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
177 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_1.encoder_decoder_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
178 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_1.encoder_decoder_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
179 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_7.encoder_decoder_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
180 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_3.encoder_decoder_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
181 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_7.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
182 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
183 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
184 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
185 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_6.attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
186 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_13.encoder_decoder_attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
187 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_9.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
188 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_4.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
189 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_1.attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
190 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_13.encoder_decoder_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
191 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_8.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
192 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_13.self_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
193 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_13.self_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
194 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_1.attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
195 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_9.attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
196 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_20.attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
197 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_9.attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
198 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_8.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
199 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_20.attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
200 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_4.self_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
201 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_4.self_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
202 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_1.encoder_decoder_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
203 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_1.encoder_decoder_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
204 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_11.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
205 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_11.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
206 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_4.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
207 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_12.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
208 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_17.encoder_decoder_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
209 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_7.self_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
210 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_17.encoder_decoder_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
211 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_7.self_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
212 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_14.self_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
213 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_14.self_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
214 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_19.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
215 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_17.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
216 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_17.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
217 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_0.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
218 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_12.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
219 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_0.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
220 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_19.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
221 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_10.self_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
222 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_18.self_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
223 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_5.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
224 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_12.self_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
225 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_5.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
226 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_13.self_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
227 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_12.self_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
228 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_18.self_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
229 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_10.self_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
230 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_5.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
231 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_13.self_attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
232 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_19.self_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
233 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_19.self_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
234 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_11.attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
235 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_5.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
236 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_2.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
237 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_12.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
238 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_12.encoder_decoder_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
239 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_15.attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
240 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_2.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
241 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_3.encoder_decoder_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
242 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_15.attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
243 |
+
savedmodels/ssv2_48k_stereo/quantizer/variables/variables.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
|
244 |
+
savedmodels/ssv2_48k_stereo/decoder/variables/variables.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
|
245 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_9.attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
246 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_11.attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
247 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_3.encoder_decoder_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
248 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_4.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
249 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_17.attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
250 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_9.attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
251 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_17.attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
252 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_17.self_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
253 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_4.encoder_decoder_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
254 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
255 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
256 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_12.self_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_0.pre_self_attention_layer_norm.scale.v/0
ADDED
Binary file (3.72 kB). View file
|
|
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_16.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_16.pre_mlp_layer_norm.scale.v/0
ADDED
Binary file (3.7 kB). View file
|
|
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_19.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_19.pre_cross_attention_layer_norm.scale.v/0
ADDED
Binary file (3.73 kB). View file
|
|
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_19.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_19.pre_mlp_layer_norm.scale.v/0
ADDED
Binary file (3.69 kB). View file
|
|
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_3.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_3.pre_mlp_layer_norm.scale.v/0
ADDED
Binary file (3.81 kB). View file
|
|
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_5.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_5.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_5.pre_mlp_layer_norm.scale.v/0
ADDED
Binary file (3.8 kB). View file
|
|
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_5.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_5.pre_self_attention_layer_norm.scale.v/0
ADDED
Binary file (3.8 kB). View file
|
|
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_6.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_7.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_7.pre_mlp_layer_norm.scale.v/0
ADDED
Binary file (3.78 kB). View file
|
|
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_16.pre_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_16.pre_attention_layer_norm.scale.v/0
ADDED
Binary file (3.75 kB). View file
|
|
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_2.pre_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_2.pre_attention_layer_norm.scale.v/0
ADDED
Binary file (3.73 kB). View file
|
|
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_21.pre_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_21.pre_attention_layer_norm.scale.v/0
ADDED
Binary file (3.72 kB). View file
|
|
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_4.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_4.pre_mlp_layer_norm.scale.v/0
ADDED
Binary file (3.76 kB). View file
|
|
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_6.pre_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_6.pre_mlp_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_6.pre_mlp_layer_norm.scale.v/0
ADDED
Binary file (3.72 kB). View file
|
|
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_9.pre_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_9.pre_attention_layer_norm.scale.v/0
ADDED
Binary file (3.76 kB). View file
|
|
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_0.mlp.wi_0.kernel/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3bc9789afff3d109c8cd02dfa39a113e5bb9dafab1869459850c38a3f85014eb
|
3 |
+
size 5375616
|
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_0.mlp.wi_0.kernel/0.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:44613ec7f32c4b91b2441f34d7364f5f4ad890f427b83316432010098afcbc0c
|
3 |
+
size 5376204
|
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.pre_self_attention_layer_norm.scale/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.pre_self_attention_layer_norm.scale/0
ADDED
Binary file (3.63 kB). View file
|
|
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.self_attention.key.kernel/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a835b892ec73db060b5466c44cf49ba7deef452f8529cf7345e3bb469ae563d3
|
3 |
+
size 1951644
|
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.self_attention.key.kernel/0.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e4246e371181134272185aabf24e806e1b4e5d6106d50e1607062e664a210752
|
3 |
+
size 1953408
|
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.mlp.wi_1.kernel/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1024,1408],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024,2816],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.mlp.wi_1.kernel/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67f195eee82d215b60f7b036c8378d4485e16687df1f0fb44271356d98206e3f
|
3 |
+
size 5372139
|
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.mlp.wi_1.kernel/0.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d176b83c8a1727f1fc43be6dd2e0ecaf0ed82f6fe794d2fc4b30f37ee4f99240
|
3 |
+
size 5373342
|
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.key.kernel/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1702ddae7bc9f4d72f69ec33f7e4a81fcc65eac67de6a28d50299abb441d4270
|
3 |
+
size 1952734
|
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.key.kernel/0.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7e7d24122091a487d923e2ea11abb3ef33a00e5b59b625102d5f00d3ec0e21da
|
3 |
+
size 1952226
|
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.query.kernel/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3bea8f1491535a5521aaaec8be459664fc002b2b0571d11c9bed8451cbb103ec
|
3 |
+
size 1955079
|
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.query.kernel/0.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:46f820e55ca19a091ddaab6b54a6c91be76638edcda51bbb94bbb6047934299b
|
3 |
+
size 1954809
|
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.value.kernel/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1024,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024,1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_0.pre_cross_attention_layer_norm.scale/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_0.pre_cross_attention_layer_norm.scale/0
ADDED
Binary file (3.83 kB). View file
|
|
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_1.encoder_decoder_attention.key.kernel/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9504e6066f24c4f7a931fc42fb2e9cde65c486bc210467aef7fb02b7728701aa
|
3 |
+
size 1953829
|
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_1.encoder_decoder_attention.key.kernel/0.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8acfb3777db8e2713fc1fc8a8fd0453c2c2bbb04242ec0d30f98ab67051bf157
|
3 |
+
size 1953555
|