Add files using upload-large-folder tool
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +103 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_0.pre_self_attention_layer_norm.scale.v/0 +0 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_16.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_16.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_19.pre_cross_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_19.pre_cross_attention_layer_norm.scale.v/0 +0 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_19.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_19.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_3.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_3.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_5.pre_cross_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_5.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_5.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_5.pre_self_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_5.pre_self_attention_layer_norm.scale.v/0 +0 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_6.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_7.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_7.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_16.pre_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_16.pre_attention_layer_norm.scale.v/0 +0 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_2.pre_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_2.pre_attention_layer_norm.scale.v/0 +0 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_21.pre_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_21.pre_attention_layer_norm.scale.v/0 +0 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_4.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_4.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_6.pre_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_6.pre_mlp_layer_norm.scale.v/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_6.pre_mlp_layer_norm.scale.v/0 +0 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_9.pre_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_9.pre_attention_layer_norm.scale.v/0 +0 -0
- checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_0.mlp.wi_0.kernel/0.0 +3 -0
- checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_0.mlp.wi_0.kernel/0.1 +3 -0
- checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.pre_self_attention_layer_norm.scale/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.pre_self_attention_layer_norm.scale/0 +0 -0
- checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.self_attention.key.kernel/0.0 +3 -0
- checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.self_attention.key.kernel/0.1 +3 -0
- checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.mlp.wi_1.kernel/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.mlp.wi_1.kernel/0.0 +3 -0
- checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.mlp.wi_1.kernel/0.1 +3 -0
- checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.key.kernel/0.0 +3 -0
- checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.key.kernel/0.1 +3 -0
- checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.query.kernel/0.0 +3 -0
- checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.query.kernel/0.1 +3 -0
- checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.value.kernel/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_0.pre_cross_attention_layer_norm.scale/.zarray +1 -0
- checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_0.pre_cross_attention_layer_norm.scale/0 +0 -0
- checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_1.encoder_decoder_attention.key.kernel/0.0 +3 -0
- checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_1.encoder_decoder_attention.key.kernel/0.1 +3 -0
.gitattributes
CHANGED
|
@@ -151,3 +151,106 @@ savedmodels/ssv2_48k_stereo/encoder/variables/variables.data-00000-of-00001 filt
|
|
| 151 |
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_8.attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 152 |
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_2.encoder_decoder_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 153 |
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_10.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 151 |
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_8.attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 152 |
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_2.encoder_decoder_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 153 |
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_10.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 154 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_10.encoder_decoder_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 155 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_19.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 156 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_19.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 157 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_12.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 158 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_8.attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 159 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_2.encoder_decoder_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 160 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.self_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 161 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_6.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 162 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.self_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 163 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_6.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 164 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_10.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 165 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_10.attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 166 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_3.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 167 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_10.attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 168 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_10.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 169 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_14.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 170 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_9.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 171 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 172 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_12.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 173 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_12.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 174 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_3.self_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 175 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_3.self_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 176 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_6.attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 177 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_1.encoder_decoder_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 178 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_1.encoder_decoder_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 179 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_7.encoder_decoder_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 180 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_3.encoder_decoder_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 181 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_7.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 182 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 183 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 184 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 185 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_6.attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 186 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_13.encoder_decoder_attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 187 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_9.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 188 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_4.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 189 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_1.attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 190 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_13.encoder_decoder_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 191 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_8.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 192 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_13.self_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 193 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_13.self_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 194 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_1.attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 195 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_9.attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 196 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_20.attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 197 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_9.attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 198 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_8.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 199 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_20.attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 200 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_4.self_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 201 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_4.self_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 202 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_1.encoder_decoder_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 203 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_1.encoder_decoder_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 204 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_11.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 205 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_11.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 206 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_4.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 207 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_12.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 208 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_17.encoder_decoder_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 209 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_7.self_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 210 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_17.encoder_decoder_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 211 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_7.self_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 212 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_14.self_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 213 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_14.self_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 214 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_19.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 215 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_17.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 216 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_17.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 217 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_0.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 218 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_12.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 219 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_0.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 220 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_19.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 221 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_10.self_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 222 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_18.self_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 223 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_5.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 224 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_12.self_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 225 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_5.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 226 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_13.self_attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 227 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_12.self_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 228 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_18.self_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 229 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_10.self_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 230 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_5.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 231 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_13.self_attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 232 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_19.self_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 233 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_19.self_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 234 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_11.attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 235 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_5.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 236 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_2.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 237 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_12.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 238 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_12.encoder_decoder_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 239 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_15.attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 240 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_2.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 241 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_3.encoder_decoder_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 242 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_15.attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 243 |
+
savedmodels/ssv2_48k_stereo/quantizer/variables/variables.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
|
| 244 |
+
savedmodels/ssv2_48k_stereo/decoder/variables/variables.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
|
| 245 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_9.attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 246 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_11.attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 247 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_3.encoder_decoder_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 248 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_4.encoder_decoder_attention.out.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 249 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_17.attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 250 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_9.attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 251 |
+
checkpoints/llm_large_x3047_c1860k/target.encoder.layers_17.attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 252 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_17.self_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 253 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_4.encoder_decoder_attention.out.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
| 254 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
| 255 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
| 256 |
+
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_12.self_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_0.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_0.pre_self_attention_layer_norm.scale.v/0
ADDED
|
Binary file (3.72 kB). View file
|
|
|
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_16.pre_mlp_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_16.pre_mlp_layer_norm.scale.v/0
ADDED
|
Binary file (3.7 kB). View file
|
|
|
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_19.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_19.pre_cross_attention_layer_norm.scale.v/0
ADDED
|
Binary file (3.73 kB). View file
|
|
|
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_19.pre_mlp_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_19.pre_mlp_layer_norm.scale.v/0
ADDED
|
Binary file (3.69 kB). View file
|
|
|
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_3.pre_mlp_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_3.pre_mlp_layer_norm.scale.v/0
ADDED
|
Binary file (3.81 kB). View file
|
|
|
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_5.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_5.pre_mlp_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_5.pre_mlp_layer_norm.scale.v/0
ADDED
|
Binary file (3.8 kB). View file
|
|
|
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_5.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_5.pre_self_attention_layer_norm.scale.v/0
ADDED
|
Binary file (3.8 kB). View file
|
|
|
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_6.pre_mlp_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_7.pre_mlp_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/state.param_states.decoder.decoder.temporal_decoder.layers_7.pre_mlp_layer_norm.scale.v/0
ADDED
|
Binary file (3.78 kB). View file
|
|
|
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_16.pre_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_16.pre_attention_layer_norm.scale.v/0
ADDED
|
Binary file (3.75 kB). View file
|
|
|
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_2.pre_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_2.pre_attention_layer_norm.scale.v/0
ADDED
|
Binary file (3.73 kB). View file
|
|
|
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_21.pre_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_21.pre_attention_layer_norm.scale.v/0
ADDED
|
Binary file (3.72 kB). View file
|
|
|
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_4.pre_mlp_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_4.pre_mlp_layer_norm.scale.v/0
ADDED
|
Binary file (3.76 kB). View file
|
|
|
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_6.pre_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_6.pre_mlp_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_6.pre_mlp_layer_norm.scale.v/0
ADDED
|
Binary file (3.72 kB). View file
|
|
|
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_9.pre_attention_layer_norm.scale.v/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/state.param_states.encoder.layers_9.pre_attention_layer_norm.scale.v/0
ADDED
|
Binary file (3.76 kB). View file
|
|
|
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_0.mlp.wi_0.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3bc9789afff3d109c8cd02dfa39a113e5bb9dafab1869459850c38a3f85014eb
|
| 3 |
+
size 5375616
|
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_0.mlp.wi_0.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:44613ec7f32c4b91b2441f34d7364f5f4ad890f427b83316432010098afcbc0c
|
| 3 |
+
size 5376204
|
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.pre_self_attention_layer_norm.scale/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.pre_self_attention_layer_norm.scale/0
ADDED
|
Binary file (3.63 kB). View file
|
|
|
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.self_attention.key.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a835b892ec73db060b5466c44cf49ba7deef452f8529cf7345e3bb469ae563d3
|
| 3 |
+
size 1951644
|
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_2.self_attention.key.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e4246e371181134272185aabf24e806e1b4e5d6106d50e1607062e664a210752
|
| 3 |
+
size 1953408
|
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.mlp.wi_1.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1024,1408],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024,2816],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.mlp.wi_1.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:67f195eee82d215b60f7b036c8378d4485e16687df1f0fb44271356d98206e3f
|
| 3 |
+
size 5372139
|
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.mlp.wi_1.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d176b83c8a1727f1fc43be6dd2e0ecaf0ed82f6fe794d2fc4b30f37ee4f99240
|
| 3 |
+
size 5373342
|
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.key.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1702ddae7bc9f4d72f69ec33f7e4a81fcc65eac67de6a28d50299abb441d4270
|
| 3 |
+
size 1952734
|
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.key.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7e7d24122091a487d923e2ea11abb3ef33a00e5b59b625102d5f00d3ec0e21da
|
| 3 |
+
size 1952226
|
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.query.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3bea8f1491535a5521aaaec8be459664fc002b2b0571d11c9bed8451cbb103ec
|
| 3 |
+
size 1955079
|
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.query.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:46f820e55ca19a091ddaab6b54a6c91be76638edcda51bbb94bbb6047934299b
|
| 3 |
+
size 1954809
|
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.depth_decoder.depth_layers_3.self_attention.value.kernel/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1024,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024,1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_0.pre_cross_attention_layer_norm.scale/.zarray
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"chunks":[1024],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[1024],"zarr_format":2}
|
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_0.pre_cross_attention_layer_norm.scale/0
ADDED
|
Binary file (3.83 kB). View file
|
|
|
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_1.encoder_decoder_attention.key.kernel/0.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9504e6066f24c4f7a931fc42fb2e9cde65c486bc210467aef7fb02b7728701aa
|
| 3 |
+
size 1953829
|
checkpoints/llm_large_x3047_c1860k/target.decoder.decoder.temporal_decoder.layers_1.encoder_decoder_attention.key.kernel/0.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8acfb3777db8e2713fc1fc8a8fd0453c2c2bbb04242ec0d30f98ab67051bf157
|
| 3 |
+
size 1953555
|