Commit
·
0b42be6
1
Parent(s):
02a5523
Upload part 62
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +45 -0
- checkpoint_1007000/state.param_states.decoder.layers_11.pre_self_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_11.pre_self_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.decoder.layers_15.pre_cross_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_15.pre_cross_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/.zarray.__tmp12261106114141997915.~1663960300599472~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/.zarray.__tmp16218328866158248878.~1663960300471383~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/.zarray.__tmp1685086716695868863.~1663960300685126~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/.zarray.__tmp16856896936629569167.~1663960300547251~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/.zarray.__tmp4116509858351261080.~1663960300775157~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/.zarray.__tmp8507979600702850460.~1663960300610909~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/.zarray.__tmp9907378130920738197.~1663960301068073~ +1 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_7.pre_self_attention_layer_norm.scale/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_7.pre_self_attention_layer_norm.scale/0 +0 -0
- checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/.zarray +1 -0
- checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/.zarray.__tmp10178358361871653998.~1663960300983803~ +1 -0
- checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/.zarray.__tmp10255521947259571973.~1663960300986785~ +1 -0
- checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/.zarray.__tmp11025281758045122489.~1663960300685555~ +1 -0
- checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/.zarray.__tmp13376935660037902763.~1663960300776626~ +1 -0
- checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/.zarray.__tmp15135451771888956814.~1663960300940448~ +1 -0
- checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/.zarray.__tmp15357963553081218798.~1663960300599634~ +1 -0
- checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/.zarray.__tmp2620812036374037652.~1663960300941903~ +1 -0
- checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/0.0 +3 -0
- checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/0.2 +3 -0
- checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/0.3 +3 -0
- checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/0.4 +3 -0
- checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/0.5 +3 -0
- checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/0.6 +3 -0
- checkpoint_1007000/target.encoder.layers_21.attention.value.kernel/.zarray +1 -0
- checkpoint_1007000/target.encoder.layers_21.attention.value.kernel/.zarray.__tmp12114443691839504661.~1663960300778860~ +1 -0
- checkpoint_1007000/target.encoder.layers_21.attention.value.kernel/.zarray.__tmp16105360201878462234.~1663960300421302~ +1 -0
- checkpoint_1007000/target.encoder.layers_21.attention.value.kernel/.zarray.__tmp16729537588758869116.~1663960300548059~ +1 -0
- checkpoint_1007000/target.encoder.layers_21.attention.value.kernel/.zarray.__tmp16981634325977950481.~1663960300863342~ +1 -0
- checkpoint_1007000/target.encoder.layers_21.attention.value.kernel/.zarray.__tmp18331493733337094116.~1663960300886062~ +1 -0
- checkpoint_1007000/target.encoder.layers_21.attention.value.kernel/.zarray.__tmp3769154678623319437.~1663960300686995~ +1 -0
- checkpoint_1007000/target.encoder.layers_21.attention.value.kernel/.zarray.__tmp9580632581366964217.~1663960300626625~ +1 -0
- checkpoint_1007000/target.encoder.layers_21.attention.value.kernel/0.0 +3 -0
- checkpoint_1007000/target.encoder.layers_21.attention.value.kernel/0.1 +3 -0
- checkpoint_1007000/target.encoder.layers_21.attention.value.kernel/0.2 +3 -0
- checkpoint_1007000/target.encoder.layers_21.attention.value.kernel/0.3 +3 -0
- checkpoint_1007000/target.encoder.layers_21.attention.value.kernel/0.4 +3 -0
.gitattributes
CHANGED
@@ -3101,3 +3101,48 @@ checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/0.2 filter=lfs diff=l
|
|
3101 |
checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
3102 |
checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
3103 |
checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
3101 |
checkpoint_1007000/target.decoder.layers_1.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
3102 |
checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
3103 |
checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
3104 |
+
checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
3105 |
+
checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
3106 |
+
checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
3107 |
+
checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
3108 |
+
checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
3109 |
+
checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
3110 |
+
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
3111 |
+
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
3112 |
+
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
3113 |
+
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
3114 |
+
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
3115 |
+
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
3116 |
+
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
3117 |
+
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
3118 |
+
checkpoint_1007000/target.encoder.layers_23.attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
3119 |
+
checkpoint_1007000/target.encoder.layers_23.attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
3120 |
+
checkpoint_1007000/target.encoder.layers_23.attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
3121 |
+
checkpoint_1007000/target.encoder.layers_23.attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
3122 |
+
checkpoint_1007000/target.encoder.layers_23.attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
3123 |
+
checkpoint_1007000/target.encoder.layers_23.attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
3124 |
+
checkpoint_1007000/target.encoder.layers_23.attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
3125 |
+
checkpoint_1007000/target.encoder.layers_23.attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
3126 |
+
checkpoint_1007000/target.encoder.layers_21.attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
3127 |
+
checkpoint_1007000/target.encoder.layers_21.attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
3128 |
+
checkpoint_1007000/target.encoder.layers_21.attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
3129 |
+
checkpoint_1007000/target.encoder.layers_21.attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
3130 |
+
checkpoint_1007000/target.encoder.layers_21.attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
3131 |
+
checkpoint_1007000/target.encoder.layers_21.attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
3132 |
+
checkpoint_1007000/target.encoder.layers_21.attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
3133 |
+
checkpoint_1007000/target.encoder.layers_21.attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
3134 |
+
checkpoint_1007000/target.encoder.layers_7.attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
3135 |
+
checkpoint_1007000/target.encoder.layers_7.attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
3136 |
+
checkpoint_1007000/target.encoder.layers_7.attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
3137 |
+
checkpoint_1007000/target.encoder.layers_7.attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
3138 |
+
checkpoint_1007000/target.encoder.layers_7.attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
3139 |
+
checkpoint_1007000/target.encoder.layers_7.attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
3140 |
+
checkpoint_1007000/target.encoder.layers_7.attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
3141 |
+
checkpoint_1007000/target.encoder.layers_7.attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
3142 |
+
checkpoint_1007000/target.encoder.layers_3.attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
3143 |
+
checkpoint_1007000/target.encoder.layers_3.attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
3144 |
+
checkpoint_1007000/target.encoder.layers_3.attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
3145 |
+
checkpoint_1007000/target.encoder.layers_3.attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
3146 |
+
checkpoint_1007000/target.encoder.layers_3.attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
3147 |
+
checkpoint_1007000/target.encoder.layers_3.attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
3148 |
+
checkpoint_1007000/target.encoder.layers_3.attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/state.param_states.decoder.layers_11.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_11.pre_self_attention_layer_norm.scale.v/0
ADDED
Binary file (15 kB). View file
|
|
checkpoint_1007000/state.param_states.decoder.layers_15.pre_cross_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_15.pre_cross_attention_layer_norm.scale.v/0
ADDED
Binary file (14.8 kB). View file
|
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/.zarray.__tmp12261106114141997915.~1663960300599472~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/.zarray.__tmp16218328866158248878.~1663960300471383~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/.zarray.__tmp1685086716695868863.~1663960300685126~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/.zarray.__tmp16856896936629569167.~1663960300547251~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/.zarray.__tmp4116509858351261080.~1663960300775157~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/.zarray.__tmp8507979600702850460.~1663960300610909~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/.zarray.__tmp9907378130920738197.~1663960301068073~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6e2ee0c292add1a41314639b09db9d49e5e887be12375de666e2268dc83e0f63
|
3 |
+
size 7812161
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/0.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0affdbc0370e7682479e79454f9e346cf85c6562a1d574b3d44dff2cee23bc18
|
3 |
+
size 7812215
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/0.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:869f59da84aa74bb20f6289bd07889e142476626ee3e24e9b0505ecbe27b69d9
|
3 |
+
size 7812155
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/0.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bb2f98c4c7d1b2dd7a668af971606e86ba10efd8d421e033d61941f5374a5c98
|
3 |
+
size 7816106
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/0.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb0aece5e77ae4a6cee2f55a3daa6aae636bf61c4b4d24c6abccd85eb49953fb
|
3 |
+
size 7821683
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/0.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:407eca64d9913122c353e7158479a51389bf695b2402abb4ac1cf3632086943c
|
3 |
+
size 7818042
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/0.6
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fe9567e74ab9a4b262670e7f63b4b1ffc3585087733236672565471f53dfdcdc
|
3 |
+
size 7813669
|
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.key.kernel/0.7
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a454d8f6c006ca5c9628ce782aa90dd9e70d21711189abc1632ed1d10ae4a6d8
|
3 |
+
size 7812556
|
checkpoint_1007000/target.decoder.layers_7.pre_self_attention_layer_norm.scale/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_7.pre_self_attention_layer_norm.scale/0
ADDED
Binary file (15 kB). View file
|
|
checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/.zarray.__tmp10178358361871653998.~1663960300983803~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/.zarray.__tmp10255521947259571973.~1663960300986785~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/.zarray.__tmp11025281758045122489.~1663960300685555~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/.zarray.__tmp13376935660037902763.~1663960300776626~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/.zarray.__tmp15135451771888956814.~1663960300940448~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/.zarray.__tmp15357963553081218798.~1663960300599634~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/.zarray.__tmp2620812036374037652.~1663960300941903~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:000632d2eb97d11d93568e989a7d0c9d5483c794959bc3b51442333a8311335a
|
3 |
+
size 19545713
|
checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/0.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6e1bdecd1fff11d6564b5b192aa646c8dc0be1bb84beaf64416893d93dd21a22
|
3 |
+
size 19544666
|
checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/0.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1000a65235eeb651f473bd1ee43f905a52fc8e544f0b1611459936ecda8cc5c6
|
3 |
+
size 19544273
|
checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/0.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:33322390952fb0c3c8aebfc2d14eaeee0d4f61b9c2cfa158411ec4bf29ff8381
|
3 |
+
size 19544188
|
checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/0.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c82e9aa542962420dea96c867350fd4fcfec4d3e2fe51e8442d72b49e3bbad0a
|
3 |
+
size 19544288
|
checkpoint_1007000/target.encoder.layers_11.mlp.wi_1.kernel/0.6
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2bfa04fafd050abe7623c5d080e35bb401c882c571f1ee91599e311f5afd1f04
|
3 |
+
size 19544395
|
checkpoint_1007000/target.encoder.layers_21.attention.value.kernel/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_21.attention.value.kernel/.zarray.__tmp12114443691839504661.~1663960300778860~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_21.attention.value.kernel/.zarray.__tmp16105360201878462234.~1663960300421302~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_21.attention.value.kernel/.zarray.__tmp16729537588758869116.~1663960300548059~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_21.attention.value.kernel/.zarray.__tmp16981634325977950481.~1663960300863342~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_21.attention.value.kernel/.zarray.__tmp18331493733337094116.~1663960300886062~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_21.attention.value.kernel/.zarray.__tmp3769154678623319437.~1663960300686995~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_21.attention.value.kernel/.zarray.__tmp9580632581366964217.~1663960300626625~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.encoder.layers_21.attention.value.kernel/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:154608b2cd0a552099e190a323d4fb70204134f79b2d1b7cee38d5587e253a81
|
3 |
+
size 7823748
|
checkpoint_1007000/target.encoder.layers_21.attention.value.kernel/0.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d545d7966b12ee15f510d160e4d7ac0c8d45e8147792fe4f8c7effe20146db12
|
3 |
+
size 7823373
|
checkpoint_1007000/target.encoder.layers_21.attention.value.kernel/0.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:634d3977388eb205203183170f581ca6b227aae1ca10c3aa566c2effcc26457e
|
3 |
+
size 7822576
|
checkpoint_1007000/target.encoder.layers_21.attention.value.kernel/0.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cbe13e0367b70c1263a0e03ce21bbc251b7b48b8c52dc2ff3b7185d22b6af31c
|
3 |
+
size 7822117
|
checkpoint_1007000/target.encoder.layers_21.attention.value.kernel/0.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a0ed60f4fcde32a47f695dfb9c9a49f7a08ff3dafa3d7c8adc564e197b19d9d7
|
3 |
+
size 7822223
|