Commit
·
d38c4eb
1
Parent(s):
a349b9b
Upload part 48
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +45 -0
- checkpoint_1007000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/state.param_states.encoder.layers_8.pre_attention_layer_norm.scale.v/.zarray +1 -0
- checkpoint_1007000/state.param_states.encoder.layers_8.pre_attention_layer_norm.scale.v/0 +0 -0
- checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/.zarray.__tmp11388929281291012784.~1663960300777529~ +1 -0
- checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/.zarray.__tmp15408944531962108593.~1663960300425676~ +1 -0
- checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/.zarray.__tmp3478453131278811786.~1663960300016402~ +1 -0
- checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/.zarray.__tmp4231906932503099425.~1663960300018110~ +1 -0
- checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/.zarray.__tmp6692212168669761562.~1663960299927504~ +1 -0
- checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.7 +3 -0
- checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/.zarray.__tmp11221331478812435637.~1663960300865791~ +1 -0
- checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/.zarray.__tmp16906819682476284264.~1663960300865325~ +1 -0
- checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/.zarray.__tmp2270484310615939027.~1663960300546742~ +1 -0
- checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/.zarray.__tmp2349333016348064455.~1663960300827348~ +1 -0
- checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/.zarray.__tmp2361301302702635123.~1663960300601360~ +1 -0
- checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/.zarray.__tmp7291065410866952681.~1663960300385543~ +1 -0
- checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/.zarray.__tmp907707751639812339.~1663960300774042~ +1 -0
- checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_2.pre_self_attention_layer_norm.scale/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_2.pre_self_attention_layer_norm.scale/0 +0 -0
- checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/.zarray +1 -0
- checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/.zarray.__tmp10448794869755293873.~1663960300420703~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/.zarray.__tmp11106886688829216473.~1663960300685559~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/.zarray.__tmp12010709428620963921.~1663960301029038~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/.zarray.__tmp1320971340224479062.~1663960300779399~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/.zarray.__tmp13481401145456933929.~1663960300501314~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/.zarray.__tmp15793081268148901456.~1663960300827397~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/.zarray.__tmp1583414768807989616.~1663960300386596~ +1 -0
- checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.0 +3 -0
- checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.1 +3 -0
- checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.2 +3 -0
- checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.3 +3 -0
- checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.4 +3 -0
- checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.5 +3 -0
- checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.6 +3 -0
- checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.7 +3 -0
.gitattributes
CHANGED
@@ -2437,3 +2437,48 @@ checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.value.kerne
|
|
2437 |
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
2438 |
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
2439 |
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
2437 |
checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
2438 |
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
2439 |
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
2440 |
+
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2441 |
+
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
2442 |
+
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
2443 |
+
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
2444 |
+
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
2445 |
+
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
2446 |
+
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
2447 |
+
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
2448 |
+
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2449 |
+
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
2450 |
+
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
2451 |
+
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
2452 |
+
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
2453 |
+
checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
2454 |
+
checkpoint_1007000/target.decoder.layers_6.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
|
2455 |
+
checkpoint_1007000/target.decoder.layers_6.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
|
2456 |
+
checkpoint_1007000/target.decoder.layers_6.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
|
2457 |
+
checkpoint_1007000/target.decoder.layers_6.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2458 |
+
checkpoint_1007000/target.decoder.layers_6.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
|
2459 |
+
checkpoint_1007000/target.decoder.layers_6.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
|
2460 |
+
checkpoint_1007000/target.decoder.layers_6.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
|
2461 |
+
checkpoint_1007000/target.decoder.layers_6.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
|
2462 |
+
checkpoint_1007000/target.decoder.layers_8.encoder_decoder_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
2463 |
+
checkpoint_1007000/target.decoder.layers_8.encoder_decoder_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
2464 |
+
checkpoint_1007000/target.decoder.layers_8.encoder_decoder_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2465 |
+
checkpoint_1007000/target.decoder.layers_8.encoder_decoder_attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
2466 |
+
checkpoint_1007000/target.decoder.layers_8.encoder_decoder_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
2467 |
+
checkpoint_1007000/target.decoder.layers_8.encoder_decoder_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
2468 |
+
checkpoint_1007000/target.decoder.layers_8.encoder_decoder_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
2469 |
+
checkpoint_1007000/target.decoder.layers_8.encoder_decoder_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
2470 |
+
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
2471 |
+
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
2472 |
+
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2473 |
+
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
2474 |
+
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
2475 |
+
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
2476 |
+
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
2477 |
+
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
|
2478 |
+
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
|
2479 |
+
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
|
2480 |
+
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
|
2481 |
+
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
|
2482 |
+
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
|
2483 |
+
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
|
2484 |
+
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
|
checkpoint_1007000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/0
ADDED
Binary file (15.1 kB). View file
|
|
checkpoint_1007000/state.param_states.encoder.layers_8.pre_attention_layer_norm.scale.v/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/state.param_states.encoder.layers_8.pre_attention_layer_norm.scale.v/0
ADDED
Binary file (15.3 kB). View file
|
|
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/.zarray.__tmp11388929281291012784.~1663960300777529~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/.zarray.__tmp15408944531962108593.~1663960300425676~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/.zarray.__tmp3478453131278811786.~1663960300016402~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/.zarray.__tmp4231906932503099425.~1663960300018110~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/.zarray.__tmp6692212168669761562.~1663960299927504~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:16cc4b350c67bd3694d8eb55387534e65757ee94b2a0fd06258ea477366516e3
|
3 |
+
size 7804869
|
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ece3f9c4526f984bb2bb5032aec2f966452d669dfe09e12d6ffe079c5280ca12
|
3 |
+
size 7805609
|
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4e036c449283de0859089911166abae9a58e14244eadb91d6521952574aa3bf9
|
3 |
+
size 7805423
|
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6b3b5770b4739035ed38c025521445b2693c2d06fa8a3c84a0258700c43d7af7
|
3 |
+
size 7806437
|
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:657a6404a7fd95149b7e3a7510b078a35d96ddc3e7d8f262a5aa8e3a13e5134d
|
3 |
+
size 7807599
|
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.6
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9193945c79a1cf6525b20afe5981b9064314277fa627191c1d7778ccfab3db54
|
3 |
+
size 7808392
|
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.7
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:360aa9813f97cec8a1ca60195dd1e951db321550de918e2afe317674457873c1
|
3 |
+
size 7804791
|
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/.zarray.__tmp11221331478812435637.~1663960300865791~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/.zarray.__tmp16906819682476284264.~1663960300865325~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/.zarray.__tmp2270484310615939027.~1663960300546742~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/.zarray.__tmp2349333016348064455.~1663960300827348~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/.zarray.__tmp2361301302702635123.~1663960300601360~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/.zarray.__tmp7291065410866952681.~1663960300385543~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/.zarray.__tmp907707751639812339.~1663960300774042~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:346543e9bf86b3fbe70c72d5bcfdab2d60983e39eeba2cc37be18d8307c2e50f
|
3 |
+
size 7802759
|
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be34f87b406639029b849110121eb3bffa8e514dee521be86a913d3d8a92b403
|
3 |
+
size 7805389
|
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bfaa8e543e160a3c1899e6a46573cb50e82fc2d350258deddb207d7045608e5e
|
3 |
+
size 7803234
|
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:56ac3a34050e95d1d28af8dd265e9f5b3111a31269ab73da986cae39d0ec3731
|
3 |
+
size 7801647
|
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:564cca01fe48d062666bd188c1156c63ed34030aa73b8d877029f4a4ab108f76
|
3 |
+
size 7802842
|
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.6
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:689f566351326650526f38ccf494d86a272472893b6a554d6bf60d977ab7376b
|
3 |
+
size 7801624
|
checkpoint_1007000/target.decoder.layers_2.pre_self_attention_layer_norm.scale/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_2.pre_self_attention_layer_norm.scale/0
ADDED
Binary file (14.9 kB). View file
|
|
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/.zarray
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/.zarray.__tmp10448794869755293873.~1663960300420703~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/.zarray.__tmp11106886688829216473.~1663960300685559~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/.zarray.__tmp12010709428620963921.~1663960301029038~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/.zarray.__tmp1320971340224479062.~1663960300779399~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/.zarray.__tmp13481401145456933929.~1663960300501314~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/.zarray.__tmp15793081268148901456.~1663960300827397~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/.zarray.__tmp1583414768807989616.~1663960300386596~
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
|
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f27871d2ca5479491c8f11e708f3a4b07d4869dd8583cb3fc8b29dfd20f0a54
|
3 |
+
size 7814955
|
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf96bf39c85d3e5edb07cb015f2859f171a5967d2da4e2303d61d615e2edca09
|
3 |
+
size 7808347
|
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1b82211954c78503fd73446351d9e08cce75b9746f163c724e72e97a710bc9b7
|
3 |
+
size 7808660
|
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f638e097bae496293f86733b096b6eb5acc5f5add71a6a56ceda323df180e7e3
|
3 |
+
size 7811946
|
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7e9a354cd9fe6bddf7390bba3db9674c051fe64998e7e017a3cb215cf0f6b864
|
3 |
+
size 7823885
|
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.5
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3e836460108d8aa9747f0f4d65ffff76f41c68c58d83f970c353a105e6f89d9f
|
3 |
+
size 7810257
|
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.6
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:de3b9f014715a46b6142ba78e6f016b82399835f1481619dab2aa0f2779d75f9
|
3 |
+
size 7823000
|
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.7
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0e12ba658947c9f8baf00b05daceae49039104127c3f697c556d4a13c45b9127
|
3 |
+
size 7810649
|