TimeRobber commited on
Commit
d38c4eb
·
1 Parent(s): a349b9b

Upload part 48

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +45 -0
  2. checkpoint_1007000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/.zarray +1 -0
  3. checkpoint_1007000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/0 +0 -0
  4. checkpoint_1007000/state.param_states.encoder.layers_8.pre_attention_layer_norm.scale.v/.zarray +1 -0
  5. checkpoint_1007000/state.param_states.encoder.layers_8.pre_attention_layer_norm.scale.v/0 +0 -0
  6. checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/.zarray +1 -0
  7. checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/.zarray.__tmp11388929281291012784.~1663960300777529~ +1 -0
  8. checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/.zarray.__tmp15408944531962108593.~1663960300425676~ +1 -0
  9. checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/.zarray.__tmp3478453131278811786.~1663960300016402~ +1 -0
  10. checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/.zarray.__tmp4231906932503099425.~1663960300018110~ +1 -0
  11. checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/.zarray.__tmp6692212168669761562.~1663960299927504~ +1 -0
  12. checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.0 +3 -0
  13. checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.1 +3 -0
  14. checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.2 +3 -0
  15. checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.3 +3 -0
  16. checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.5 +3 -0
  17. checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.6 +3 -0
  18. checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.7 +3 -0
  19. checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/.zarray +1 -0
  20. checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/.zarray.__tmp11221331478812435637.~1663960300865791~ +1 -0
  21. checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/.zarray.__tmp16906819682476284264.~1663960300865325~ +1 -0
  22. checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/.zarray.__tmp2270484310615939027.~1663960300546742~ +1 -0
  23. checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/.zarray.__tmp2349333016348064455.~1663960300827348~ +1 -0
  24. checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/.zarray.__tmp2361301302702635123.~1663960300601360~ +1 -0
  25. checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/.zarray.__tmp7291065410866952681.~1663960300385543~ +1 -0
  26. checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/.zarray.__tmp907707751639812339.~1663960300774042~ +1 -0
  27. checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.0 +3 -0
  28. checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.2 +3 -0
  29. checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.3 +3 -0
  30. checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.4 +3 -0
  31. checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.5 +3 -0
  32. checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.6 +3 -0
  33. checkpoint_1007000/target.decoder.layers_2.pre_self_attention_layer_norm.scale/.zarray +1 -0
  34. checkpoint_1007000/target.decoder.layers_2.pre_self_attention_layer_norm.scale/0 +0 -0
  35. checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/.zarray +1 -0
  36. checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/.zarray.__tmp10448794869755293873.~1663960300420703~ +1 -0
  37. checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/.zarray.__tmp11106886688829216473.~1663960300685559~ +1 -0
  38. checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/.zarray.__tmp12010709428620963921.~1663960301029038~ +1 -0
  39. checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/.zarray.__tmp1320971340224479062.~1663960300779399~ +1 -0
  40. checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/.zarray.__tmp13481401145456933929.~1663960300501314~ +1 -0
  41. checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/.zarray.__tmp15793081268148901456.~1663960300827397~ +1 -0
  42. checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/.zarray.__tmp1583414768807989616.~1663960300386596~ +1 -0
  43. checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.0 +3 -0
  44. checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.1 +3 -0
  45. checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.2 +3 -0
  46. checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.3 +3 -0
  47. checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.4 +3 -0
  48. checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.5 +3 -0
  49. checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.6 +3 -0
  50. checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.7 +3 -0
.gitattributes CHANGED
@@ -2437,3 +2437,48 @@ checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.value.kerne
2437
  checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
2438
  checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
2439
  checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2437
  checkpoint_1007000/target.decoder.layers_2.encoder_decoder_attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
2438
  checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
2439
  checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
2440
+ checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2441
+ checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
2442
+ checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
2443
+ checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
2444
+ checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
2445
+ checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
2446
+ checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
2447
+ checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
2448
+ checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2449
+ checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
2450
+ checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
2451
+ checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
2452
+ checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
2453
+ checkpoint_1007000/target.decoder.layers_3.encoder_decoder_attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
2454
+ checkpoint_1007000/target.decoder.layers_6.mlp.wo.kernel/6.0 filter=lfs diff=lfs merge=lfs -text
2455
+ checkpoint_1007000/target.decoder.layers_6.mlp.wo.kernel/1.0 filter=lfs diff=lfs merge=lfs -text
2456
+ checkpoint_1007000/target.decoder.layers_6.mlp.wo.kernel/3.0 filter=lfs diff=lfs merge=lfs -text
2457
+ checkpoint_1007000/target.decoder.layers_6.mlp.wo.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2458
+ checkpoint_1007000/target.decoder.layers_6.mlp.wo.kernel/7.0 filter=lfs diff=lfs merge=lfs -text
2459
+ checkpoint_1007000/target.decoder.layers_6.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
2460
+ checkpoint_1007000/target.decoder.layers_6.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
2461
+ checkpoint_1007000/target.decoder.layers_6.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
2462
+ checkpoint_1007000/target.decoder.layers_8.encoder_decoder_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
2463
+ checkpoint_1007000/target.decoder.layers_8.encoder_decoder_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
2464
+ checkpoint_1007000/target.decoder.layers_8.encoder_decoder_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2465
+ checkpoint_1007000/target.decoder.layers_8.encoder_decoder_attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
2466
+ checkpoint_1007000/target.decoder.layers_8.encoder_decoder_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
2467
+ checkpoint_1007000/target.decoder.layers_8.encoder_decoder_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
2468
+ checkpoint_1007000/target.decoder.layers_8.encoder_decoder_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
2469
+ checkpoint_1007000/target.decoder.layers_8.encoder_decoder_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
2470
+ checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
2471
+ checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
2472
+ checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2473
+ checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
2474
+ checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
2475
+ checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
2476
+ checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
2477
+ checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
2478
+ checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
2479
+ checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
2480
+ checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2481
+ checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
2482
+ checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
2483
+ checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
2484
+ checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
checkpoint_1007000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
checkpoint_1007000/state.param_states.decoder.layers_14.pre_self_attention_layer_norm.scale.v/0 ADDED
Binary file (15.1 kB). View file
 
checkpoint_1007000/state.param_states.encoder.layers_8.pre_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
checkpoint_1007000/state.param_states.encoder.layers_8.pre_attention_layer_norm.scale.v/0 ADDED
Binary file (15.3 kB). View file
 
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/.zarray.__tmp11388929281291012784.~1663960300777529~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/.zarray.__tmp15408944531962108593.~1663960300425676~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/.zarray.__tmp3478453131278811786.~1663960300016402~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/.zarray.__tmp4231906932503099425.~1663960300018110~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/.zarray.__tmp6692212168669761562.~1663960299927504~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16cc4b350c67bd3694d8eb55387534e65757ee94b2a0fd06258ea477366516e3
3
+ size 7804869
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ece3f9c4526f984bb2bb5032aec2f966452d669dfe09e12d6ffe079c5280ca12
3
+ size 7805609
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e036c449283de0859089911166abae9a58e14244eadb91d6521952574aa3bf9
3
+ size 7805423
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b3b5770b4739035ed38c025521445b2693c2d06fa8a3c84a0258700c43d7af7
3
+ size 7806437
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:657a6404a7fd95149b7e3a7510b078a35d96ddc3e7d8f262a5aa8e3a13e5134d
3
+ size 7807599
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9193945c79a1cf6525b20afe5981b9064314277fa627191c1d7778ccfab3db54
3
+ size 7808392
checkpoint_1007000/target.decoder.layers_10.encoder_decoder_attention.key.kernel/0.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:360aa9813f97cec8a1ca60195dd1e951db321550de918e2afe317674457873c1
3
+ size 7804791
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/.zarray.__tmp11221331478812435637.~1663960300865791~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/.zarray.__tmp16906819682476284264.~1663960300865325~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/.zarray.__tmp2270484310615939027.~1663960300546742~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/.zarray.__tmp2349333016348064455.~1663960300827348~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/.zarray.__tmp2361301302702635123.~1663960300601360~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/.zarray.__tmp7291065410866952681.~1663960300385543~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/.zarray.__tmp907707751639812339.~1663960300774042~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:346543e9bf86b3fbe70c72d5bcfdab2d60983e39eeba2cc37be18d8307c2e50f
3
+ size 7802759
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be34f87b406639029b849110121eb3bffa8e514dee521be86a913d3d8a92b403
3
+ size 7805389
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bfaa8e543e160a3c1899e6a46573cb50e82fc2d350258deddb207d7045608e5e
3
+ size 7803234
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56ac3a34050e95d1d28af8dd265e9f5b3111a31269ab73da986cae39d0ec3731
3
+ size 7801647
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:564cca01fe48d062666bd188c1156c63ed34030aa73b8d877029f4a4ab108f76
3
+ size 7802842
checkpoint_1007000/target.decoder.layers_18.encoder_decoder_attention.key.kernel/0.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:689f566351326650526f38ccf494d86a272472893b6a554d6bf60d977ab7376b
3
+ size 7801624
checkpoint_1007000/target.decoder.layers_2.pre_self_attention_layer_norm.scale/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_2.pre_self_attention_layer_norm.scale/0 ADDED
Binary file (14.9 kB). View file
 
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/.zarray.__tmp10448794869755293873.~1663960300420703~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/.zarray.__tmp11106886688829216473.~1663960300685559~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/.zarray.__tmp12010709428620963921.~1663960301029038~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/.zarray.__tmp1320971340224479062.~1663960300779399~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/.zarray.__tmp13481401145456933929.~1663960300501314~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/.zarray.__tmp15793081268148901456.~1663960300827397~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/.zarray.__tmp1583414768807989616.~1663960300386596~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f27871d2ca5479491c8f11e708f3a4b07d4869dd8583cb3fc8b29dfd20f0a54
3
+ size 7814955
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf96bf39c85d3e5edb07cb015f2859f171a5967d2da4e2303d61d615e2edca09
3
+ size 7808347
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b82211954c78503fd73446351d9e08cce75b9746f163c724e72e97a710bc9b7
3
+ size 7808660
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f638e097bae496293f86733b096b6eb5acc5f5add71a6a56ceda323df180e7e3
3
+ size 7811946
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e9a354cd9fe6bddf7390bba3db9674c051fe64998e7e017a3cb215cf0f6b864
3
+ size 7823885
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e836460108d8aa9747f0f4d65ffff76f41c68c58d83f970c353a105e6f89d9f
3
+ size 7810257
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de3b9f014715a46b6142ba78e6f016b82399835f1481619dab2aa0f2779d75f9
3
+ size 7823000
checkpoint_1007000/target.decoder.layers_20.self_attention.query.kernel/0.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e12ba658947c9f8baf00b05daceae49039104127c3f697c556d4a13c45b9127
3
+ size 7810649