stas committed on
Commit
883eb1b
·
1 Parent(s): fc0659b
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. {exp12 → exp12-1}/000-module.3.input_layernorm/events.out.tfevents.1638219661.r6i6n8.58256.4 +0 -0
  2. {exp12 → exp12-1}/000-module.3.mlp.dense_4h_to_h/events.out.tfevents.1638219662.r6i6n8.58256.12 +0 -0
  3. {exp12 → exp12-1}/000-module.3.mlp.dense_h_to_4h/events.out.tfevents.1638219662.r6i6n8.58256.11 +0 -0
  4. {exp12 → exp12-1}/000-module.3.mlp/events.out.tfevents.1638219662.r6i6n8.58256.13 +0 -0
  5. {exp12 → exp12-1}/000-module.3.post_attention_layernorm/events.out.tfevents.1638219662.r6i6n8.58256.10 +0 -0
  6. {exp12 → exp12-1}/000-module.3.self_attention.attention_dropout/events.out.tfevents.1638219661.r6i6n8.58256.7 +0 -0
  7. {exp12 → exp12-1}/000-module.3.self_attention.dense/events.out.tfevents.1638219661.r6i6n8.58256.8 +0 -0
  8. {exp12 → exp12-1}/000-module.3.self_attention.query_key_value/events.out.tfevents.1638219661.r6i6n8.58256.5 +0 -0
  9. {exp12 → exp12-1}/000-module.3.self_attention.scale_mask_softmax/events.out.tfevents.1638219661.r6i6n8.58256.6 +0 -0
  10. {exp12 → exp12-1}/000-module.3.self_attention/events.out.tfevents.1638219661.r6i6n8.58256.9 +0 -0
  11. {exp12 → exp12-1}/000-module.3/events.out.tfevents.1638219662.r6i6n8.58256.14 +0 -0
  12. {exp12 → exp12-1}/000-module.4.input_layernorm/events.out.tfevents.1638219662.r6i6n8.58256.15 +0 -0
  13. {exp12 → exp12-1}/000-module.4.mlp.dense_4h_to_h/events.out.tfevents.1638219662.r6i6n8.58256.23 +0 -0
  14. {exp12 → exp12-1}/000-module.4.mlp.dense_h_to_4h/events.out.tfevents.1638219662.r6i6n8.58256.22 +0 -0
  15. {exp12 → exp12-1}/000-module.4.mlp/events.out.tfevents.1638219662.r6i6n8.58256.24 +0 -0
  16. {exp12 → exp12-1}/000-module.4.post_attention_layernorm/events.out.tfevents.1638219662.r6i6n8.58256.21 +0 -0
  17. {exp12 → exp12-1}/000-module.4.self_attention.attention_dropout/events.out.tfevents.1638219662.r6i6n8.58256.18 +0 -0
  18. {exp12 → exp12-1}/000-module.4.self_attention.dense/events.out.tfevents.1638219662.r6i6n8.58256.19 +0 -0
  19. {exp12 → exp12-1}/000-module.4.self_attention.query_key_value/events.out.tfevents.1638219662.r6i6n8.58256.16 +0 -0
  20. {exp12 → exp12-1}/000-module.4.self_attention.scale_mask_softmax/events.out.tfevents.1638219662.r6i6n8.58256.17 +0 -0
  21. {exp12 → exp12-1}/000-module.4.self_attention/events.out.tfevents.1638219662.r6i6n8.58256.20 +0 -0
  22. {exp12 → exp12-1}/000-module.4/events.out.tfevents.1638219662.r6i6n8.58256.25 +0 -0
  23. {exp12 → exp12-1}/000-module.tied_modules.embed.embedding_dropout/events.out.tfevents.1638219661.r6i6n8.58256.2 +0 -0
  24. {exp12 → exp12-1}/000-module.tied_modules.embed.position_embeddings/events.out.tfevents.1638219661.r6i6n8.58256.1 +0 -0
  25. {exp12 → exp12-1}/000-module.tied_modules.embed.word_embeddings/events.out.tfevents.1638219661.r6i6n8.58256.0 +0 -0
  26. {exp12 → exp12-1}/000-module.tied_modules.embed/events.out.tfevents.1638219661.r6i6n8.58256.3 +0 -0
  27. {exp12 → exp12-1}/000-module/events.out.tfevents.1638219662.r6i6n8.58256.26 +0 -0
  28. {exp12 → exp12-1}/028-module.17.input_layernorm/events.out.tfevents.1638219673.r6i7n6.58182.0 +0 -0
  29. {exp12 → exp12-1}/028-module.17.mlp.dense_4h_to_h/events.out.tfevents.1638219674.r6i7n6.58182.8 +0 -0
  30. {exp12 → exp12-1}/028-module.17.mlp.dense_h_to_4h/events.out.tfevents.1638219674.r6i7n6.58182.7 +0 -0
  31. {exp12 → exp12-1}/028-module.17.mlp/events.out.tfevents.1638219674.r6i7n6.58182.9 +0 -0
  32. {exp12 → exp12-1}/028-module.17.post_attention_layernorm/events.out.tfevents.1638219674.r6i7n6.58182.6 +0 -0
  33. {exp12 → exp12-1}/028-module.17.self_attention.attention_dropout/events.out.tfevents.1638219673.r6i7n6.58182.3 +0 -0
  34. {exp12 → exp12-1}/028-module.17.self_attention.dense/events.out.tfevents.1638219673.r6i7n6.58182.4 +0 -0
  35. {exp12 → exp12-1}/028-module.17.self_attention.query_key_value/events.out.tfevents.1638219673.r6i7n6.58182.1 +0 -0
  36. {exp12 → exp12-1}/028-module.17.self_attention.scale_mask_softmax/events.out.tfevents.1638219673.r6i7n6.58182.2 +0 -0
  37. {exp12 → exp12-1}/028-module.17.self_attention/events.out.tfevents.1638219673.r6i7n6.58182.5 +0 -0
  38. {exp12 → exp12-1}/028-module.17/events.out.tfevents.1638219674.r6i7n6.58182.10 +0 -0
  39. {exp12 → exp12-1}/028-module.18.input_layernorm/events.out.tfevents.1638219674.r6i7n6.58182.11 +0 -0
  40. {exp12 → exp12-1}/028-module.18.mlp.dense_4h_to_h/events.out.tfevents.1638219674.r6i7n6.58182.19 +0 -0
  41. {exp12 → exp12-1}/028-module.18.mlp.dense_h_to_4h/events.out.tfevents.1638219674.r6i7n6.58182.18 +0 -0
  42. {exp12 → exp12-1}/028-module.18.mlp/events.out.tfevents.1638219674.r6i7n6.58182.20 +0 -0
  43. {exp12 → exp12-1}/028-module.18.post_attention_layernorm/events.out.tfevents.1638219674.r6i7n6.58182.17 +0 -0
  44. {exp12 → exp12-1}/028-module.18.self_attention.attention_dropout/events.out.tfevents.1638219674.r6i7n6.58182.14 +0 -0
  45. {exp12 → exp12-1}/028-module.18.self_attention.dense/events.out.tfevents.1638219674.r6i7n6.58182.15 +0 -0
  46. {exp12 → exp12-1}/028-module.18.self_attention.query_key_value/events.out.tfevents.1638219674.r6i7n6.58182.12 +0 -0
  47. {exp12 → exp12-1}/028-module.18.self_attention.scale_mask_softmax/events.out.tfevents.1638219674.r6i7n6.58182.13 +0 -0
  48. {exp12 → exp12-1}/028-module.18.self_attention/events.out.tfevents.1638219674.r6i7n6.58182.16 +0 -0
  49. {exp12 → exp12-1}/028-module.18/events.out.tfevents.1638219674.r6i7n6.58182.21 +0 -0
  50. {exp12 → exp12-1}/028-module/events.out.tfevents.1638219674.r6i7n6.58182.22 +0 -0
{exp12 → exp12-1}/000-module.3.input_layernorm/events.out.tfevents.1638219661.r6i6n8.58256.4 RENAMED
File without changes
{exp12 → exp12-1}/000-module.3.mlp.dense_4h_to_h/events.out.tfevents.1638219662.r6i6n8.58256.12 RENAMED
File without changes
{exp12 → exp12-1}/000-module.3.mlp.dense_h_to_4h/events.out.tfevents.1638219662.r6i6n8.58256.11 RENAMED
File without changes
{exp12 → exp12-1}/000-module.3.mlp/events.out.tfevents.1638219662.r6i6n8.58256.13 RENAMED
File without changes
{exp12 → exp12-1}/000-module.3.post_attention_layernorm/events.out.tfevents.1638219662.r6i6n8.58256.10 RENAMED
File without changes
{exp12 → exp12-1}/000-module.3.self_attention.attention_dropout/events.out.tfevents.1638219661.r6i6n8.58256.7 RENAMED
File without changes
{exp12 → exp12-1}/000-module.3.self_attention.dense/events.out.tfevents.1638219661.r6i6n8.58256.8 RENAMED
File without changes
{exp12 → exp12-1}/000-module.3.self_attention.query_key_value/events.out.tfevents.1638219661.r6i6n8.58256.5 RENAMED
File without changes
{exp12 → exp12-1}/000-module.3.self_attention.scale_mask_softmax/events.out.tfevents.1638219661.r6i6n8.58256.6 RENAMED
File without changes
{exp12 → exp12-1}/000-module.3.self_attention/events.out.tfevents.1638219661.r6i6n8.58256.9 RENAMED
File without changes
{exp12 → exp12-1}/000-module.3/events.out.tfevents.1638219662.r6i6n8.58256.14 RENAMED
File without changes
{exp12 → exp12-1}/000-module.4.input_layernorm/events.out.tfevents.1638219662.r6i6n8.58256.15 RENAMED
File without changes
{exp12 → exp12-1}/000-module.4.mlp.dense_4h_to_h/events.out.tfevents.1638219662.r6i6n8.58256.23 RENAMED
File without changes
{exp12 → exp12-1}/000-module.4.mlp.dense_h_to_4h/events.out.tfevents.1638219662.r6i6n8.58256.22 RENAMED
File without changes
{exp12 → exp12-1}/000-module.4.mlp/events.out.tfevents.1638219662.r6i6n8.58256.24 RENAMED
File without changes
{exp12 → exp12-1}/000-module.4.post_attention_layernorm/events.out.tfevents.1638219662.r6i6n8.58256.21 RENAMED
File without changes
{exp12 → exp12-1}/000-module.4.self_attention.attention_dropout/events.out.tfevents.1638219662.r6i6n8.58256.18 RENAMED
File without changes
{exp12 → exp12-1}/000-module.4.self_attention.dense/events.out.tfevents.1638219662.r6i6n8.58256.19 RENAMED
File without changes
{exp12 → exp12-1}/000-module.4.self_attention.query_key_value/events.out.tfevents.1638219662.r6i6n8.58256.16 RENAMED
File without changes
{exp12 → exp12-1}/000-module.4.self_attention.scale_mask_softmax/events.out.tfevents.1638219662.r6i6n8.58256.17 RENAMED
File without changes
{exp12 → exp12-1}/000-module.4.self_attention/events.out.tfevents.1638219662.r6i6n8.58256.20 RENAMED
File without changes
{exp12 → exp12-1}/000-module.4/events.out.tfevents.1638219662.r6i6n8.58256.25 RENAMED
File without changes
{exp12 → exp12-1}/000-module.tied_modules.embed.embedding_dropout/events.out.tfevents.1638219661.r6i6n8.58256.2 RENAMED
File without changes
{exp12 → exp12-1}/000-module.tied_modules.embed.position_embeddings/events.out.tfevents.1638219661.r6i6n8.58256.1 RENAMED
File without changes
{exp12 → exp12-1}/000-module.tied_modules.embed.word_embeddings/events.out.tfevents.1638219661.r6i6n8.58256.0 RENAMED
File without changes
{exp12 → exp12-1}/000-module.tied_modules.embed/events.out.tfevents.1638219661.r6i6n8.58256.3 RENAMED
File without changes
{exp12 → exp12-1}/000-module/events.out.tfevents.1638219662.r6i6n8.58256.26 RENAMED
File without changes
{exp12 → exp12-1}/028-module.17.input_layernorm/events.out.tfevents.1638219673.r6i7n6.58182.0 RENAMED
File without changes
{exp12 → exp12-1}/028-module.17.mlp.dense_4h_to_h/events.out.tfevents.1638219674.r6i7n6.58182.8 RENAMED
File without changes
{exp12 → exp12-1}/028-module.17.mlp.dense_h_to_4h/events.out.tfevents.1638219674.r6i7n6.58182.7 RENAMED
File without changes
{exp12 → exp12-1}/028-module.17.mlp/events.out.tfevents.1638219674.r6i7n6.58182.9 RENAMED
File without changes
{exp12 → exp12-1}/028-module.17.post_attention_layernorm/events.out.tfevents.1638219674.r6i7n6.58182.6 RENAMED
File without changes
{exp12 → exp12-1}/028-module.17.self_attention.attention_dropout/events.out.tfevents.1638219673.r6i7n6.58182.3 RENAMED
File without changes
{exp12 → exp12-1}/028-module.17.self_attention.dense/events.out.tfevents.1638219673.r6i7n6.58182.4 RENAMED
File without changes
{exp12 → exp12-1}/028-module.17.self_attention.query_key_value/events.out.tfevents.1638219673.r6i7n6.58182.1 RENAMED
File without changes
{exp12 → exp12-1}/028-module.17.self_attention.scale_mask_softmax/events.out.tfevents.1638219673.r6i7n6.58182.2 RENAMED
File without changes
{exp12 → exp12-1}/028-module.17.self_attention/events.out.tfevents.1638219673.r6i7n6.58182.5 RENAMED
File without changes
{exp12 → exp12-1}/028-module.17/events.out.tfevents.1638219674.r6i7n6.58182.10 RENAMED
File without changes
{exp12 → exp12-1}/028-module.18.input_layernorm/events.out.tfevents.1638219674.r6i7n6.58182.11 RENAMED
File without changes
{exp12 → exp12-1}/028-module.18.mlp.dense_4h_to_h/events.out.tfevents.1638219674.r6i7n6.58182.19 RENAMED
File without changes
{exp12 → exp12-1}/028-module.18.mlp.dense_h_to_4h/events.out.tfevents.1638219674.r6i7n6.58182.18 RENAMED
File without changes
{exp12 → exp12-1}/028-module.18.mlp/events.out.tfevents.1638219674.r6i7n6.58182.20 RENAMED
File without changes
{exp12 → exp12-1}/028-module.18.post_attention_layernorm/events.out.tfevents.1638219674.r6i7n6.58182.17 RENAMED
File without changes
{exp12 → exp12-1}/028-module.18.self_attention.attention_dropout/events.out.tfevents.1638219674.r6i7n6.58182.14 RENAMED
File without changes
{exp12 → exp12-1}/028-module.18.self_attention.dense/events.out.tfevents.1638219674.r6i7n6.58182.15 RENAMED
File without changes
{exp12 → exp12-1}/028-module.18.self_attention.query_key_value/events.out.tfevents.1638219674.r6i7n6.58182.12 RENAMED
File without changes
{exp12 → exp12-1}/028-module.18.self_attention.scale_mask_softmax/events.out.tfevents.1638219674.r6i7n6.58182.13 RENAMED
File without changes
{exp12 → exp12-1}/028-module.18.self_attention/events.out.tfevents.1638219674.r6i7n6.58182.16 RENAMED
File without changes
{exp12 → exp12-1}/028-module.18/events.out.tfevents.1638219674.r6i7n6.58182.21 RENAMED
File without changes
{exp12 → exp12-1}/028-module/events.out.tfevents.1638219674.r6i7n6.58182.22 RENAMED
File without changes