mv
Browse filesThis view is limited to 50 files because it contains too many changes. Β
See raw diff
- {exp12 β exp12-1}/000-module.3.input_layernorm/events.out.tfevents.1638219661.r6i6n8.58256.4 +0 -0
- {exp12 β exp12-1}/000-module.3.mlp.dense_4h_to_h/events.out.tfevents.1638219662.r6i6n8.58256.12 +0 -0
- {exp12 β exp12-1}/000-module.3.mlp.dense_h_to_4h/events.out.tfevents.1638219662.r6i6n8.58256.11 +0 -0
- {exp12 β exp12-1}/000-module.3.mlp/events.out.tfevents.1638219662.r6i6n8.58256.13 +0 -0
- {exp12 β exp12-1}/000-module.3.post_attention_layernorm/events.out.tfevents.1638219662.r6i6n8.58256.10 +0 -0
- {exp12 β exp12-1}/000-module.3.self_attention.attention_dropout/events.out.tfevents.1638219661.r6i6n8.58256.7 +0 -0
- {exp12 β exp12-1}/000-module.3.self_attention.dense/events.out.tfevents.1638219661.r6i6n8.58256.8 +0 -0
- {exp12 β exp12-1}/000-module.3.self_attention.query_key_value/events.out.tfevents.1638219661.r6i6n8.58256.5 +0 -0
- {exp12 β exp12-1}/000-module.3.self_attention.scale_mask_softmax/events.out.tfevents.1638219661.r6i6n8.58256.6 +0 -0
- {exp12 β exp12-1}/000-module.3.self_attention/events.out.tfevents.1638219661.r6i6n8.58256.9 +0 -0
- {exp12 β exp12-1}/000-module.3/events.out.tfevents.1638219662.r6i6n8.58256.14 +0 -0
- {exp12 β exp12-1}/000-module.4.input_layernorm/events.out.tfevents.1638219662.r6i6n8.58256.15 +0 -0
- {exp12 β exp12-1}/000-module.4.mlp.dense_4h_to_h/events.out.tfevents.1638219662.r6i6n8.58256.23 +0 -0
- {exp12 β exp12-1}/000-module.4.mlp.dense_h_to_4h/events.out.tfevents.1638219662.r6i6n8.58256.22 +0 -0
- {exp12 β exp12-1}/000-module.4.mlp/events.out.tfevents.1638219662.r6i6n8.58256.24 +0 -0
- {exp12 β exp12-1}/000-module.4.post_attention_layernorm/events.out.tfevents.1638219662.r6i6n8.58256.21 +0 -0
- {exp12 β exp12-1}/000-module.4.self_attention.attention_dropout/events.out.tfevents.1638219662.r6i6n8.58256.18 +0 -0
- {exp12 β exp12-1}/000-module.4.self_attention.dense/events.out.tfevents.1638219662.r6i6n8.58256.19 +0 -0
- {exp12 β exp12-1}/000-module.4.self_attention.query_key_value/events.out.tfevents.1638219662.r6i6n8.58256.16 +0 -0
- {exp12 β exp12-1}/000-module.4.self_attention.scale_mask_softmax/events.out.tfevents.1638219662.r6i6n8.58256.17 +0 -0
- {exp12 β exp12-1}/000-module.4.self_attention/events.out.tfevents.1638219662.r6i6n8.58256.20 +0 -0
- {exp12 β exp12-1}/000-module.4/events.out.tfevents.1638219662.r6i6n8.58256.25 +0 -0
- {exp12 β exp12-1}/000-module.tied_modules.embed.embedding_dropout/events.out.tfevents.1638219661.r6i6n8.58256.2 +0 -0
- {exp12 β exp12-1}/000-module.tied_modules.embed.position_embeddings/events.out.tfevents.1638219661.r6i6n8.58256.1 +0 -0
- {exp12 β exp12-1}/000-module.tied_modules.embed.word_embeddings/events.out.tfevents.1638219661.r6i6n8.58256.0 +0 -0
- {exp12 β exp12-1}/000-module.tied_modules.embed/events.out.tfevents.1638219661.r6i6n8.58256.3 +0 -0
- {exp12 β exp12-1}/000-module/events.out.tfevents.1638219662.r6i6n8.58256.26 +0 -0
- {exp12 β exp12-1}/028-module.17.input_layernorm/events.out.tfevents.1638219673.r6i7n6.58182.0 +0 -0
- {exp12 β exp12-1}/028-module.17.mlp.dense_4h_to_h/events.out.tfevents.1638219674.r6i7n6.58182.8 +0 -0
- {exp12 β exp12-1}/028-module.17.mlp.dense_h_to_4h/events.out.tfevents.1638219674.r6i7n6.58182.7 +0 -0
- {exp12 β exp12-1}/028-module.17.mlp/events.out.tfevents.1638219674.r6i7n6.58182.9 +0 -0
- {exp12 β exp12-1}/028-module.17.post_attention_layernorm/events.out.tfevents.1638219674.r6i7n6.58182.6 +0 -0
- {exp12 β exp12-1}/028-module.17.self_attention.attention_dropout/events.out.tfevents.1638219673.r6i7n6.58182.3 +0 -0
- {exp12 β exp12-1}/028-module.17.self_attention.dense/events.out.tfevents.1638219673.r6i7n6.58182.4 +0 -0
- {exp12 β exp12-1}/028-module.17.self_attention.query_key_value/events.out.tfevents.1638219673.r6i7n6.58182.1 +0 -0
- {exp12 β exp12-1}/028-module.17.self_attention.scale_mask_softmax/events.out.tfevents.1638219673.r6i7n6.58182.2 +0 -0
- {exp12 β exp12-1}/028-module.17.self_attention/events.out.tfevents.1638219673.r6i7n6.58182.5 +0 -0
- {exp12 β exp12-1}/028-module.17/events.out.tfevents.1638219674.r6i7n6.58182.10 +0 -0
- {exp12 β exp12-1}/028-module.18.input_layernorm/events.out.tfevents.1638219674.r6i7n6.58182.11 +0 -0
- {exp12 β exp12-1}/028-module.18.mlp.dense_4h_to_h/events.out.tfevents.1638219674.r6i7n6.58182.19 +0 -0
- {exp12 β exp12-1}/028-module.18.mlp.dense_h_to_4h/events.out.tfevents.1638219674.r6i7n6.58182.18 +0 -0
- {exp12 β exp12-1}/028-module.18.mlp/events.out.tfevents.1638219674.r6i7n6.58182.20 +0 -0
- {exp12 β exp12-1}/028-module.18.post_attention_layernorm/events.out.tfevents.1638219674.r6i7n6.58182.17 +0 -0
- {exp12 β exp12-1}/028-module.18.self_attention.attention_dropout/events.out.tfevents.1638219674.r6i7n6.58182.14 +0 -0
- {exp12 β exp12-1}/028-module.18.self_attention.dense/events.out.tfevents.1638219674.r6i7n6.58182.15 +0 -0
- {exp12 β exp12-1}/028-module.18.self_attention.query_key_value/events.out.tfevents.1638219674.r6i7n6.58182.12 +0 -0
- {exp12 β exp12-1}/028-module.18.self_attention.scale_mask_softmax/events.out.tfevents.1638219674.r6i7n6.58182.13 +0 -0
- {exp12 β exp12-1}/028-module.18.self_attention/events.out.tfevents.1638219674.r6i7n6.58182.16 +0 -0
- {exp12 β exp12-1}/028-module.18/events.out.tfevents.1638219674.r6i7n6.58182.21 +0 -0
- {exp12 β exp12-1}/028-module/events.out.tfevents.1638219674.r6i7n6.58182.22 +0 -0
{exp12 β exp12-1}/000-module.3.input_layernorm/events.out.tfevents.1638219661.r6i6n8.58256.4
RENAMED
File without changes
|
{exp12 β exp12-1}/000-module.3.mlp.dense_4h_to_h/events.out.tfevents.1638219662.r6i6n8.58256.12
RENAMED
File without changes
|
{exp12 β exp12-1}/000-module.3.mlp.dense_h_to_4h/events.out.tfevents.1638219662.r6i6n8.58256.11
RENAMED
File without changes
|
{exp12 β exp12-1}/000-module.3.mlp/events.out.tfevents.1638219662.r6i6n8.58256.13
RENAMED
File without changes
|
{exp12 β exp12-1}/000-module.3.post_attention_layernorm/events.out.tfevents.1638219662.r6i6n8.58256.10
RENAMED
File without changes
|
{exp12 β exp12-1}/000-module.3.self_attention.attention_dropout/events.out.tfevents.1638219661.r6i6n8.58256.7
RENAMED
File without changes
|
{exp12 β exp12-1}/000-module.3.self_attention.dense/events.out.tfevents.1638219661.r6i6n8.58256.8
RENAMED
File without changes
|
{exp12 β exp12-1}/000-module.3.self_attention.query_key_value/events.out.tfevents.1638219661.r6i6n8.58256.5
RENAMED
File without changes
|
{exp12 β exp12-1}/000-module.3.self_attention.scale_mask_softmax/events.out.tfevents.1638219661.r6i6n8.58256.6
RENAMED
File without changes
|
{exp12 β exp12-1}/000-module.3.self_attention/events.out.tfevents.1638219661.r6i6n8.58256.9
RENAMED
File without changes
|
{exp12 β exp12-1}/000-module.3/events.out.tfevents.1638219662.r6i6n8.58256.14
RENAMED
File without changes
|
{exp12 β exp12-1}/000-module.4.input_layernorm/events.out.tfevents.1638219662.r6i6n8.58256.15
RENAMED
File without changes
|
{exp12 β exp12-1}/000-module.4.mlp.dense_4h_to_h/events.out.tfevents.1638219662.r6i6n8.58256.23
RENAMED
File without changes
|
{exp12 β exp12-1}/000-module.4.mlp.dense_h_to_4h/events.out.tfevents.1638219662.r6i6n8.58256.22
RENAMED
File without changes
|
{exp12 β exp12-1}/000-module.4.mlp/events.out.tfevents.1638219662.r6i6n8.58256.24
RENAMED
File without changes
|
{exp12 β exp12-1}/000-module.4.post_attention_layernorm/events.out.tfevents.1638219662.r6i6n8.58256.21
RENAMED
File without changes
|
{exp12 β exp12-1}/000-module.4.self_attention.attention_dropout/events.out.tfevents.1638219662.r6i6n8.58256.18
RENAMED
File without changes
|
{exp12 β exp12-1}/000-module.4.self_attention.dense/events.out.tfevents.1638219662.r6i6n8.58256.19
RENAMED
File without changes
|
{exp12 β exp12-1}/000-module.4.self_attention.query_key_value/events.out.tfevents.1638219662.r6i6n8.58256.16
RENAMED
File without changes
|
{exp12 β exp12-1}/000-module.4.self_attention.scale_mask_softmax/events.out.tfevents.1638219662.r6i6n8.58256.17
RENAMED
File without changes
|
{exp12 β exp12-1}/000-module.4.self_attention/events.out.tfevents.1638219662.r6i6n8.58256.20
RENAMED
File without changes
|
{exp12 β exp12-1}/000-module.4/events.out.tfevents.1638219662.r6i6n8.58256.25
RENAMED
File without changes
|
{exp12 β exp12-1}/000-module.tied_modules.embed.embedding_dropout/events.out.tfevents.1638219661.r6i6n8.58256.2
RENAMED
File without changes
|
{exp12 β exp12-1}/000-module.tied_modules.embed.position_embeddings/events.out.tfevents.1638219661.r6i6n8.58256.1
RENAMED
File without changes
|
{exp12 β exp12-1}/000-module.tied_modules.embed.word_embeddings/events.out.tfevents.1638219661.r6i6n8.58256.0
RENAMED
File without changes
|
{exp12 β exp12-1}/000-module.tied_modules.embed/events.out.tfevents.1638219661.r6i6n8.58256.3
RENAMED
File without changes
|
{exp12 β exp12-1}/000-module/events.out.tfevents.1638219662.r6i6n8.58256.26
RENAMED
File without changes
|
{exp12 β exp12-1}/028-module.17.input_layernorm/events.out.tfevents.1638219673.r6i7n6.58182.0
RENAMED
File without changes
|
{exp12 β exp12-1}/028-module.17.mlp.dense_4h_to_h/events.out.tfevents.1638219674.r6i7n6.58182.8
RENAMED
File without changes
|
{exp12 β exp12-1}/028-module.17.mlp.dense_h_to_4h/events.out.tfevents.1638219674.r6i7n6.58182.7
RENAMED
File without changes
|
{exp12 β exp12-1}/028-module.17.mlp/events.out.tfevents.1638219674.r6i7n6.58182.9
RENAMED
File without changes
|
{exp12 β exp12-1}/028-module.17.post_attention_layernorm/events.out.tfevents.1638219674.r6i7n6.58182.6
RENAMED
File without changes
|
{exp12 β exp12-1}/028-module.17.self_attention.attention_dropout/events.out.tfevents.1638219673.r6i7n6.58182.3
RENAMED
File without changes
|
{exp12 β exp12-1}/028-module.17.self_attention.dense/events.out.tfevents.1638219673.r6i7n6.58182.4
RENAMED
File without changes
|
{exp12 β exp12-1}/028-module.17.self_attention.query_key_value/events.out.tfevents.1638219673.r6i7n6.58182.1
RENAMED
File without changes
|
{exp12 β exp12-1}/028-module.17.self_attention.scale_mask_softmax/events.out.tfevents.1638219673.r6i7n6.58182.2
RENAMED
File without changes
|
{exp12 β exp12-1}/028-module.17.self_attention/events.out.tfevents.1638219673.r6i7n6.58182.5
RENAMED
File without changes
|
{exp12 β exp12-1}/028-module.17/events.out.tfevents.1638219674.r6i7n6.58182.10
RENAMED
File without changes
|
{exp12 β exp12-1}/028-module.18.input_layernorm/events.out.tfevents.1638219674.r6i7n6.58182.11
RENAMED
File without changes
|
{exp12 β exp12-1}/028-module.18.mlp.dense_4h_to_h/events.out.tfevents.1638219674.r6i7n6.58182.19
RENAMED
File without changes
|
{exp12 β exp12-1}/028-module.18.mlp.dense_h_to_4h/events.out.tfevents.1638219674.r6i7n6.58182.18
RENAMED
File without changes
|
{exp12 β exp12-1}/028-module.18.mlp/events.out.tfevents.1638219674.r6i7n6.58182.20
RENAMED
File without changes
|
{exp12 β exp12-1}/028-module.18.post_attention_layernorm/events.out.tfevents.1638219674.r6i7n6.58182.17
RENAMED
File without changes
|
{exp12 β exp12-1}/028-module.18.self_attention.attention_dropout/events.out.tfevents.1638219674.r6i7n6.58182.14
RENAMED
File without changes
|
{exp12 β exp12-1}/028-module.18.self_attention.dense/events.out.tfevents.1638219674.r6i7n6.58182.15
RENAMED
File without changes
|
{exp12 β exp12-1}/028-module.18.self_attention.query_key_value/events.out.tfevents.1638219674.r6i7n6.58182.12
RENAMED
File without changes
|
{exp12 β exp12-1}/028-module.18.self_attention.scale_mask_softmax/events.out.tfevents.1638219674.r6i7n6.58182.13
RENAMED
File without changes
|
{exp12 β exp12-1}/028-module.18.self_attention/events.out.tfevents.1638219674.r6i7n6.58182.16
RENAMED
File without changes
|
{exp12 β exp12-1}/028-module.18/events.out.tfevents.1638219674.r6i7n6.58182.21
RENAMED
File without changes
|
{exp12 β exp12-1}/028-module/events.out.tfevents.1638219674.r6i7n6.58182.22
RENAMED
File without changes
|