Dr. Jorge Abreu Vicente committed on
Commit
e4d816f
·
1 Parent(s): dd7fe74

End of training

Browse files
Files changed (20) hide show
  1. config.json +14 -23
  2. pytorch_model.bin +2 -2
  3. runs/Jan25_13-13-49_74c6fcc0d76a/1674652572.4056435/events.out.tfevents.1674652572.74c6fcc0d76a.6394.1 +3 -0
  4. runs/Jan25_13-13-49_74c6fcc0d76a/events.out.tfevents.1674652572.74c6fcc0d76a.6394.0 +3 -0
  5. runs/Jan25_13-13-49_74c6fcc0d76a/losses_main_loss_eval/events.out.tfevents.1674653105.74c6fcc0d76a.6394.5 +3 -0
  6. runs/Jan25_13-13-49_74c6fcc0d76a/losses_main_loss_train/events.out.tfevents.1674652583.74c6fcc0d76a.6394.2 +3 -0
  7. runs/Jan25_13-13-49_74c6fcc0d76a/other_data_epoch_epoch/events.out.tfevents.1674652583.74c6fcc0d76a.6394.4 +3 -0
  8. runs/Jan25_13-13-49_74c6fcc0d76a/other_data_eval_accuracy_score_eval_accuracy_score/events.out.tfevents.1674653105.74c6fcc0d76a.6394.6 +3 -0
  9. runs/Jan25_13-13-49_74c6fcc0d76a/other_data_eval_f1_eval_f1/events.out.tfevents.1674653105.74c6fcc0d76a.6394.9 +3 -0
  10. runs/Jan25_13-13-49_74c6fcc0d76a/other_data_eval_precision_eval_precision/events.out.tfevents.1674653105.74c6fcc0d76a.6394.7 +3 -0
  11. runs/Jan25_13-13-49_74c6fcc0d76a/other_data_eval_recall_eval_recall/events.out.tfevents.1674653105.74c6fcc0d76a.6394.8 +3 -0
  12. runs/Jan25_13-13-49_74c6fcc0d76a/other_data_eval_runtime_eval_runtime/events.out.tfevents.1674653105.74c6fcc0d76a.6394.10 +3 -0
  13. runs/Jan25_13-13-49_74c6fcc0d76a/other_data_eval_samples_per_second_eval_samples_per_second/events.out.tfevents.1674653105.74c6fcc0d76a.6394.11 +3 -0
  14. runs/Jan25_13-13-49_74c6fcc0d76a/other_data_eval_steps_per_second_eval_steps_per_second/events.out.tfevents.1674653105.74c6fcc0d76a.6394.12 +3 -0
  15. runs/Jan25_13-13-49_74c6fcc0d76a/other_data_learning_rate_learning_rate/events.out.tfevents.1674652583.74c6fcc0d76a.6394.3 +3 -0
  16. runs/Jan25_13-13-49_74c6fcc0d76a/other_data_train_loss_train_loss/events.out.tfevents.1674653112.74c6fcc0d76a.6394.16 +3 -0
  17. runs/Jan25_13-13-49_74c6fcc0d76a/other_data_train_runtime_train_runtime/events.out.tfevents.1674653112.74c6fcc0d76a.6394.13 +3 -0
  18. runs/Jan25_13-13-49_74c6fcc0d76a/other_data_train_samples_per_second_train_samples_per_second/events.out.tfevents.1674653112.74c6fcc0d76a.6394.14 +3 -0
  19. runs/Jan25_13-13-49_74c6fcc0d76a/other_data_train_steps_per_second_train_steps_per_second/events.out.tfevents.1674653112.74c6fcc0d76a.6394.15 +3 -0
  20. training_args.bin +1 -1
config.json CHANGED
@@ -1,46 +1,37 @@
1
  {
2
- "_name_or_path": "/lm_models/excell-roberta/v3-training-512bs/checkpoint-2716290",
3
  "architectures": [
4
- "EXcellRobertaForTokenClassification"
5
  ],
6
- "attention_probs_dropout_prob": 0.2,
7
- "bias_dense_layers": false,
8
- "bias_norm": false,
9
- "bos_token_id": 0,
10
  "classifier_dropout": null,
11
- "dense_layer_bias": false,
12
- "eos_token_id": 1,
13
  "hidden_act": "gelu",
14
- "hidden_dropout_prob": 0.2,
15
- "hidden_size": 768,
16
  "id2label": {
17
  "0": "O",
18
  "1": "B-PANEL_START",
19
  "2": "I-PANEL_START"
20
  },
21
  "initializer_range": 0.02,
22
- "intermediate_size": 3072,
23
  "label2id": {
24
  "B-PANEL_START": 1,
25
  "I-PANEL_START": 2,
26
  "O": 0
27
  },
28
  "layer_norm_eps": 1e-12,
29
- "max_position_embeddings": 514,
30
  "max_length": 512,
31
- "model_type": "roberta",
32
- "num_attention_heads": 12,
33
- "num_hidden_layers": 12,
34
- "pad_token_id": 3,
 
35
  "position_embedding_type": "absolute",
36
- "return_dict": false,
37
- "sep_token_id": 1,
38
- "swiglu": true,
39
- "swiglu_reduction": 2,
40
- "tokenizer_class": "RobertaTokenizerFast",
41
  "torch_dtype": "float32",
42
  "transformers_version": "4.20.0",
43
- "type_vocab_size": 1,
44
  "use_cache": true,
45
- "vocab_size": 64000
46
  }
 
1
  {
2
+ "_name_or_path": "michiyasunaga/BioLinkBERT-large",
3
  "architectures": [
4
+ "BertForTokenClassification"
5
  ],
6
+ "attention_probs_dropout_prob": 0.1,
 
 
 
7
  "classifier_dropout": null,
8
+ "gradient_checkpointing": false,
 
9
  "hidden_act": "gelu",
10
+ "hidden_dropout_prob": 0.1,
11
+ "hidden_size": 1024,
12
  "id2label": {
13
  "0": "O",
14
  "1": "B-PANEL_START",
15
  "2": "I-PANEL_START"
16
  },
17
  "initializer_range": 0.02,
18
+ "intermediate_size": 4096,
19
  "label2id": {
20
  "B-PANEL_START": 1,
21
  "I-PANEL_START": 2,
22
  "O": 0
23
  },
24
  "layer_norm_eps": 1e-12,
 
25
  "max_length": 512,
26
+ "max_position_embeddings": 512,
27
+ "model_type": "bert",
28
+ "num_attention_heads": 16,
29
+ "num_hidden_layers": 24,
30
+ "pad_token_id": 0,
31
  "position_embedding_type": "absolute",
 
 
 
 
 
32
  "torch_dtype": "float32",
33
  "transformers_version": "4.20.0",
34
+ "type_vocab_size": 2,
35
  "use_cache": true,
36
+ "vocab_size": 28895
37
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d5fcf91499380953fd583860c5b35ca38f57b902bbb503771f8f2ae75a3dcd89
3
- size 764757539
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32461e2a7352167c0e7e357825042ef0e491c4f39c8602d92fa8fa2da246ac1f
3
+ size 1329852593
runs/Jan25_13-13-49_74c6fcc0d76a/1674652572.4056435/events.out.tfevents.1674652572.74c6fcc0d76a.6394.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1942c9bb63d52262c574d4d81e338043be6c1a545ac0ac9c3477fc581cda870
3
+ size 5717
runs/Jan25_13-13-49_74c6fcc0d76a/events.out.tfevents.1674652572.74c6fcc0d76a.6394.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6aa4fe9af6d9d998ea6ea4c71de2c31127c5285c517c567d7b2e316fdb78613f
3
+ size 4037
runs/Jan25_13-13-49_74c6fcc0d76a/losses_main_loss_eval/events.out.tfevents.1674653105.74c6fcc0d76a.6394.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e382f6063c9220c24f16f1e6297e2f0e24ddfb27f4169a7fa7e89eac88a604d6
3
+ size 95
runs/Jan25_13-13-49_74c6fcc0d76a/losses_main_loss_train/events.out.tfevents.1674652583.74c6fcc0d76a.6394.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca82b9f9f9dcba60e8c88bd3e68ba95b1a80152ed73d7901aafc6c36bd608b33
3
+ size 313
runs/Jan25_13-13-49_74c6fcc0d76a/other_data_epoch_epoch/events.out.tfevents.1674652583.74c6fcc0d76a.6394.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9a18bda36f5f3db0f22377d55cad6b78b7d7f1e28cd27d30c7854627eb06ce0
3
+ size 423
runs/Jan25_13-13-49_74c6fcc0d76a/other_data_eval_accuracy_score_eval_accuracy_score/events.out.tfevents.1674653105.74c6fcc0d76a.6394.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d58816a24ed68bd679a81fac726962c295b2a0980a59d378f5a43b306e2b24a6
3
+ size 109
runs/Jan25_13-13-49_74c6fcc0d76a/other_data_eval_f1_eval_f1/events.out.tfevents.1674653105.74c6fcc0d76a.6394.9 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7767220b15608b4bdbd60f175a7e53a09c7c6f441058bfca6623480cd92889d5
3
+ size 97
runs/Jan25_13-13-49_74c6fcc0d76a/other_data_eval_precision_eval_precision/events.out.tfevents.1674653105.74c6fcc0d76a.6394.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd55a8b018aa669574459ac13d350300746550cef5ac5c8575b1187c5168d16f
3
+ size 104
runs/Jan25_13-13-49_74c6fcc0d76a/other_data_eval_recall_eval_recall/events.out.tfevents.1674653105.74c6fcc0d76a.6394.8 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb62cde58a48f604b58a8ff48e19a3b6a24c0c75c11df7fbd024746383ee22f3
3
+ size 101
runs/Jan25_13-13-49_74c6fcc0d76a/other_data_eval_runtime_eval_runtime/events.out.tfevents.1674653105.74c6fcc0d76a.6394.10 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b460cdbc8b5caf3c41a7b148fb7920e04d6c61fe18184fca55b89bc0a229eb0d
3
+ size 102
runs/Jan25_13-13-49_74c6fcc0d76a/other_data_eval_samples_per_second_eval_samples_per_second/events.out.tfevents.1674653105.74c6fcc0d76a.6394.11 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6045f7cb7f3d5ee1047611d1fa6ed9fea1931c2621aecb191304fcf980318e8a
3
+ size 113
runs/Jan25_13-13-49_74c6fcc0d76a/other_data_eval_steps_per_second_eval_steps_per_second/events.out.tfevents.1674653105.74c6fcc0d76a.6394.12 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e25c3f9611bbe672373af750d497d8821ec3c9c19f3fd0e626c9c38b9664408e
3
+ size 111
runs/Jan25_13-13-49_74c6fcc0d76a/other_data_learning_rate_learning_rate/events.out.tfevents.1674652583.74c6fcc0d76a.6394.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb69e10ad3ea51b4db014f586363e52c0a565d03b8f870aa14863da4df7ac438
3
+ size 353
runs/Jan25_13-13-49_74c6fcc0d76a/other_data_train_loss_train_loss/events.out.tfevents.1674653112.74c6fcc0d76a.6394.16 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:171efe0ffd0d7745fbf516ed3267d254d318b028f685b4c409813cde57fa686c
3
+ size 100
runs/Jan25_13-13-49_74c6fcc0d76a/other_data_train_runtime_train_runtime/events.out.tfevents.1674653112.74c6fcc0d76a.6394.13 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00b35036623666265699672d3f219deed5c2b866018e1839119ff83ea0946c0f
3
+ size 103
runs/Jan25_13-13-49_74c6fcc0d76a/other_data_train_samples_per_second_train_samples_per_second/events.out.tfevents.1674653112.74c6fcc0d76a.6394.14 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8943aac6acb2c4ba093eb2887b077ddb62c350be5684988357f7c3d475512dde
3
+ size 114
runs/Jan25_13-13-49_74c6fcc0d76a/other_data_train_steps_per_second_train_steps_per_second/events.out.tfevents.1674653112.74c6fcc0d76a.6394.15 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8137446c8c4e61f82f48fa9aae114a845e6dfeb92a7c77ab21829ee70f02fd8
3
+ size 112
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c31900da60517d8e262707bb255823d99cc9cacecbb33d199f06c0d6ea361798
3
  size 3631
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21aaf697c75df65d2eb5be9345e37644ec11ebb0b553a0845420f15c7671808c
3
  size 3631