diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v000/README.md b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v000/README.md new file mode 100644 index 0000000000000000000000000000000000000000..4e4d0da3c02afc62391061832f357dab811a9b16 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v000/README.md @@ -0,0 +1,202 @@ +--- +base_model: ./checkpoints/pannot-Meta-Llama-3.1-8B-Instruct-pretrain-v00/checkpoint-24000 +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.9.0 \ No newline at end of file diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v000/adapter_config.json b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v000/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..a250d8e3ab6378913bd07025eb2772b8b1cda930 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v000/adapter_config.json @@ -0,0 +1,46 @@ +{ + "alpha_pattern": {}, + "auto_mapping": null, + "base_model_name_or_path": "./checkpoints/pannot-Meta-Llama-3.1-8B-Instruct-pretrain-v00/checkpoint-24000", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 16, + "lora_dropout": 0.05, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 64, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "gate_proj", + "fc1", + "q_proj", + "down_proj", + "node_embedding", + "v_proj", + "wg", + "up_proj", + "wv", + "ws", + "k_proj", + "mm_struc_projector", + "o_proj", + "out_proj", + "embed_confidence", + "embed_gvp_input_features", + "embed_gvp_output", + "output_projection", + "wh", + "fc2" + ], + "task_type": "CAUSAL_LM", + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v000/adapter_model.safetensors b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v000/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6664c89ee56dee03b9842282e7d0fda6b85a6428 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v000/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8f19f17c6b394fa8aac507df217de3a50ca14593d281b38efa0b436e7e85005 +size 377762600 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v000/config.json b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v000/config.json new file mode 100644 index 0000000000000000000000000000000000000000..d0368db99decd84aa54530080a34aa04aae6ee22 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v000/config.json @@ -0,0 +1,57 @@ +{ + "_name_or_path": "./checkpoints/pannot-Meta-Llama-3.1-8B-Instruct-pretrain-v00/checkpoint-24000", + "architectures": [ + "PannotLlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "bos_token_id": 128000, + "eos_token_id": [ + 128001, + 128008, + 128009 + ], + "hidden_act": "silu", + "hidden_size": 4096, + "initializer_range": 0.02, + "intermediate_size": 14336, + "max_position_embeddings": 131072, + "mlp_bias": false, + "mm_projector_lr": null, + "mm_seq_hidden_size": 1280, + "mm_seq_no_pooling": true, + "mm_seq_projector_type": "linear", + "mm_seq_select_feature": "cls", + "mm_seq_select_layer": -1, + "mm_seq_tower": "ESM", + "mm_str_hidden_size": 512, + "mm_str_select_feature": "residue", + "mm_str_select_layer": -1, + "mm_struc_projector_type": "linear", + "mm_struc_tower": "ESMIF", + "mm_use_seq_start_end": false, + "mm_use_str_start_end": false, + "model_type": "pannot_llama", + "num_attention_heads": 32, + "num_hidden_layers": 32, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 8.0, + "low_freq_factor": 1.0, + "high_freq_factor": 4.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3", + "type":"llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": false, + "torch_dtype": "bfloat16", + "transformers_version": "4.37.2", + "tune_mm_mlp_adapter": false, + "use_cache": true, + "use_mm_seq_proj": true, + "use_mm_str_proj": true, + "vocab_size": 128257 +} diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v000/non_lora_trainables.bin b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v000/non_lora_trainables.bin new file mode 100644 index 0000000000000000000000000000000000000000..bffe23ce6835872e0c38de8bf2518c31b3ab1f0c --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v000/non_lora_trainables.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bfaef39d83259bc6188412e5e3bf7b3d48771904751511e6d3cd9339e30e64c +size 912 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v000/trainer_state.json b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v000/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..ffb015b57b757f075f2244eadfd53fc0f2024128 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v000/trainer_state.json @@ -0,0 +1,75762 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 0.9999603881956823, + "eval_steps": 500, + "global_step": 12622, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 5.277044854881267e-08, + "loss": 0.5484, + "step": 1 + }, + { + "epoch": 0.0, + "learning_rate": 1.0554089709762534e-07, + "loss": 0.5712, + "step": 2 + }, + { + "epoch": 0.0, + "learning_rate": 1.5831134564643802e-07, + "loss": 0.3471, + "step": 3 + }, + { + "epoch": 0.0, + "learning_rate": 2.1108179419525068e-07, + "loss": 0.5516, + "step": 4 + }, + { + "epoch": 0.0, + "learning_rate": 2.6385224274406334e-07, + "loss": 0.4672, + "step": 5 + }, + { + "epoch": 0.0, + "learning_rate": 3.1662269129287605e-07, + "loss": 0.4934, + "step": 6 + }, + { + "epoch": 0.0, + "learning_rate": 3.693931398416887e-07, + "loss": 0.6151, + "step": 7 + }, + { + "epoch": 0.0, + "learning_rate": 4.2216358839050136e-07, + "loss": 0.5, + "step": 8 + }, + { + "epoch": 0.0, + "learning_rate": 4.7493403693931397e-07, + "loss": 0.5454, + "step": 9 + }, + { + "epoch": 0.0, + "learning_rate": 5.277044854881267e-07, + "loss": 0.7022, + "step": 10 + }, + { + "epoch": 0.0, + "learning_rate": 5.804749340369393e-07, + "loss": 0.5653, + "step": 11 + }, + { + "epoch": 0.0, + "learning_rate": 6.332453825857521e-07, + "loss": 0.4582, + "step": 12 + }, + { + "epoch": 0.0, + "learning_rate": 6.860158311345646e-07, + "loss": 0.6098, + "step": 13 + }, + { + "epoch": 0.0, + "learning_rate": 7.387862796833774e-07, + "loss": 0.4902, + "step": 14 + }, + { + "epoch": 0.0, + "learning_rate": 7.915567282321901e-07, + "loss": 0.5286, + "step": 15 + }, + { + "epoch": 0.0, + "learning_rate": 8.443271767810027e-07, + "loss": 0.4537, + "step": 16 + }, + { + "epoch": 0.0, + "learning_rate": 8.970976253298154e-07, + "loss": 0.468, + "step": 17 + }, + { + "epoch": 0.0, + "learning_rate": 9.498680738786279e-07, + "loss": 0.4506, + "step": 18 + }, + { + "epoch": 0.0, + "learning_rate": 1.0026385224274407e-06, + "loss": 0.5048, + "step": 19 + }, + { + "epoch": 0.0, + "learning_rate": 1.0554089709762534e-06, + "loss": 0.421, + "step": 20 + }, + { + "epoch": 0.0, + "learning_rate": 1.108179419525066e-06, + "loss": 0.552, + "step": 21 + }, + { + "epoch": 0.0, + "learning_rate": 1.1609498680738787e-06, + "loss": 0.5861, + "step": 22 + }, + { + "epoch": 0.0, + "learning_rate": 1.2137203166226915e-06, + "loss": 0.5033, + "step": 23 + }, + { + "epoch": 0.0, + "learning_rate": 1.2664907651715042e-06, + "loss": 0.576, + "step": 24 + }, + { + "epoch": 0.0, + "learning_rate": 1.3192612137203166e-06, + "loss": 0.5959, + "step": 25 + }, + { + "epoch": 0.0, + "learning_rate": 1.3720316622691293e-06, + "loss": 0.5812, + "step": 26 + }, + { + "epoch": 0.0, + "learning_rate": 1.4248021108179422e-06, + "loss": 0.4161, + "step": 27 + }, + { + "epoch": 0.0, + "learning_rate": 1.4775725593667548e-06, + "loss": 0.519, + "step": 28 + }, + { + "epoch": 0.0, + "learning_rate": 1.5303430079155673e-06, + "loss": 0.6832, + "step": 29 + }, + { + "epoch": 0.0, + "learning_rate": 1.5831134564643801e-06, + "loss": 0.4238, + "step": 30 + }, + { + "epoch": 0.0, + "learning_rate": 1.6358839050131928e-06, + "loss": 0.4995, + "step": 31 + }, + { + "epoch": 0.0, + "learning_rate": 1.6886543535620054e-06, + "loss": 0.689, + "step": 32 + }, + { + "epoch": 0.0, + "learning_rate": 1.7414248021108183e-06, + "loss": 0.2753, + "step": 33 + }, + { + "epoch": 0.0, + "learning_rate": 1.7941952506596308e-06, + "loss": 0.4369, + "step": 34 + }, + { + "epoch": 0.0, + "learning_rate": 1.8469656992084434e-06, + "loss": 0.5408, + "step": 35 + }, + { + "epoch": 0.0, + "learning_rate": 1.8997361477572559e-06, + "loss": 0.4951, + "step": 36 + }, + { + "epoch": 0.0, + "learning_rate": 1.9525065963060687e-06, + "loss": 0.4892, + "step": 37 + }, + { + "epoch": 0.0, + "learning_rate": 2.0052770448548814e-06, + "loss": 0.4631, + "step": 38 + }, + { + "epoch": 0.0, + "learning_rate": 2.058047493403694e-06, + "loss": 0.4768, + "step": 39 + }, + { + "epoch": 0.0, + "learning_rate": 2.1108179419525067e-06, + "loss": 0.4672, + "step": 40 + }, + { + "epoch": 0.0, + "learning_rate": 2.1635883905013194e-06, + "loss": 0.4902, + "step": 41 + }, + { + "epoch": 0.0, + "learning_rate": 2.216358839050132e-06, + "loss": 0.5527, + "step": 42 + }, + { + "epoch": 0.0, + "learning_rate": 2.2691292875989447e-06, + "loss": 0.4656, + "step": 43 + }, + { + "epoch": 0.0, + "learning_rate": 2.3218997361477573e-06, + "loss": 0.5018, + "step": 44 + }, + { + "epoch": 0.0, + "learning_rate": 2.37467018469657e-06, + "loss": 0.4412, + "step": 45 + }, + { + "epoch": 0.0, + "learning_rate": 2.427440633245383e-06, + "loss": 0.4734, + "step": 46 + }, + { + "epoch": 0.0, + "learning_rate": 2.4802110817941953e-06, + "loss": 0.5094, + "step": 47 + }, + { + "epoch": 0.0, + "learning_rate": 2.5329815303430084e-06, + "loss": 0.4745, + "step": 48 + }, + { + "epoch": 0.0, + "learning_rate": 2.5857519788918206e-06, + "loss": 0.5062, + "step": 49 + }, + { + "epoch": 0.0, + "learning_rate": 2.6385224274406333e-06, + "loss": 0.3426, + "step": 50 + }, + { + "epoch": 0.0, + "learning_rate": 2.6912928759894464e-06, + "loss": 0.439, + "step": 51 + }, + { + "epoch": 0.0, + "learning_rate": 2.7440633245382586e-06, + "loss": 0.5652, + "step": 52 + }, + { + "epoch": 0.0, + "learning_rate": 2.7968337730870717e-06, + "loss": 0.5443, + "step": 53 + }, + { + "epoch": 0.0, + "learning_rate": 2.8496042216358843e-06, + "loss": 0.5024, + "step": 54 + }, + { + "epoch": 0.0, + "learning_rate": 2.9023746701846966e-06, + "loss": 0.3457, + "step": 55 + }, + { + "epoch": 0.0, + "learning_rate": 2.9551451187335096e-06, + "loss": 0.4686, + "step": 56 + }, + { + "epoch": 0.0, + "learning_rate": 3.0079155672823223e-06, + "loss": 0.3593, + "step": 57 + }, + { + "epoch": 0.0, + "learning_rate": 3.0606860158311345e-06, + "loss": 0.4398, + "step": 58 + }, + { + "epoch": 0.0, + "learning_rate": 3.1134564643799476e-06, + "loss": 0.4445, + "step": 59 + }, + { + "epoch": 0.0, + "learning_rate": 3.1662269129287603e-06, + "loss": 0.447, + "step": 60 + }, + { + "epoch": 0.0, + "learning_rate": 3.2189973614775725e-06, + "loss": 0.554, + "step": 61 + }, + { + "epoch": 0.0, + "learning_rate": 3.2717678100263856e-06, + "loss": 0.4652, + "step": 62 + }, + { + "epoch": 0.0, + "learning_rate": 3.3245382585751982e-06, + "loss": 0.527, + "step": 63 + }, + { + "epoch": 0.01, + "learning_rate": 3.377308707124011e-06, + "loss": 0.5207, + "step": 64 + }, + { + "epoch": 0.01, + "learning_rate": 3.4300791556728235e-06, + "loss": 0.5138, + "step": 65 + }, + { + "epoch": 0.01, + "learning_rate": 3.4828496042216366e-06, + "loss": 0.3909, + "step": 66 + }, + { + "epoch": 0.01, + "learning_rate": 3.535620052770449e-06, + "loss": 0.3827, + "step": 67 + }, + { + "epoch": 0.01, + "learning_rate": 3.5883905013192615e-06, + "loss": 0.4755, + "step": 68 + }, + { + "epoch": 0.01, + "learning_rate": 3.6411609498680746e-06, + "loss": 0.552, + "step": 69 + }, + { + "epoch": 0.01, + "learning_rate": 3.693931398416887e-06, + "loss": 0.4365, + "step": 70 + }, + { + "epoch": 0.01, + "learning_rate": 3.7467018469656995e-06, + "loss": 0.6031, + "step": 71 + }, + { + "epoch": 0.01, + "learning_rate": 3.7994722955145117e-06, + "loss": 0.68, + "step": 72 + }, + { + "epoch": 0.01, + "learning_rate": 3.852242744063324e-06, + "loss": 0.5197, + "step": 73 + }, + { + "epoch": 0.01, + "learning_rate": 3.9050131926121375e-06, + "loss": 0.4486, + "step": 74 + }, + { + "epoch": 0.01, + "learning_rate": 3.95778364116095e-06, + "loss": 0.4635, + "step": 75 + }, + { + "epoch": 0.01, + "learning_rate": 4.010554089709763e-06, + "loss": 0.5978, + "step": 76 + }, + { + "epoch": 0.01, + "learning_rate": 4.063324538258576e-06, + "loss": 0.4959, + "step": 77 + }, + { + "epoch": 0.01, + "learning_rate": 4.116094986807388e-06, + "loss": 0.605, + "step": 78 + }, + { + "epoch": 0.01, + "learning_rate": 4.168865435356201e-06, + "loss": 0.5458, + "step": 79 + }, + { + "epoch": 0.01, + "learning_rate": 4.221635883905013e-06, + "loss": 0.5247, + "step": 80 + }, + { + "epoch": 0.01, + "learning_rate": 4.274406332453826e-06, + "loss": 0.3924, + "step": 81 + }, + { + "epoch": 0.01, + "learning_rate": 4.327176781002639e-06, + "loss": 0.4956, + "step": 82 + }, + { + "epoch": 0.01, + "learning_rate": 4.379947229551452e-06, + "loss": 0.4864, + "step": 83 + }, + { + "epoch": 0.01, + "learning_rate": 4.432717678100264e-06, + "loss": 0.4362, + "step": 84 + }, + { + "epoch": 0.01, + "learning_rate": 4.485488126649077e-06, + "loss": 0.5678, + "step": 85 + }, + { + "epoch": 0.01, + "learning_rate": 4.538258575197889e-06, + "loss": 0.4097, + "step": 86 + }, + { + "epoch": 0.01, + "learning_rate": 4.5910290237467024e-06, + "loss": 0.4862, + "step": 87 + }, + { + "epoch": 0.01, + "learning_rate": 4.643799472295515e-06, + "loss": 0.5886, + "step": 88 + }, + { + "epoch": 0.01, + "learning_rate": 4.696569920844328e-06, + "loss": 0.5072, + "step": 89 + }, + { + "epoch": 0.01, + "learning_rate": 4.74934036939314e-06, + "loss": 0.5908, + "step": 90 + }, + { + "epoch": 0.01, + "learning_rate": 4.802110817941953e-06, + "loss": 0.3937, + "step": 91 + }, + { + "epoch": 0.01, + "learning_rate": 4.854881266490766e-06, + "loss": 0.6338, + "step": 92 + }, + { + "epoch": 0.01, + "learning_rate": 4.907651715039578e-06, + "loss": 0.4323, + "step": 93 + }, + { + "epoch": 0.01, + "learning_rate": 4.960422163588391e-06, + "loss": 0.4448, + "step": 94 + }, + { + "epoch": 0.01, + "learning_rate": 5.013192612137203e-06, + "loss": 0.5013, + "step": 95 + }, + { + "epoch": 0.01, + "learning_rate": 5.065963060686017e-06, + "loss": 0.449, + "step": 96 + }, + { + "epoch": 0.01, + "learning_rate": 5.118733509234829e-06, + "loss": 0.5521, + "step": 97 + }, + { + "epoch": 0.01, + "learning_rate": 5.171503957783641e-06, + "loss": 0.4838, + "step": 98 + }, + { + "epoch": 0.01, + "learning_rate": 5.224274406332454e-06, + "loss": 0.3994, + "step": 99 + }, + { + "epoch": 0.01, + "learning_rate": 5.2770448548812665e-06, + "loss": 0.4433, + "step": 100 + }, + { + "epoch": 0.01, + "learning_rate": 5.32981530343008e-06, + "loss": 0.5692, + "step": 101 + }, + { + "epoch": 0.01, + "learning_rate": 5.382585751978893e-06, + "loss": 0.4939, + "step": 102 + }, + { + "epoch": 0.01, + "learning_rate": 5.435356200527705e-06, + "loss": 0.5006, + "step": 103 + }, + { + "epoch": 0.01, + "learning_rate": 5.488126649076517e-06, + "loss": 0.6119, + "step": 104 + }, + { + "epoch": 0.01, + "learning_rate": 5.540897097625331e-06, + "loss": 0.5193, + "step": 105 + }, + { + "epoch": 0.01, + "learning_rate": 5.593667546174143e-06, + "loss": 0.531, + "step": 106 + }, + { + "epoch": 0.01, + "learning_rate": 5.6464379947229556e-06, + "loss": 0.553, + "step": 107 + }, + { + "epoch": 0.01, + "learning_rate": 5.699208443271769e-06, + "loss": 0.5276, + "step": 108 + }, + { + "epoch": 0.01, + "learning_rate": 5.751978891820581e-06, + "loss": 0.5054, + "step": 109 + }, + { + "epoch": 0.01, + "learning_rate": 5.804749340369393e-06, + "loss": 0.4162, + "step": 110 + }, + { + "epoch": 0.01, + "learning_rate": 5.857519788918207e-06, + "loss": 0.4507, + "step": 111 + }, + { + "epoch": 0.01, + "learning_rate": 5.910290237467019e-06, + "loss": 0.4423, + "step": 112 + }, + { + "epoch": 0.01, + "learning_rate": 5.9630606860158315e-06, + "loss": 0.666, + "step": 113 + }, + { + "epoch": 0.01, + "learning_rate": 6.015831134564645e-06, + "loss": 0.3538, + "step": 114 + }, + { + "epoch": 0.01, + "learning_rate": 6.068601583113457e-06, + "loss": 0.5266, + "step": 115 + }, + { + "epoch": 0.01, + "learning_rate": 6.121372031662269e-06, + "loss": 0.5874, + "step": 116 + }, + { + "epoch": 0.01, + "learning_rate": 6.174142480211083e-06, + "loss": 0.6413, + "step": 117 + }, + { + "epoch": 0.01, + "learning_rate": 6.226912928759895e-06, + "loss": 0.4947, + "step": 118 + }, + { + "epoch": 0.01, + "learning_rate": 6.2796833773087074e-06, + "loss": 0.4201, + "step": 119 + }, + { + "epoch": 0.01, + "learning_rate": 6.3324538258575205e-06, + "loss": 0.5365, + "step": 120 + }, + { + "epoch": 0.01, + "learning_rate": 6.385224274406333e-06, + "loss": 0.4985, + "step": 121 + }, + { + "epoch": 0.01, + "learning_rate": 6.437994722955145e-06, + "loss": 0.4793, + "step": 122 + }, + { + "epoch": 0.01, + "learning_rate": 6.490765171503959e-06, + "loss": 0.5136, + "step": 123 + }, + { + "epoch": 0.01, + "learning_rate": 6.543535620052771e-06, + "loss": 0.5292, + "step": 124 + }, + { + "epoch": 0.01, + "learning_rate": 6.596306068601583e-06, + "loss": 0.5644, + "step": 125 + }, + { + "epoch": 0.01, + "learning_rate": 6.6490765171503965e-06, + "loss": 0.5366, + "step": 126 + }, + { + "epoch": 0.01, + "learning_rate": 6.701846965699209e-06, + "loss": 0.3492, + "step": 127 + }, + { + "epoch": 0.01, + "learning_rate": 6.754617414248022e-06, + "loss": 0.4335, + "step": 128 + }, + { + "epoch": 0.01, + "learning_rate": 6.807387862796835e-06, + "loss": 0.5587, + "step": 129 + }, + { + "epoch": 0.01, + "learning_rate": 6.860158311345647e-06, + "loss": 0.6136, + "step": 130 + }, + { + "epoch": 0.01, + "learning_rate": 6.912928759894459e-06, + "loss": 0.4934, + "step": 131 + }, + { + "epoch": 0.01, + "learning_rate": 6.965699208443273e-06, + "loss": 0.542, + "step": 132 + }, + { + "epoch": 0.01, + "learning_rate": 7.0184696569920855e-06, + "loss": 0.6283, + "step": 133 + }, + { + "epoch": 0.01, + "learning_rate": 7.071240105540898e-06, + "loss": 0.4908, + "step": 134 + }, + { + "epoch": 0.01, + "learning_rate": 7.124010554089711e-06, + "loss": 0.5885, + "step": 135 + }, + { + "epoch": 0.01, + "learning_rate": 7.176781002638523e-06, + "loss": 0.6095, + "step": 136 + }, + { + "epoch": 0.01, + "learning_rate": 7.229551451187335e-06, + "loss": 0.5101, + "step": 137 + }, + { + "epoch": 0.01, + "learning_rate": 7.282321899736149e-06, + "loss": 0.5876, + "step": 138 + }, + { + "epoch": 0.01, + "learning_rate": 7.3350923482849614e-06, + "loss": 0.4332, + "step": 139 + }, + { + "epoch": 0.01, + "learning_rate": 7.387862796833774e-06, + "loss": 0.518, + "step": 140 + }, + { + "epoch": 0.01, + "learning_rate": 7.440633245382587e-06, + "loss": 0.4361, + "step": 141 + }, + { + "epoch": 0.01, + "learning_rate": 7.493403693931399e-06, + "loss": 0.382, + "step": 142 + }, + { + "epoch": 0.01, + "learning_rate": 7.546174142480211e-06, + "loss": 0.3682, + "step": 143 + }, + { + "epoch": 0.01, + "learning_rate": 7.5989445910290234e-06, + "loss": 0.5955, + "step": 144 + }, + { + "epoch": 0.01, + "learning_rate": 7.651715039577837e-06, + "loss": 0.506, + "step": 145 + }, + { + "epoch": 0.01, + "learning_rate": 7.704485488126649e-06, + "loss": 0.4097, + "step": 146 + }, + { + "epoch": 0.01, + "learning_rate": 7.757255936675462e-06, + "loss": 0.5349, + "step": 147 + }, + { + "epoch": 0.01, + "learning_rate": 7.810026385224275e-06, + "loss": 0.392, + "step": 148 + }, + { + "epoch": 0.01, + "learning_rate": 7.862796833773088e-06, + "loss": 0.5652, + "step": 149 + }, + { + "epoch": 0.01, + "learning_rate": 7.9155672823219e-06, + "loss": 0.4713, + "step": 150 + }, + { + "epoch": 0.01, + "learning_rate": 7.968337730870712e-06, + "loss": 0.374, + "step": 151 + }, + { + "epoch": 0.01, + "learning_rate": 8.021108179419526e-06, + "loss": 0.5669, + "step": 152 + }, + { + "epoch": 0.01, + "learning_rate": 8.073878627968339e-06, + "loss": 0.4861, + "step": 153 + }, + { + "epoch": 0.01, + "learning_rate": 8.126649076517152e-06, + "loss": 0.4685, + "step": 154 + }, + { + "epoch": 0.01, + "learning_rate": 8.179419525065963e-06, + "loss": 0.4767, + "step": 155 + }, + { + "epoch": 0.01, + "learning_rate": 8.232189973614776e-06, + "loss": 0.4682, + "step": 156 + }, + { + "epoch": 0.01, + "learning_rate": 8.28496042216359e-06, + "loss": 0.421, + "step": 157 + }, + { + "epoch": 0.01, + "learning_rate": 8.337730870712402e-06, + "loss": 0.5517, + "step": 158 + }, + { + "epoch": 0.01, + "learning_rate": 8.390501319261214e-06, + "loss": 0.5352, + "step": 159 + }, + { + "epoch": 0.01, + "learning_rate": 8.443271767810027e-06, + "loss": 0.5637, + "step": 160 + }, + { + "epoch": 0.01, + "learning_rate": 8.49604221635884e-06, + "loss": 0.4665, + "step": 161 + }, + { + "epoch": 0.01, + "learning_rate": 8.548812664907651e-06, + "loss": 0.4397, + "step": 162 + }, + { + "epoch": 0.01, + "learning_rate": 8.601583113456466e-06, + "loss": 0.3153, + "step": 163 + }, + { + "epoch": 0.01, + "learning_rate": 8.654353562005277e-06, + "loss": 0.5395, + "step": 164 + }, + { + "epoch": 0.01, + "learning_rate": 8.70712401055409e-06, + "loss": 0.5231, + "step": 165 + }, + { + "epoch": 0.01, + "learning_rate": 8.759894459102904e-06, + "loss": 0.3702, + "step": 166 + }, + { + "epoch": 0.01, + "learning_rate": 8.812664907651715e-06, + "loss": 0.6472, + "step": 167 + }, + { + "epoch": 0.01, + "learning_rate": 8.865435356200528e-06, + "loss": 0.4293, + "step": 168 + }, + { + "epoch": 0.01, + "learning_rate": 8.918205804749341e-06, + "loss": 0.3716, + "step": 169 + }, + { + "epoch": 0.01, + "learning_rate": 8.970976253298154e-06, + "loss": 0.6373, + "step": 170 + }, + { + "epoch": 0.01, + "learning_rate": 9.023746701846966e-06, + "loss": 0.5078, + "step": 171 + }, + { + "epoch": 0.01, + "learning_rate": 9.076517150395779e-06, + "loss": 0.5946, + "step": 172 + }, + { + "epoch": 0.01, + "learning_rate": 9.129287598944592e-06, + "loss": 0.6085, + "step": 173 + }, + { + "epoch": 0.01, + "learning_rate": 9.182058047493405e-06, + "loss": 0.3978, + "step": 174 + }, + { + "epoch": 0.01, + "learning_rate": 9.234828496042218e-06, + "loss": 0.5055, + "step": 175 + }, + { + "epoch": 0.01, + "learning_rate": 9.28759894459103e-06, + "loss": 0.5559, + "step": 176 + }, + { + "epoch": 0.01, + "learning_rate": 9.340369393139842e-06, + "loss": 0.4761, + "step": 177 + }, + { + "epoch": 0.01, + "learning_rate": 9.393139841688655e-06, + "loss": 0.5185, + "step": 178 + }, + { + "epoch": 0.01, + "learning_rate": 9.445910290237469e-06, + "loss": 0.4974, + "step": 179 + }, + { + "epoch": 0.01, + "learning_rate": 9.49868073878628e-06, + "loss": 0.3948, + "step": 180 + }, + { + "epoch": 0.01, + "learning_rate": 9.551451187335093e-06, + "loss": 0.6213, + "step": 181 + }, + { + "epoch": 0.01, + "learning_rate": 9.604221635883906e-06, + "loss": 0.5719, + "step": 182 + }, + { + "epoch": 0.01, + "learning_rate": 9.656992084432717e-06, + "loss": 0.3942, + "step": 183 + }, + { + "epoch": 0.01, + "learning_rate": 9.709762532981532e-06, + "loss": 0.5803, + "step": 184 + }, + { + "epoch": 0.01, + "learning_rate": 9.762532981530344e-06, + "loss": 0.5586, + "step": 185 + }, + { + "epoch": 0.01, + "learning_rate": 9.815303430079157e-06, + "loss": 0.497, + "step": 186 + }, + { + "epoch": 0.01, + "learning_rate": 9.86807387862797e-06, + "loss": 0.5329, + "step": 187 + }, + { + "epoch": 0.01, + "learning_rate": 9.920844327176781e-06, + "loss": 0.4446, + "step": 188 + }, + { + "epoch": 0.01, + "learning_rate": 9.973614775725594e-06, + "loss": 0.5594, + "step": 189 + }, + { + "epoch": 0.02, + "learning_rate": 1.0026385224274406e-05, + "loss": 0.5282, + "step": 190 + }, + { + "epoch": 0.02, + "learning_rate": 1.007915567282322e-05, + "loss": 0.5399, + "step": 191 + }, + { + "epoch": 0.02, + "learning_rate": 1.0131926121372034e-05, + "loss": 0.3619, + "step": 192 + }, + { + "epoch": 0.02, + "learning_rate": 1.0184696569920845e-05, + "loss": 0.6154, + "step": 193 + }, + { + "epoch": 0.02, + "learning_rate": 1.0237467018469658e-05, + "loss": 0.4055, + "step": 194 + }, + { + "epoch": 0.02, + "learning_rate": 1.0290237467018471e-05, + "loss": 0.4228, + "step": 195 + }, + { + "epoch": 0.02, + "learning_rate": 1.0343007915567282e-05, + "loss": 0.4591, + "step": 196 + }, + { + "epoch": 0.02, + "learning_rate": 1.0395778364116096e-05, + "loss": 0.4531, + "step": 197 + }, + { + "epoch": 0.02, + "learning_rate": 1.0448548812664909e-05, + "loss": 0.5329, + "step": 198 + }, + { + "epoch": 0.02, + "learning_rate": 1.050131926121372e-05, + "loss": 0.4139, + "step": 199 + }, + { + "epoch": 0.02, + "learning_rate": 1.0554089709762533e-05, + "loss": 0.4325, + "step": 200 + }, + { + "epoch": 0.02, + "learning_rate": 1.0606860158311348e-05, + "loss": 0.5113, + "step": 201 + }, + { + "epoch": 0.02, + "learning_rate": 1.065963060686016e-05, + "loss": 0.4701, + "step": 202 + }, + { + "epoch": 0.02, + "learning_rate": 1.0712401055408972e-05, + "loss": 0.4778, + "step": 203 + }, + { + "epoch": 0.02, + "learning_rate": 1.0765171503957785e-05, + "loss": 0.437, + "step": 204 + }, + { + "epoch": 0.02, + "learning_rate": 1.0817941952506597e-05, + "loss": 0.4914, + "step": 205 + }, + { + "epoch": 0.02, + "learning_rate": 1.087071240105541e-05, + "loss": 0.4732, + "step": 206 + }, + { + "epoch": 0.02, + "learning_rate": 1.0923482849604223e-05, + "loss": 0.5248, + "step": 207 + }, + { + "epoch": 0.02, + "learning_rate": 1.0976253298153034e-05, + "loss": 0.4656, + "step": 208 + }, + { + "epoch": 0.02, + "learning_rate": 1.1029023746701847e-05, + "loss": 0.527, + "step": 209 + }, + { + "epoch": 0.02, + "learning_rate": 1.1081794195250662e-05, + "loss": 0.528, + "step": 210 + }, + { + "epoch": 0.02, + "learning_rate": 1.1134564643799472e-05, + "loss": 0.3635, + "step": 211 + }, + { + "epoch": 0.02, + "learning_rate": 1.1187335092348287e-05, + "loss": 0.4237, + "step": 212 + }, + { + "epoch": 0.02, + "learning_rate": 1.12401055408971e-05, + "loss": 0.5188, + "step": 213 + }, + { + "epoch": 0.02, + "learning_rate": 1.1292875989445911e-05, + "loss": 0.5728, + "step": 214 + }, + { + "epoch": 0.02, + "learning_rate": 1.1345646437994724e-05, + "loss": 0.5543, + "step": 215 + }, + { + "epoch": 0.02, + "learning_rate": 1.1398416886543537e-05, + "loss": 0.547, + "step": 216 + }, + { + "epoch": 0.02, + "learning_rate": 1.1451187335092349e-05, + "loss": 0.4752, + "step": 217 + }, + { + "epoch": 0.02, + "learning_rate": 1.1503957783641162e-05, + "loss": 0.3026, + "step": 218 + }, + { + "epoch": 0.02, + "learning_rate": 1.1556728232189975e-05, + "loss": 0.4353, + "step": 219 + }, + { + "epoch": 0.02, + "learning_rate": 1.1609498680738786e-05, + "loss": 0.4915, + "step": 220 + }, + { + "epoch": 0.02, + "learning_rate": 1.16622691292876e-05, + "loss": 0.5688, + "step": 221 + }, + { + "epoch": 0.02, + "learning_rate": 1.1715039577836414e-05, + "loss": 0.6301, + "step": 222 + }, + { + "epoch": 0.02, + "learning_rate": 1.1767810026385225e-05, + "loss": 0.549, + "step": 223 + }, + { + "epoch": 0.02, + "learning_rate": 1.1820580474934039e-05, + "loss": 0.512, + "step": 224 + }, + { + "epoch": 0.02, + "learning_rate": 1.1873350923482852e-05, + "loss": 0.5317, + "step": 225 + }, + { + "epoch": 0.02, + "learning_rate": 1.1926121372031663e-05, + "loss": 0.5692, + "step": 226 + }, + { + "epoch": 0.02, + "learning_rate": 1.1978891820580476e-05, + "loss": 0.4103, + "step": 227 + }, + { + "epoch": 0.02, + "learning_rate": 1.203166226912929e-05, + "loss": 0.4389, + "step": 228 + }, + { + "epoch": 0.02, + "learning_rate": 1.20844327176781e-05, + "loss": 0.5522, + "step": 229 + }, + { + "epoch": 0.02, + "learning_rate": 1.2137203166226914e-05, + "loss": 0.5842, + "step": 230 + }, + { + "epoch": 0.02, + "learning_rate": 1.2189973614775727e-05, + "loss": 0.4094, + "step": 231 + }, + { + "epoch": 0.02, + "learning_rate": 1.2242744063324538e-05, + "loss": 0.49, + "step": 232 + }, + { + "epoch": 0.02, + "learning_rate": 1.2295514511873353e-05, + "loss": 0.5449, + "step": 233 + }, + { + "epoch": 0.02, + "learning_rate": 1.2348284960422166e-05, + "loss": 0.4754, + "step": 234 + }, + { + "epoch": 0.02, + "learning_rate": 1.2401055408970977e-05, + "loss": 0.4352, + "step": 235 + }, + { + "epoch": 0.02, + "learning_rate": 1.245382585751979e-05, + "loss": 0.5255, + "step": 236 + }, + { + "epoch": 0.02, + "learning_rate": 1.2506596306068604e-05, + "loss": 0.4887, + "step": 237 + }, + { + "epoch": 0.02, + "learning_rate": 1.2559366754617415e-05, + "loss": 0.5344, + "step": 238 + }, + { + "epoch": 0.02, + "learning_rate": 1.2612137203166228e-05, + "loss": 0.6626, + "step": 239 + }, + { + "epoch": 0.02, + "learning_rate": 1.2664907651715041e-05, + "loss": 0.4302, + "step": 240 + }, + { + "epoch": 0.02, + "learning_rate": 1.2717678100263852e-05, + "loss": 0.5362, + "step": 241 + }, + { + "epoch": 0.02, + "learning_rate": 1.2770448548812666e-05, + "loss": 0.4696, + "step": 242 + }, + { + "epoch": 0.02, + "learning_rate": 1.282321899736148e-05, + "loss": 0.4109, + "step": 243 + }, + { + "epoch": 0.02, + "learning_rate": 1.287598944591029e-05, + "loss": 0.4088, + "step": 244 + }, + { + "epoch": 0.02, + "learning_rate": 1.2928759894459105e-05, + "loss": 0.5432, + "step": 245 + }, + { + "epoch": 0.02, + "learning_rate": 1.2981530343007918e-05, + "loss": 0.5071, + "step": 246 + }, + { + "epoch": 0.02, + "learning_rate": 1.303430079155673e-05, + "loss": 0.4557, + "step": 247 + }, + { + "epoch": 0.02, + "learning_rate": 1.3087071240105542e-05, + "loss": 0.6173, + "step": 248 + }, + { + "epoch": 0.02, + "learning_rate": 1.3139841688654355e-05, + "loss": 0.4259, + "step": 249 + }, + { + "epoch": 0.02, + "learning_rate": 1.3192612137203167e-05, + "loss": 0.5968, + "step": 250 + }, + { + "epoch": 0.02, + "learning_rate": 1.324538258575198e-05, + "loss": 0.3718, + "step": 251 + }, + { + "epoch": 0.02, + "learning_rate": 1.3298153034300793e-05, + "loss": 0.5886, + "step": 252 + }, + { + "epoch": 0.02, + "learning_rate": 1.3350923482849604e-05, + "loss": 0.4247, + "step": 253 + }, + { + "epoch": 0.02, + "learning_rate": 1.3403693931398417e-05, + "loss": 0.5633, + "step": 254 + }, + { + "epoch": 0.02, + "learning_rate": 1.3456464379947232e-05, + "loss": 0.5082, + "step": 255 + }, + { + "epoch": 0.02, + "learning_rate": 1.3509234828496044e-05, + "loss": 0.5633, + "step": 256 + }, + { + "epoch": 0.02, + "learning_rate": 1.3562005277044857e-05, + "loss": 0.5056, + "step": 257 + }, + { + "epoch": 0.02, + "learning_rate": 1.361477572559367e-05, + "loss": 0.5454, + "step": 258 + }, + { + "epoch": 0.02, + "learning_rate": 1.3667546174142481e-05, + "loss": 0.52, + "step": 259 + }, + { + "epoch": 0.02, + "learning_rate": 1.3720316622691294e-05, + "loss": 0.6794, + "step": 260 + }, + { + "epoch": 0.02, + "learning_rate": 1.3773087071240107e-05, + "loss": 0.545, + "step": 261 + }, + { + "epoch": 0.02, + "learning_rate": 1.3825857519788919e-05, + "loss": 0.441, + "step": 262 + }, + { + "epoch": 0.02, + "learning_rate": 1.3878627968337732e-05, + "loss": 0.6181, + "step": 263 + }, + { + "epoch": 0.02, + "learning_rate": 1.3931398416886547e-05, + "loss": 0.6882, + "step": 264 + }, + { + "epoch": 0.02, + "learning_rate": 1.3984168865435356e-05, + "loss": 0.4743, + "step": 265 + }, + { + "epoch": 0.02, + "learning_rate": 1.4036939313984171e-05, + "loss": 0.4379, + "step": 266 + }, + { + "epoch": 0.02, + "learning_rate": 1.4089709762532984e-05, + "loss": 0.597, + "step": 267 + }, + { + "epoch": 0.02, + "learning_rate": 1.4142480211081795e-05, + "loss": 0.5952, + "step": 268 + }, + { + "epoch": 0.02, + "learning_rate": 1.4195250659630609e-05, + "loss": 0.4887, + "step": 269 + }, + { + "epoch": 0.02, + "learning_rate": 1.4248021108179422e-05, + "loss": 0.4755, + "step": 270 + }, + { + "epoch": 0.02, + "learning_rate": 1.4300791556728233e-05, + "loss": 0.5067, + "step": 271 + }, + { + "epoch": 0.02, + "learning_rate": 1.4353562005277046e-05, + "loss": 0.4125, + "step": 272 + }, + { + "epoch": 0.02, + "learning_rate": 1.440633245382586e-05, + "loss": 0.4479, + "step": 273 + }, + { + "epoch": 0.02, + "learning_rate": 1.445910290237467e-05, + "loss": 0.6593, + "step": 274 + }, + { + "epoch": 0.02, + "learning_rate": 1.4511873350923484e-05, + "loss": 0.6088, + "step": 275 + }, + { + "epoch": 0.02, + "learning_rate": 1.4564643799472298e-05, + "loss": 0.682, + "step": 276 + }, + { + "epoch": 0.02, + "learning_rate": 1.461741424802111e-05, + "loss": 0.3218, + "step": 277 + }, + { + "epoch": 0.02, + "learning_rate": 1.4670184696569923e-05, + "loss": 0.482, + "step": 278 + }, + { + "epoch": 0.02, + "learning_rate": 1.4722955145118736e-05, + "loss": 0.3646, + "step": 279 + }, + { + "epoch": 0.02, + "learning_rate": 1.4775725593667547e-05, + "loss": 0.6439, + "step": 280 + }, + { + "epoch": 0.02, + "learning_rate": 1.482849604221636e-05, + "loss": 0.5493, + "step": 281 + }, + { + "epoch": 0.02, + "learning_rate": 1.4881266490765173e-05, + "loss": 0.5587, + "step": 282 + }, + { + "epoch": 0.02, + "learning_rate": 1.4934036939313985e-05, + "loss": 0.5777, + "step": 283 + }, + { + "epoch": 0.02, + "learning_rate": 1.4986807387862798e-05, + "loss": 0.4697, + "step": 284 + }, + { + "epoch": 0.02, + "learning_rate": 1.503957783641161e-05, + "loss": 0.4482, + "step": 285 + }, + { + "epoch": 0.02, + "learning_rate": 1.5092348284960422e-05, + "loss": 0.5034, + "step": 286 + }, + { + "epoch": 0.02, + "learning_rate": 1.5145118733509237e-05, + "loss": 0.5931, + "step": 287 + }, + { + "epoch": 0.02, + "learning_rate": 1.5197889182058047e-05, + "loss": 0.4914, + "step": 288 + }, + { + "epoch": 0.02, + "learning_rate": 1.5250659630606862e-05, + "loss": 0.6395, + "step": 289 + }, + { + "epoch": 0.02, + "learning_rate": 1.5303430079155675e-05, + "loss": 0.5475, + "step": 290 + }, + { + "epoch": 0.02, + "learning_rate": 1.5356200527704484e-05, + "loss": 0.4601, + "step": 291 + }, + { + "epoch": 0.02, + "learning_rate": 1.5408970976253298e-05, + "loss": 0.6117, + "step": 292 + }, + { + "epoch": 0.02, + "learning_rate": 1.5461741424802114e-05, + "loss": 0.4752, + "step": 293 + }, + { + "epoch": 0.02, + "learning_rate": 1.5514511873350924e-05, + "loss": 0.4157, + "step": 294 + }, + { + "epoch": 0.02, + "learning_rate": 1.5567282321899737e-05, + "loss": 0.5167, + "step": 295 + }, + { + "epoch": 0.02, + "learning_rate": 1.562005277044855e-05, + "loss": 0.4771, + "step": 296 + }, + { + "epoch": 0.02, + "learning_rate": 1.5672823218997363e-05, + "loss": 0.5003, + "step": 297 + }, + { + "epoch": 0.02, + "learning_rate": 1.5725593667546176e-05, + "loss": 0.5939, + "step": 298 + }, + { + "epoch": 0.02, + "learning_rate": 1.577836411609499e-05, + "loss": 0.7057, + "step": 299 + }, + { + "epoch": 0.02, + "learning_rate": 1.58311345646438e-05, + "loss": 0.5738, + "step": 300 + }, + { + "epoch": 0.02, + "learning_rate": 1.5883905013192612e-05, + "loss": 0.4542, + "step": 301 + }, + { + "epoch": 0.02, + "learning_rate": 1.5936675461741425e-05, + "loss": 0.4689, + "step": 302 + }, + { + "epoch": 0.02, + "learning_rate": 1.5989445910290238e-05, + "loss": 0.4119, + "step": 303 + }, + { + "epoch": 0.02, + "learning_rate": 1.604221635883905e-05, + "loss": 0.4173, + "step": 304 + }, + { + "epoch": 0.02, + "learning_rate": 1.6094986807387864e-05, + "loss": 0.6227, + "step": 305 + }, + { + "epoch": 0.02, + "learning_rate": 1.6147757255936677e-05, + "loss": 0.4235, + "step": 306 + }, + { + "epoch": 0.02, + "learning_rate": 1.620052770448549e-05, + "loss": 0.5409, + "step": 307 + }, + { + "epoch": 0.02, + "learning_rate": 1.6253298153034303e-05, + "loss": 0.5373, + "step": 308 + }, + { + "epoch": 0.02, + "learning_rate": 1.6306068601583113e-05, + "loss": 0.467, + "step": 309 + }, + { + "epoch": 0.02, + "learning_rate": 1.6358839050131926e-05, + "loss": 0.4264, + "step": 310 + }, + { + "epoch": 0.02, + "learning_rate": 1.641160949868074e-05, + "loss": 0.5674, + "step": 311 + }, + { + "epoch": 0.02, + "learning_rate": 1.6464379947229552e-05, + "loss": 0.4211, + "step": 312 + }, + { + "epoch": 0.02, + "learning_rate": 1.6517150395778365e-05, + "loss": 0.5324, + "step": 313 + }, + { + "epoch": 0.02, + "learning_rate": 1.656992084432718e-05, + "loss": 0.514, + "step": 314 + }, + { + "epoch": 0.02, + "learning_rate": 1.6622691292875988e-05, + "loss": 0.4171, + "step": 315 + }, + { + "epoch": 0.03, + "learning_rate": 1.6675461741424805e-05, + "loss": 0.5573, + "step": 316 + }, + { + "epoch": 0.03, + "learning_rate": 1.6728232189973618e-05, + "loss": 0.4072, + "step": 317 + }, + { + "epoch": 0.03, + "learning_rate": 1.6781002638522427e-05, + "loss": 0.4735, + "step": 318 + }, + { + "epoch": 0.03, + "learning_rate": 1.683377308707124e-05, + "loss": 0.5461, + "step": 319 + }, + { + "epoch": 0.03, + "learning_rate": 1.6886543535620054e-05, + "loss": 0.4304, + "step": 320 + }, + { + "epoch": 0.03, + "learning_rate": 1.6939313984168867e-05, + "loss": 0.4202, + "step": 321 + }, + { + "epoch": 0.03, + "learning_rate": 1.699208443271768e-05, + "loss": 0.4572, + "step": 322 + }, + { + "epoch": 0.03, + "learning_rate": 1.7044854881266493e-05, + "loss": 0.5163, + "step": 323 + }, + { + "epoch": 0.03, + "learning_rate": 1.7097625329815303e-05, + "loss": 0.5066, + "step": 324 + }, + { + "epoch": 0.03, + "learning_rate": 1.7150395778364116e-05, + "loss": 0.4231, + "step": 325 + }, + { + "epoch": 0.03, + "learning_rate": 1.7203166226912932e-05, + "loss": 0.5945, + "step": 326 + }, + { + "epoch": 0.03, + "learning_rate": 1.7255936675461742e-05, + "loss": 0.6386, + "step": 327 + }, + { + "epoch": 0.03, + "learning_rate": 1.7308707124010555e-05, + "loss": 0.5473, + "step": 328 + }, + { + "epoch": 0.03, + "learning_rate": 1.7361477572559368e-05, + "loss": 0.5394, + "step": 329 + }, + { + "epoch": 0.03, + "learning_rate": 1.741424802110818e-05, + "loss": 0.5138, + "step": 330 + }, + { + "epoch": 0.03, + "learning_rate": 1.7467018469656994e-05, + "loss": 0.5968, + "step": 331 + }, + { + "epoch": 0.03, + "learning_rate": 1.7519788918205807e-05, + "loss": 0.4336, + "step": 332 + }, + { + "epoch": 0.03, + "learning_rate": 1.7572559366754617e-05, + "loss": 0.5357, + "step": 333 + }, + { + "epoch": 0.03, + "learning_rate": 1.762532981530343e-05, + "loss": 0.3987, + "step": 334 + }, + { + "epoch": 0.03, + "learning_rate": 1.7678100263852246e-05, + "loss": 0.4486, + "step": 335 + }, + { + "epoch": 0.03, + "learning_rate": 1.7730870712401056e-05, + "loss": 0.5239, + "step": 336 + }, + { + "epoch": 0.03, + "learning_rate": 1.778364116094987e-05, + "loss": 0.4993, + "step": 337 + }, + { + "epoch": 0.03, + "learning_rate": 1.7836411609498682e-05, + "loss": 0.3837, + "step": 338 + }, + { + "epoch": 0.03, + "learning_rate": 1.7889182058047495e-05, + "loss": 0.4153, + "step": 339 + }, + { + "epoch": 0.03, + "learning_rate": 1.794195250659631e-05, + "loss": 0.6075, + "step": 340 + }, + { + "epoch": 0.03, + "learning_rate": 1.799472295514512e-05, + "loss": 0.6715, + "step": 341 + }, + { + "epoch": 0.03, + "learning_rate": 1.804749340369393e-05, + "loss": 0.6202, + "step": 342 + }, + { + "epoch": 0.03, + "learning_rate": 1.8100263852242744e-05, + "loss": 0.3846, + "step": 343 + }, + { + "epoch": 0.03, + "learning_rate": 1.8153034300791557e-05, + "loss": 0.4731, + "step": 344 + }, + { + "epoch": 0.03, + "learning_rate": 1.820580474934037e-05, + "loss": 0.4758, + "step": 345 + }, + { + "epoch": 0.03, + "learning_rate": 1.8258575197889184e-05, + "loss": 0.5357, + "step": 346 + }, + { + "epoch": 0.03, + "learning_rate": 1.8311345646437997e-05, + "loss": 0.4572, + "step": 347 + }, + { + "epoch": 0.03, + "learning_rate": 1.836411609498681e-05, + "loss": 0.3958, + "step": 348 + }, + { + "epoch": 0.03, + "learning_rate": 1.8416886543535623e-05, + "loss": 0.6442, + "step": 349 + }, + { + "epoch": 0.03, + "learning_rate": 1.8469656992084436e-05, + "loss": 0.4247, + "step": 350 + }, + { + "epoch": 0.03, + "learning_rate": 1.8522427440633246e-05, + "loss": 0.482, + "step": 351 + }, + { + "epoch": 0.03, + "learning_rate": 1.857519788918206e-05, + "loss": 0.454, + "step": 352 + }, + { + "epoch": 0.03, + "learning_rate": 1.8627968337730872e-05, + "loss": 0.4409, + "step": 353 + }, + { + "epoch": 0.03, + "learning_rate": 1.8680738786279685e-05, + "loss": 0.4219, + "step": 354 + }, + { + "epoch": 0.03, + "learning_rate": 1.8733509234828498e-05, + "loss": 0.5644, + "step": 355 + }, + { + "epoch": 0.03, + "learning_rate": 1.878627968337731e-05, + "loss": 0.5209, + "step": 356 + }, + { + "epoch": 0.03, + "learning_rate": 1.883905013192612e-05, + "loss": 0.5706, + "step": 357 + }, + { + "epoch": 0.03, + "learning_rate": 1.8891820580474937e-05, + "loss": 0.5016, + "step": 358 + }, + { + "epoch": 0.03, + "learning_rate": 1.894459102902375e-05, + "loss": 0.572, + "step": 359 + }, + { + "epoch": 0.03, + "learning_rate": 1.899736147757256e-05, + "loss": 0.6549, + "step": 360 + }, + { + "epoch": 0.03, + "learning_rate": 1.9050131926121373e-05, + "loss": 0.5141, + "step": 361 + }, + { + "epoch": 0.03, + "learning_rate": 1.9102902374670186e-05, + "loss": 0.5997, + "step": 362 + }, + { + "epoch": 0.03, + "learning_rate": 1.9155672823219e-05, + "loss": 0.4522, + "step": 363 + }, + { + "epoch": 0.03, + "learning_rate": 1.9208443271767812e-05, + "loss": 0.433, + "step": 364 + }, + { + "epoch": 0.03, + "learning_rate": 1.9261213720316625e-05, + "loss": 0.449, + "step": 365 + }, + { + "epoch": 0.03, + "learning_rate": 1.9313984168865435e-05, + "loss": 0.4728, + "step": 366 + }, + { + "epoch": 0.03, + "learning_rate": 1.9366754617414248e-05, + "loss": 0.491, + "step": 367 + }, + { + "epoch": 0.03, + "learning_rate": 1.9419525065963065e-05, + "loss": 0.615, + "step": 368 + }, + { + "epoch": 0.03, + "learning_rate": 1.9472295514511874e-05, + "loss": 0.4152, + "step": 369 + }, + { + "epoch": 0.03, + "learning_rate": 1.9525065963060687e-05, + "loss": 0.4383, + "step": 370 + }, + { + "epoch": 0.03, + "learning_rate": 1.95778364116095e-05, + "loss": 0.6447, + "step": 371 + }, + { + "epoch": 0.03, + "learning_rate": 1.9630606860158313e-05, + "loss": 0.3675, + "step": 372 + }, + { + "epoch": 0.03, + "learning_rate": 1.9683377308707127e-05, + "loss": 0.5476, + "step": 373 + }, + { + "epoch": 0.03, + "learning_rate": 1.973614775725594e-05, + "loss": 0.5129, + "step": 374 + }, + { + "epoch": 0.03, + "learning_rate": 1.978891820580475e-05, + "loss": 0.6155, + "step": 375 + }, + { + "epoch": 0.03, + "learning_rate": 1.9841688654353562e-05, + "loss": 0.4281, + "step": 376 + }, + { + "epoch": 0.03, + "learning_rate": 1.9894459102902375e-05, + "loss": 0.3696, + "step": 377 + }, + { + "epoch": 0.03, + "learning_rate": 1.994722955145119e-05, + "loss": 0.6021, + "step": 378 + }, + { + "epoch": 0.03, + "learning_rate": 2e-05, + "loss": 0.5341, + "step": 379 + }, + { + "epoch": 0.03, + "learning_rate": 1.999999967077406e-05, + "loss": 0.5195, + "step": 380 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999998683096255e-05, + "loss": 0.4532, + "step": 381 + }, + { + "epoch": 0.03, + "learning_rate": 1.999999703696666e-05, + "loss": 0.6008, + "step": 382 + }, + { + "epoch": 0.03, + "learning_rate": 1.999999473238537e-05, + "loss": 0.4562, + "step": 383 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999991769352545e-05, + "loss": 0.4995, + "step": 384 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999988147868384e-05, + "loss": 0.4802, + "step": 385 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999983867933114e-05, + "loss": 0.4843, + "step": 386 + }, + { + "epoch": 0.03, + "learning_rate": 1.999997892954703e-05, + "loss": 0.5208, + "step": 387 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999973332710443e-05, + "loss": 0.5132, + "step": 388 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999967077423732e-05, + "loss": 0.5103, + "step": 389 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999960163687307e-05, + "loss": 0.4142, + "step": 390 + }, + { + "epoch": 0.03, + "learning_rate": 1.999995259150162e-05, + "loss": 0.4395, + "step": 391 + }, + { + "epoch": 0.03, + "learning_rate": 1.999994436086717e-05, + "loss": 0.422, + "step": 392 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999935471784508e-05, + "loss": 0.5767, + "step": 393 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999925924254203e-05, + "loss": 0.4099, + "step": 394 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999915718276898e-05, + "loss": 0.5255, + "step": 395 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999904853853256e-05, + "loss": 0.4103, + "step": 396 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999893330983998e-05, + "loss": 0.504, + "step": 397 + }, + { + "epoch": 0.03, + "learning_rate": 1.999988114966988e-05, + "loss": 0.515, + "step": 398 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999868309911704e-05, + "loss": 0.4644, + "step": 399 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999854811710317e-05, + "loss": 0.5344, + "step": 400 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999840655066608e-05, + "loss": 0.5693, + "step": 401 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999825839981506e-05, + "loss": 0.6017, + "step": 402 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999810366455986e-05, + "loss": 0.4403, + "step": 403 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999794234491075e-05, + "loss": 0.618, + "step": 404 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999777444087826e-05, + "loss": 0.445, + "step": 405 + }, + { + "epoch": 0.03, + "learning_rate": 1.999975999524735e-05, + "loss": 0.4812, + "step": 406 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999741887970795e-05, + "loss": 0.4618, + "step": 407 + }, + { + "epoch": 0.03, + "learning_rate": 1.999972312225935e-05, + "loss": 0.529, + "step": 408 + }, + { + "epoch": 0.03, + "learning_rate": 1.999970369811425e-05, + "loss": 0.6059, + "step": 409 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999683615536784e-05, + "loss": 0.3908, + "step": 410 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999662874528264e-05, + "loss": 0.5163, + "step": 411 + }, + { + "epoch": 0.03, + "learning_rate": 1.999964147509006e-05, + "loss": 0.4522, + "step": 412 + }, + { + "epoch": 0.03, + "learning_rate": 1.999961941722358e-05, + "loss": 0.5573, + "step": 413 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999596700930274e-05, + "loss": 0.4013, + "step": 414 + }, + { + "epoch": 0.03, + "learning_rate": 1.999957332621164e-05, + "loss": 0.5783, + "step": 415 + }, + { + "epoch": 0.03, + "learning_rate": 1.999954929306922e-05, + "loss": 0.4962, + "step": 416 + }, + { + "epoch": 0.03, + "learning_rate": 1.999952460150459e-05, + "loss": 0.7153, + "step": 417 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999499251519388e-05, + "loss": 0.5032, + "step": 418 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999473243115268e-05, + "loss": 0.5712, + "step": 419 + }, + { + "epoch": 0.03, + "learning_rate": 1.999944657629395e-05, + "loss": 0.496, + "step": 420 + }, + { + "epoch": 0.03, + "learning_rate": 1.999941925105719e-05, + "loss": 0.4595, + "step": 421 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999391267406786e-05, + "loss": 0.5615, + "step": 422 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999362625344584e-05, + "loss": 0.5056, + "step": 423 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999333324872464e-05, + "loss": 0.525, + "step": 424 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999303365992357e-05, + "loss": 0.6214, + "step": 425 + }, + { + "epoch": 0.03, + "learning_rate": 1.999927274870624e-05, + "loss": 0.4013, + "step": 426 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999241473016126e-05, + "loss": 0.4107, + "step": 427 + }, + { + "epoch": 0.03, + "learning_rate": 1.999920953892407e-05, + "loss": 0.503, + "step": 428 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999176946432183e-05, + "loss": 0.5285, + "step": 429 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999143695542606e-05, + "loss": 0.5122, + "step": 430 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999109786257528e-05, + "loss": 0.5158, + "step": 431 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999075218579184e-05, + "loss": 0.572, + "step": 432 + }, + { + "epoch": 0.03, + "learning_rate": 1.999903999250985e-05, + "loss": 0.2913, + "step": 433 + }, + { + "epoch": 0.03, + "learning_rate": 1.9999004108051846e-05, + "loss": 0.4703, + "step": 434 + }, + { + "epoch": 0.03, + "learning_rate": 1.999896756520753e-05, + "loss": 0.3896, + "step": 435 + }, + { + "epoch": 0.03, + "learning_rate": 1.9998930363979315e-05, + "loss": 0.5339, + "step": 436 + }, + { + "epoch": 0.03, + "learning_rate": 1.999889250436965e-05, + "loss": 0.4875, + "step": 437 + }, + { + "epoch": 0.03, + "learning_rate": 1.9998853986381018e-05, + "loss": 0.5099, + "step": 438 + }, + { + "epoch": 0.03, + "learning_rate": 1.9998814810015968e-05, + "loss": 0.5543, + "step": 439 + }, + { + "epoch": 0.03, + "learning_rate": 1.9998774975277074e-05, + "loss": 0.4946, + "step": 440 + }, + { + "epoch": 0.03, + "learning_rate": 1.9998734482166954e-05, + "loss": 0.3925, + "step": 441 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998693330688283e-05, + "loss": 0.6403, + "step": 442 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998651520843766e-05, + "loss": 0.6341, + "step": 443 + }, + { + "epoch": 0.04, + "learning_rate": 1.999860905263616e-05, + "loss": 0.3712, + "step": 444 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998565926068253e-05, + "loss": 0.5129, + "step": 445 + }, + { + "epoch": 0.04, + "learning_rate": 1.999852214114289e-05, + "loss": 0.3516, + "step": 446 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998477697862956e-05, + "loss": 0.529, + "step": 447 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998432596231373e-05, + "loss": 0.4974, + "step": 448 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998386836251116e-05, + "loss": 0.4338, + "step": 449 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998340417925193e-05, + "loss": 0.4208, + "step": 450 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998293341256664e-05, + "loss": 0.5846, + "step": 451 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998245606248627e-05, + "loss": 0.4732, + "step": 452 + }, + { + "epoch": 0.04, + "learning_rate": 1.999819721290422e-05, + "loss": 0.3971, + "step": 453 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998148161226645e-05, + "loss": 0.3463, + "step": 454 + }, + { + "epoch": 0.04, + "learning_rate": 1.9998098451219115e-05, + "loss": 0.4629, + "step": 455 + }, + { + "epoch": 0.04, + "learning_rate": 1.999804808288491e-05, + "loss": 0.5754, + "step": 456 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997997056227347e-05, + "loss": 0.5664, + "step": 457 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997945371249784e-05, + "loss": 0.5248, + "step": 458 + }, + { + "epoch": 0.04, + "learning_rate": 1.999789302795563e-05, + "loss": 0.4744, + "step": 459 + }, + { + "epoch": 0.04, + "learning_rate": 1.999784002634832e-05, + "loss": 0.5357, + "step": 460 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997786366431354e-05, + "loss": 0.6537, + "step": 461 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997732048208264e-05, + "loss": 0.4527, + "step": 462 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997677071682623e-05, + "loss": 0.4985, + "step": 463 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997621436858053e-05, + "loss": 0.4528, + "step": 464 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997565143738216e-05, + "loss": 0.429, + "step": 465 + }, + { + "epoch": 0.04, + "learning_rate": 1.999750819232682e-05, + "loss": 0.5007, + "step": 466 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997450582627614e-05, + "loss": 0.5214, + "step": 467 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997392314644392e-05, + "loss": 0.3502, + "step": 468 + }, + { + "epoch": 0.04, + "learning_rate": 1.999733338838099e-05, + "loss": 0.3376, + "step": 469 + }, + { + "epoch": 0.04, + "learning_rate": 1.999727380384129e-05, + "loss": 0.5157, + "step": 470 + }, + { + "epoch": 0.04, + "learning_rate": 1.999721356102921e-05, + "loss": 0.4042, + "step": 471 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997152659948727e-05, + "loss": 0.4579, + "step": 472 + }, + { + "epoch": 0.04, + "learning_rate": 1.9997091100603842e-05, + "loss": 0.4241, + "step": 473 + }, + { + "epoch": 0.04, + "learning_rate": 1.999702888299861e-05, + "loss": 0.5036, + "step": 474 + }, + { + "epoch": 0.04, + "learning_rate": 1.9996966007137125e-05, + "loss": 0.5666, + "step": 475 + }, + { + "epoch": 0.04, + "learning_rate": 1.9996902473023537e-05, + "loss": 0.5138, + "step": 476 + }, + { + "epoch": 0.04, + "learning_rate": 1.999683828066202e-05, + "loss": 0.4312, + "step": 477 + }, + { + "epoch": 0.04, + "learning_rate": 1.9996773430056806e-05, + "loss": 0.4961, + "step": 478 + }, + { + "epoch": 0.04, + "learning_rate": 1.999670792121216e-05, + "loss": 0.4047, + "step": 479 + }, + { + "epoch": 0.04, + "learning_rate": 1.99966417541324e-05, + "loss": 0.4161, + "step": 480 + }, + { + "epoch": 0.04, + "learning_rate": 1.9996574928821883e-05, + "loss": 0.5334, + "step": 481 + }, + { + "epoch": 0.04, + "learning_rate": 1.9996507445285003e-05, + "loss": 0.536, + "step": 482 + }, + { + "epoch": 0.04, + "learning_rate": 1.999643930352621e-05, + "loss": 0.4686, + "step": 483 + }, + { + "epoch": 0.04, + "learning_rate": 1.999637050354999e-05, + "loss": 0.4076, + "step": 484 + }, + { + "epoch": 0.04, + "learning_rate": 1.9996301045360874e-05, + "loss": 0.4238, + "step": 485 + }, + { + "epoch": 0.04, + "learning_rate": 1.999623092896343e-05, + "loss": 0.5335, + "step": 486 + }, + { + "epoch": 0.04, + "learning_rate": 1.9996160154362275e-05, + "loss": 0.5755, + "step": 487 + }, + { + "epoch": 0.04, + "learning_rate": 1.9996088721562076e-05, + "loss": 0.5558, + "step": 488 + }, + { + "epoch": 0.04, + "learning_rate": 1.9996016630567535e-05, + "loss": 0.4579, + "step": 489 + }, + { + "epoch": 0.04, + "learning_rate": 1.9995943881383393e-05, + "loss": 0.3542, + "step": 490 + }, + { + "epoch": 0.04, + "learning_rate": 1.9995870474014444e-05, + "loss": 0.5374, + "step": 491 + }, + { + "epoch": 0.04, + "learning_rate": 1.9995796408465523e-05, + "loss": 0.494, + "step": 492 + }, + { + "epoch": 0.04, + "learning_rate": 1.9995721684741505e-05, + "loss": 0.6123, + "step": 493 + }, + { + "epoch": 0.04, + "learning_rate": 1.9995646302847307e-05, + "loss": 0.5978, + "step": 494 + }, + { + "epoch": 0.04, + "learning_rate": 1.9995570262787903e-05, + "loss": 0.4313, + "step": 495 + }, + { + "epoch": 0.04, + "learning_rate": 1.9995493564568286e-05, + "loss": 0.4402, + "step": 496 + }, + { + "epoch": 0.04, + "learning_rate": 1.9995416208193518e-05, + "loss": 0.4768, + "step": 497 + }, + { + "epoch": 0.04, + "learning_rate": 1.999533819366868e-05, + "loss": 0.4544, + "step": 498 + }, + { + "epoch": 0.04, + "learning_rate": 1.9995259520998927e-05, + "loss": 0.4456, + "step": 499 + }, + { + "epoch": 0.04, + "learning_rate": 1.9995180190189424e-05, + "loss": 0.4175, + "step": 500 + }, + { + "epoch": 0.04, + "learning_rate": 1.9995100201245397e-05, + "loss": 0.3899, + "step": 501 + }, + { + "epoch": 0.04, + "learning_rate": 1.999501955417212e-05, + "loss": 0.4562, + "step": 502 + }, + { + "epoch": 0.04, + "learning_rate": 1.999493824897489e-05, + "loss": 0.5242, + "step": 503 + }, + { + "epoch": 0.04, + "learning_rate": 1.9994856285659073e-05, + "loss": 0.5509, + "step": 504 + }, + { + "epoch": 0.04, + "learning_rate": 1.9994773664230064e-05, + "loss": 0.4813, + "step": 505 + }, + { + "epoch": 0.04, + "learning_rate": 1.99946903846933e-05, + "loss": 0.4884, + "step": 506 + }, + { + "epoch": 0.04, + "learning_rate": 1.9994606447054265e-05, + "loss": 0.4809, + "step": 507 + }, + { + "epoch": 0.04, + "learning_rate": 1.999452185131849e-05, + "loss": 0.5702, + "step": 508 + }, + { + "epoch": 0.04, + "learning_rate": 1.9994436597491537e-05, + "loss": 0.4978, + "step": 509 + }, + { + "epoch": 0.04, + "learning_rate": 1.9994350685579024e-05, + "loss": 0.5678, + "step": 510 + }, + { + "epoch": 0.04, + "learning_rate": 1.999426411558661e-05, + "loss": 0.5927, + "step": 511 + }, + { + "epoch": 0.04, + "learning_rate": 1.9994176887519994e-05, + "loss": 0.5643, + "step": 512 + }, + { + "epoch": 0.04, + "learning_rate": 1.9994089001384918e-05, + "loss": 0.4599, + "step": 513 + }, + { + "epoch": 0.04, + "learning_rate": 1.9994000457187167e-05, + "loss": 0.4299, + "step": 514 + }, + { + "epoch": 0.04, + "learning_rate": 1.999391125493258e-05, + "loss": 0.5306, + "step": 515 + }, + { + "epoch": 0.04, + "learning_rate": 1.9993821394627018e-05, + "loss": 0.4771, + "step": 516 + }, + { + "epoch": 0.04, + "learning_rate": 1.9993730876276407e-05, + "loss": 0.5077, + "step": 517 + }, + { + "epoch": 0.04, + "learning_rate": 1.9993639699886707e-05, + "loss": 0.6801, + "step": 518 + }, + { + "epoch": 0.04, + "learning_rate": 1.9993547865463916e-05, + "loss": 0.4089, + "step": 519 + }, + { + "epoch": 0.04, + "learning_rate": 1.9993455373014087e-05, + "loss": 0.5752, + "step": 520 + }, + { + "epoch": 0.04, + "learning_rate": 1.99933622225433e-05, + "loss": 0.4643, + "step": 521 + }, + { + "epoch": 0.04, + "learning_rate": 1.9993268414057704e-05, + "loss": 0.4852, + "step": 522 + }, + { + "epoch": 0.04, + "learning_rate": 1.9993173947563466e-05, + "loss": 0.451, + "step": 523 + }, + { + "epoch": 0.04, + "learning_rate": 1.9993078823066804e-05, + "loss": 0.608, + "step": 524 + }, + { + "epoch": 0.04, + "learning_rate": 1.9992983040573986e-05, + "loss": 0.4712, + "step": 525 + }, + { + "epoch": 0.04, + "learning_rate": 1.9992886600091318e-05, + "loss": 0.4318, + "step": 526 + }, + { + "epoch": 0.04, + "learning_rate": 1.9992789501625155e-05, + "loss": 0.5379, + "step": 527 + }, + { + "epoch": 0.04, + "learning_rate": 1.9992691745181882e-05, + "loss": 0.6214, + "step": 528 + }, + { + "epoch": 0.04, + "learning_rate": 1.9992593330767938e-05, + "loss": 0.4474, + "step": 529 + }, + { + "epoch": 0.04, + "learning_rate": 1.9992494258389805e-05, + "loss": 0.4164, + "step": 530 + }, + { + "epoch": 0.04, + "learning_rate": 1.9992394528054006e-05, + "loss": 0.512, + "step": 531 + }, + { + "epoch": 0.04, + "learning_rate": 1.9992294139767106e-05, + "loss": 0.311, + "step": 532 + }, + { + "epoch": 0.04, + "learning_rate": 1.999219309353572e-05, + "loss": 0.4489, + "step": 533 + }, + { + "epoch": 0.04, + "learning_rate": 1.9992091389366497e-05, + "loss": 0.4864, + "step": 534 + }, + { + "epoch": 0.04, + "learning_rate": 1.9991989027266134e-05, + "loss": 0.6167, + "step": 535 + }, + { + "epoch": 0.04, + "learning_rate": 1.9991886007241375e-05, + "loss": 0.5642, + "step": 536 + }, + { + "epoch": 0.04, + "learning_rate": 1.9991782329298998e-05, + "loss": 0.4561, + "step": 537 + }, + { + "epoch": 0.04, + "learning_rate": 1.9991677993445832e-05, + "loss": 0.5195, + "step": 538 + }, + { + "epoch": 0.04, + "learning_rate": 1.9991572999688746e-05, + "loss": 0.5036, + "step": 539 + }, + { + "epoch": 0.04, + "learning_rate": 1.9991467348034653e-05, + "loss": 0.5629, + "step": 540 + }, + { + "epoch": 0.04, + "learning_rate": 1.9991361038490515e-05, + "loss": 0.4879, + "step": 541 + }, + { + "epoch": 0.04, + "learning_rate": 1.9991254071063327e-05, + "loss": 0.494, + "step": 542 + }, + { + "epoch": 0.04, + "learning_rate": 1.9991146445760133e-05, + "loss": 0.5324, + "step": 543 + }, + { + "epoch": 0.04, + "learning_rate": 1.9991038162588018e-05, + "loss": 0.5021, + "step": 544 + }, + { + "epoch": 0.04, + "learning_rate": 1.9990929221554117e-05, + "loss": 0.3755, + "step": 545 + }, + { + "epoch": 0.04, + "learning_rate": 1.99908196226656e-05, + "loss": 0.449, + "step": 546 + }, + { + "epoch": 0.04, + "learning_rate": 1.9990709365929678e-05, + "loss": 0.4233, + "step": 547 + }, + { + "epoch": 0.04, + "learning_rate": 1.999059845135362e-05, + "loss": 0.5311, + "step": 548 + }, + { + "epoch": 0.04, + "learning_rate": 1.9990486878944727e-05, + "loss": 0.5448, + "step": 549 + }, + { + "epoch": 0.04, + "learning_rate": 1.9990374648710343e-05, + "loss": 0.46, + "step": 550 + }, + { + "epoch": 0.04, + "learning_rate": 1.9990261760657858e-05, + "loss": 0.4995, + "step": 551 + }, + { + "epoch": 0.04, + "learning_rate": 1.9990148214794713e-05, + "loss": 0.3974, + "step": 552 + }, + { + "epoch": 0.04, + "learning_rate": 1.999003401112837e-05, + "loss": 0.395, + "step": 553 + }, + { + "epoch": 0.04, + "learning_rate": 1.9989919149666356e-05, + "loss": 0.5115, + "step": 554 + }, + { + "epoch": 0.04, + "learning_rate": 1.998980363041624e-05, + "loss": 0.5043, + "step": 555 + }, + { + "epoch": 0.04, + "learning_rate": 1.9989687453385617e-05, + "loss": 0.547, + "step": 556 + }, + { + "epoch": 0.04, + "learning_rate": 1.9989570618582145e-05, + "loss": 0.4002, + "step": 557 + }, + { + "epoch": 0.04, + "learning_rate": 1.9989453126013515e-05, + "loss": 0.473, + "step": 558 + }, + { + "epoch": 0.04, + "learning_rate": 1.9989334975687462e-05, + "loss": 0.4813, + "step": 559 + }, + { + "epoch": 0.04, + "learning_rate": 1.9989216167611766e-05, + "loss": 0.4079, + "step": 560 + }, + { + "epoch": 0.04, + "learning_rate": 1.998909670179425e-05, + "loss": 0.6068, + "step": 561 + }, + { + "epoch": 0.04, + "learning_rate": 1.9988976578242785e-05, + "loss": 0.3321, + "step": 562 + }, + { + "epoch": 0.04, + "learning_rate": 1.9988855796965275e-05, + "loss": 0.3962, + "step": 563 + }, + { + "epoch": 0.04, + "learning_rate": 1.998873435796967e-05, + "loss": 0.5048, + "step": 564 + }, + { + "epoch": 0.04, + "learning_rate": 1.9988612261263972e-05, + "loss": 0.5398, + "step": 565 + }, + { + "epoch": 0.04, + "learning_rate": 1.9988489506856218e-05, + "loss": 0.447, + "step": 566 + }, + { + "epoch": 0.04, + "learning_rate": 1.9988366094754493e-05, + "loss": 0.379, + "step": 567 + }, + { + "epoch": 0.04, + "learning_rate": 1.9988242024966924e-05, + "loss": 0.4556, + "step": 568 + }, + { + "epoch": 0.05, + "learning_rate": 1.9988117297501674e-05, + "loss": 0.3105, + "step": 569 + }, + { + "epoch": 0.05, + "learning_rate": 1.998799191236696e-05, + "loss": 0.3668, + "step": 570 + }, + { + "epoch": 0.05, + "learning_rate": 1.998786586957104e-05, + "loss": 0.4916, + "step": 571 + }, + { + "epoch": 0.05, + "learning_rate": 1.998773916912221e-05, + "loss": 0.308, + "step": 572 + }, + { + "epoch": 0.05, + "learning_rate": 1.9987611811028814e-05, + "loss": 0.5247, + "step": 573 + }, + { + "epoch": 0.05, + "learning_rate": 1.9987483795299236e-05, + "loss": 0.5485, + "step": 574 + }, + { + "epoch": 0.05, + "learning_rate": 1.9987355121941907e-05, + "loss": 0.4966, + "step": 575 + }, + { + "epoch": 0.05, + "learning_rate": 1.99872257909653e-05, + "loss": 0.4872, + "step": 576 + }, + { + "epoch": 0.05, + "learning_rate": 1.9987095802377933e-05, + "loss": 0.5025, + "step": 577 + }, + { + "epoch": 0.05, + "learning_rate": 1.9986965156188357e-05, + "loss": 0.5714, + "step": 578 + }, + { + "epoch": 0.05, + "learning_rate": 1.9986833852405183e-05, + "loss": 0.5208, + "step": 579 + }, + { + "epoch": 0.05, + "learning_rate": 1.9986701891037053e-05, + "loss": 0.4676, + "step": 580 + }, + { + "epoch": 0.05, + "learning_rate": 1.9986569272092656e-05, + "loss": 0.5299, + "step": 581 + }, + { + "epoch": 0.05, + "learning_rate": 1.9986435995580725e-05, + "loss": 0.6287, + "step": 582 + }, + { + "epoch": 0.05, + "learning_rate": 1.9986302061510036e-05, + "loss": 0.6313, + "step": 583 + }, + { + "epoch": 0.05, + "learning_rate": 1.9986167469889405e-05, + "loss": 0.4931, + "step": 584 + }, + { + "epoch": 0.05, + "learning_rate": 1.9986032220727698e-05, + "loss": 0.416, + "step": 585 + }, + { + "epoch": 0.05, + "learning_rate": 1.9985896314033816e-05, + "loss": 0.4872, + "step": 586 + }, + { + "epoch": 0.05, + "learning_rate": 1.9985759749816715e-05, + "loss": 0.4544, + "step": 587 + }, + { + "epoch": 0.05, + "learning_rate": 1.9985622528085382e-05, + "loss": 0.6076, + "step": 588 + }, + { + "epoch": 0.05, + "learning_rate": 1.9985484648848854e-05, + "loss": 0.5247, + "step": 589 + }, + { + "epoch": 0.05, + "learning_rate": 1.9985346112116207e-05, + "loss": 0.4338, + "step": 590 + }, + { + "epoch": 0.05, + "learning_rate": 1.9985206917896563e-05, + "loss": 0.5009, + "step": 591 + }, + { + "epoch": 0.05, + "learning_rate": 1.9985067066199093e-05, + "loss": 0.5561, + "step": 592 + }, + { + "epoch": 0.05, + "learning_rate": 1.9984926557033003e-05, + "loss": 0.4053, + "step": 593 + }, + { + "epoch": 0.05, + "learning_rate": 1.998478539040754e-05, + "loss": 0.4668, + "step": 594 + }, + { + "epoch": 0.05, + "learning_rate": 1.9984643566332005e-05, + "loss": 0.4908, + "step": 595 + }, + { + "epoch": 0.05, + "learning_rate": 1.9984501084815734e-05, + "loss": 0.504, + "step": 596 + }, + { + "epoch": 0.05, + "learning_rate": 1.9984357945868106e-05, + "loss": 0.4605, + "step": 597 + }, + { + "epoch": 0.05, + "learning_rate": 1.998421414949855e-05, + "loss": 0.5766, + "step": 598 + }, + { + "epoch": 0.05, + "learning_rate": 1.9984069695716534e-05, + "loss": 0.5155, + "step": 599 + }, + { + "epoch": 0.05, + "learning_rate": 1.998392458453157e-05, + "loss": 0.5261, + "step": 600 + }, + { + "epoch": 0.05, + "learning_rate": 1.998377881595321e-05, + "loss": 0.5779, + "step": 601 + }, + { + "epoch": 0.05, + "learning_rate": 1.9983632389991056e-05, + "loss": 0.4822, + "step": 602 + }, + { + "epoch": 0.05, + "learning_rate": 1.9983485306654745e-05, + "loss": 0.4828, + "step": 603 + }, + { + "epoch": 0.05, + "learning_rate": 1.9983337565953968e-05, + "loss": 0.4474, + "step": 604 + }, + { + "epoch": 0.05, + "learning_rate": 1.9983189167898446e-05, + "loss": 0.4979, + "step": 605 + }, + { + "epoch": 0.05, + "learning_rate": 1.998304011249795e-05, + "loss": 0.3698, + "step": 606 + }, + { + "epoch": 0.05, + "learning_rate": 1.9982890399762303e-05, + "loss": 0.4166, + "step": 607 + }, + { + "epoch": 0.05, + "learning_rate": 1.9982740029701356e-05, + "loss": 0.4733, + "step": 608 + }, + { + "epoch": 0.05, + "learning_rate": 1.998258900232501e-05, + "loss": 0.3716, + "step": 609 + }, + { + "epoch": 0.05, + "learning_rate": 1.9982437317643218e-05, + "loss": 0.4844, + "step": 610 + }, + { + "epoch": 0.05, + "learning_rate": 1.9982284975665952e-05, + "loss": 0.3469, + "step": 611 + }, + { + "epoch": 0.05, + "learning_rate": 1.998213197640326e-05, + "loss": 0.6033, + "step": 612 + }, + { + "epoch": 0.05, + "learning_rate": 1.9981978319865204e-05, + "loss": 0.3872, + "step": 613 + }, + { + "epoch": 0.05, + "learning_rate": 1.9981824006061904e-05, + "loss": 0.3864, + "step": 614 + }, + { + "epoch": 0.05, + "learning_rate": 1.998166903500353e-05, + "loss": 0.4836, + "step": 615 + }, + { + "epoch": 0.05, + "learning_rate": 1.998151340670027e-05, + "loss": 0.4202, + "step": 616 + }, + { + "epoch": 0.05, + "learning_rate": 1.9981357121162385e-05, + "loss": 0.4131, + "step": 617 + }, + { + "epoch": 0.05, + "learning_rate": 1.998120017840016e-05, + "loss": 0.4096, + "step": 618 + }, + { + "epoch": 0.05, + "learning_rate": 1.998104257842393e-05, + "loss": 0.4204, + "step": 619 + }, + { + "epoch": 0.05, + "learning_rate": 1.9980884321244072e-05, + "loss": 0.4956, + "step": 620 + }, + { + "epoch": 0.05, + "learning_rate": 1.9980725406871007e-05, + "loss": 0.55, + "step": 621 + }, + { + "epoch": 0.05, + "learning_rate": 1.9980565835315196e-05, + "loss": 0.5158, + "step": 622 + }, + { + "epoch": 0.05, + "learning_rate": 1.9980405606587148e-05, + "loss": 0.432, + "step": 623 + }, + { + "epoch": 0.05, + "learning_rate": 1.9980244720697417e-05, + "loss": 0.5646, + "step": 624 + }, + { + "epoch": 0.05, + "learning_rate": 1.9980083177656588e-05, + "loss": 0.4702, + "step": 625 + }, + { + "epoch": 0.05, + "learning_rate": 1.9979920977475306e-05, + "loss": 0.5031, + "step": 626 + }, + { + "epoch": 0.05, + "learning_rate": 1.9979758120164248e-05, + "loss": 0.4419, + "step": 627 + }, + { + "epoch": 0.05, + "learning_rate": 1.997959460573414e-05, + "loss": 0.4072, + "step": 628 + }, + { + "epoch": 0.05, + "learning_rate": 1.9979430434195742e-05, + "loss": 0.3695, + "step": 629 + }, + { + "epoch": 0.05, + "learning_rate": 1.9979265605559868e-05, + "loss": 0.4272, + "step": 630 + }, + { + "epoch": 0.05, + "learning_rate": 1.997910011983737e-05, + "loss": 0.4969, + "step": 631 + }, + { + "epoch": 0.05, + "learning_rate": 1.997893397703915e-05, + "loss": 0.6968, + "step": 632 + }, + { + "epoch": 0.05, + "learning_rate": 1.997876717717614e-05, + "loss": 0.4055, + "step": 633 + }, + { + "epoch": 0.05, + "learning_rate": 1.9978599720259325e-05, + "loss": 0.5105, + "step": 634 + }, + { + "epoch": 0.05, + "learning_rate": 1.9978431606299736e-05, + "loss": 0.4004, + "step": 635 + }, + { + "epoch": 0.05, + "learning_rate": 1.9978262835308437e-05, + "loss": 0.4802, + "step": 636 + }, + { + "epoch": 0.05, + "learning_rate": 1.997809340729654e-05, + "loss": 0.4204, + "step": 637 + }, + { + "epoch": 0.05, + "learning_rate": 1.9977923322275206e-05, + "loss": 0.5359, + "step": 638 + }, + { + "epoch": 0.05, + "learning_rate": 1.997775258025563e-05, + "loss": 0.5854, + "step": 639 + }, + { + "epoch": 0.05, + "learning_rate": 1.997758118124906e-05, + "loss": 0.481, + "step": 640 + }, + { + "epoch": 0.05, + "learning_rate": 1.997740912526678e-05, + "loss": 0.5076, + "step": 641 + }, + { + "epoch": 0.05, + "learning_rate": 1.9977236412320112e-05, + "loss": 0.4504, + "step": 642 + }, + { + "epoch": 0.05, + "learning_rate": 1.9977063042420438e-05, + "loss": 0.5143, + "step": 643 + }, + { + "epoch": 0.05, + "learning_rate": 1.9976889015579167e-05, + "loss": 0.5724, + "step": 644 + }, + { + "epoch": 0.05, + "learning_rate": 1.997671433180776e-05, + "loss": 0.4705, + "step": 645 + }, + { + "epoch": 0.05, + "learning_rate": 1.997653899111772e-05, + "loss": 0.4841, + "step": 646 + }, + { + "epoch": 0.05, + "learning_rate": 1.9976362993520587e-05, + "loss": 0.4405, + "step": 647 + }, + { + "epoch": 0.05, + "learning_rate": 1.9976186339027958e-05, + "loss": 0.3988, + "step": 648 + }, + { + "epoch": 0.05, + "learning_rate": 1.9976009027651463e-05, + "loss": 0.4487, + "step": 649 + }, + { + "epoch": 0.05, + "learning_rate": 1.9975831059402774e-05, + "loss": 0.5622, + "step": 650 + }, + { + "epoch": 0.05, + "learning_rate": 1.9975652434293607e-05, + "loss": 0.3798, + "step": 651 + }, + { + "epoch": 0.05, + "learning_rate": 1.9975473152335726e-05, + "loss": 0.3878, + "step": 652 + }, + { + "epoch": 0.05, + "learning_rate": 1.9975293213540942e-05, + "loss": 0.4124, + "step": 653 + }, + { + "epoch": 0.05, + "learning_rate": 1.9975112617921097e-05, + "loss": 0.3936, + "step": 654 + }, + { + "epoch": 0.05, + "learning_rate": 1.997493136548808e-05, + "loss": 0.5737, + "step": 655 + }, + { + "epoch": 0.05, + "learning_rate": 1.9974749456253834e-05, + "loss": 0.3689, + "step": 656 + }, + { + "epoch": 0.05, + "learning_rate": 1.9974566890230327e-05, + "loss": 0.4765, + "step": 657 + }, + { + "epoch": 0.05, + "learning_rate": 1.9974383667429585e-05, + "loss": 0.3786, + "step": 658 + }, + { + "epoch": 0.05, + "learning_rate": 1.9974199787863674e-05, + "loss": 0.6221, + "step": 659 + }, + { + "epoch": 0.05, + "learning_rate": 1.99740152515447e-05, + "loss": 0.454, + "step": 660 + }, + { + "epoch": 0.05, + "learning_rate": 1.9973830058484813e-05, + "loss": 0.4619, + "step": 661 + }, + { + "epoch": 0.05, + "learning_rate": 1.9973644208696208e-05, + "loss": 0.5049, + "step": 662 + }, + { + "epoch": 0.05, + "learning_rate": 1.9973457702191123e-05, + "loss": 0.4212, + "step": 663 + }, + { + "epoch": 0.05, + "learning_rate": 1.9973270538981835e-05, + "loss": 0.4382, + "step": 664 + }, + { + "epoch": 0.05, + "learning_rate": 1.9973082719080673e-05, + "loss": 0.5352, + "step": 665 + }, + { + "epoch": 0.05, + "learning_rate": 1.9972894242499997e-05, + "loss": 0.5085, + "step": 666 + }, + { + "epoch": 0.05, + "learning_rate": 1.9972705109252227e-05, + "loss": 0.3178, + "step": 667 + }, + { + "epoch": 0.05, + "learning_rate": 1.997251531934981e-05, + "loss": 0.5467, + "step": 668 + }, + { + "epoch": 0.05, + "learning_rate": 1.997232487280524e-05, + "loss": 0.5246, + "step": 669 + }, + { + "epoch": 0.05, + "learning_rate": 1.9972133769631065e-05, + "loss": 0.4012, + "step": 670 + }, + { + "epoch": 0.05, + "learning_rate": 1.9971942009839862e-05, + "loss": 0.423, + "step": 671 + }, + { + "epoch": 0.05, + "learning_rate": 1.997174959344426e-05, + "loss": 0.3705, + "step": 672 + }, + { + "epoch": 0.05, + "learning_rate": 1.9971556520456928e-05, + "loss": 0.6327, + "step": 673 + }, + { + "epoch": 0.05, + "learning_rate": 1.997136279089058e-05, + "loss": 0.3956, + "step": 674 + }, + { + "epoch": 0.05, + "learning_rate": 1.9971168404757972e-05, + "loss": 0.4084, + "step": 675 + }, + { + "epoch": 0.05, + "learning_rate": 1.99709733620719e-05, + "loss": 0.4758, + "step": 676 + }, + { + "epoch": 0.05, + "learning_rate": 1.9970777662845212e-05, + "loss": 0.4907, + "step": 677 + }, + { + "epoch": 0.05, + "learning_rate": 1.997058130709079e-05, + "loss": 0.515, + "step": 678 + }, + { + "epoch": 0.05, + "learning_rate": 1.9970384294821565e-05, + "loss": 0.493, + "step": 679 + }, + { + "epoch": 0.05, + "learning_rate": 1.9970186626050507e-05, + "loss": 0.369, + "step": 680 + }, + { + "epoch": 0.05, + "learning_rate": 1.9969988300790636e-05, + "loss": 0.4666, + "step": 681 + }, + { + "epoch": 0.05, + "learning_rate": 1.9969789319055007e-05, + "loss": 0.4806, + "step": 682 + }, + { + "epoch": 0.05, + "learning_rate": 1.996958968085672e-05, + "loss": 0.5597, + "step": 683 + }, + { + "epoch": 0.05, + "learning_rate": 1.9969389386208927e-05, + "loss": 0.4286, + "step": 684 + }, + { + "epoch": 0.05, + "learning_rate": 1.9969188435124812e-05, + "loss": 0.4617, + "step": 685 + }, + { + "epoch": 0.05, + "learning_rate": 1.9968986827617603e-05, + "loss": 0.4569, + "step": 686 + }, + { + "epoch": 0.05, + "learning_rate": 1.9968784563700586e-05, + "loss": 0.4828, + "step": 687 + }, + { + "epoch": 0.05, + "learning_rate": 1.9968581643387065e-05, + "loss": 0.4478, + "step": 688 + }, + { + "epoch": 0.05, + "learning_rate": 1.9968378066690414e-05, + "loss": 0.4852, + "step": 689 + }, + { + "epoch": 0.05, + "learning_rate": 1.996817383362403e-05, + "loss": 0.3969, + "step": 690 + }, + { + "epoch": 0.05, + "learning_rate": 1.996796894420136e-05, + "loss": 0.5431, + "step": 691 + }, + { + "epoch": 0.05, + "learning_rate": 1.9967763398435904e-05, + "loss": 0.3908, + "step": 692 + }, + { + "epoch": 0.05, + "learning_rate": 1.9967557196341184e-05, + "loss": 0.4358, + "step": 693 + }, + { + "epoch": 0.05, + "learning_rate": 1.996735033793079e-05, + "loss": 0.4629, + "step": 694 + }, + { + "epoch": 0.06, + "learning_rate": 1.996714282321833e-05, + "loss": 0.3689, + "step": 695 + }, + { + "epoch": 0.06, + "learning_rate": 1.9966934652217477e-05, + "loss": 0.3757, + "step": 696 + }, + { + "epoch": 0.06, + "learning_rate": 1.9966725824941933e-05, + "loss": 0.4014, + "step": 697 + }, + { + "epoch": 0.06, + "learning_rate": 1.9966516341405452e-05, + "loss": 0.4847, + "step": 698 + }, + { + "epoch": 0.06, + "learning_rate": 1.9966306201621826e-05, + "loss": 0.5644, + "step": 699 + }, + { + "epoch": 0.06, + "learning_rate": 1.996609540560489e-05, + "loss": 0.5182, + "step": 700 + }, + { + "epoch": 0.06, + "learning_rate": 1.9965883953368527e-05, + "loss": 0.4789, + "step": 701 + }, + { + "epoch": 0.06, + "learning_rate": 1.9965671844926656e-05, + "loss": 0.3884, + "step": 702 + }, + { + "epoch": 0.06, + "learning_rate": 1.9965459080293247e-05, + "loss": 0.4879, + "step": 703 + }, + { + "epoch": 0.06, + "learning_rate": 1.9965245659482312e-05, + "loss": 0.4092, + "step": 704 + }, + { + "epoch": 0.06, + "learning_rate": 1.9965031582507896e-05, + "loss": 0.4769, + "step": 705 + }, + { + "epoch": 0.06, + "learning_rate": 1.99648168493841e-05, + "loss": 0.4722, + "step": 706 + }, + { + "epoch": 0.06, + "learning_rate": 1.996460146012506e-05, + "loss": 0.6584, + "step": 707 + }, + { + "epoch": 0.06, + "learning_rate": 1.996438541474496e-05, + "loss": 0.6279, + "step": 708 + }, + { + "epoch": 0.06, + "learning_rate": 1.996416871325803e-05, + "loss": 0.6066, + "step": 709 + }, + { + "epoch": 0.06, + "learning_rate": 1.9963951355678533e-05, + "loss": 0.4614, + "step": 710 + }, + { + "epoch": 0.06, + "learning_rate": 1.996373334202078e-05, + "loss": 0.6362, + "step": 711 + }, + { + "epoch": 0.06, + "learning_rate": 1.9963514672299135e-05, + "loss": 0.3619, + "step": 712 + }, + { + "epoch": 0.06, + "learning_rate": 1.9963295346527984e-05, + "loss": 0.419, + "step": 713 + }, + { + "epoch": 0.06, + "learning_rate": 1.996307536472178e-05, + "loss": 0.4658, + "step": 714 + }, + { + "epoch": 0.06, + "learning_rate": 1.9962854726894997e-05, + "loss": 0.5451, + "step": 715 + }, + { + "epoch": 0.06, + "learning_rate": 1.9962633433062174e-05, + "loss": 0.4012, + "step": 716 + }, + { + "epoch": 0.06, + "learning_rate": 1.996241148323787e-05, + "loss": 0.406, + "step": 717 + }, + { + "epoch": 0.06, + "learning_rate": 1.996218887743671e-05, + "loss": 0.4824, + "step": 718 + }, + { + "epoch": 0.06, + "learning_rate": 1.996196561567335e-05, + "loss": 0.6101, + "step": 719 + }, + { + "epoch": 0.06, + "learning_rate": 1.996174169796248e-05, + "loss": 0.3918, + "step": 720 + }, + { + "epoch": 0.06, + "learning_rate": 1.996151712431886e-05, + "loss": 0.3742, + "step": 721 + }, + { + "epoch": 0.06, + "learning_rate": 1.9961291894757267e-05, + "loss": 0.4048, + "step": 722 + }, + { + "epoch": 0.06, + "learning_rate": 1.9961066009292532e-05, + "loss": 0.4311, + "step": 723 + }, + { + "epoch": 0.06, + "learning_rate": 1.9960839467939534e-05, + "loss": 0.4146, + "step": 724 + }, + { + "epoch": 0.06, + "learning_rate": 1.996061227071318e-05, + "loss": 0.4546, + "step": 725 + }, + { + "epoch": 0.06, + "learning_rate": 1.996038441762844e-05, + "loss": 0.407, + "step": 726 + }, + { + "epoch": 0.06, + "learning_rate": 1.9960155908700306e-05, + "loss": 0.3355, + "step": 727 + }, + { + "epoch": 0.06, + "learning_rate": 1.9959926743943836e-05, + "loss": 0.5938, + "step": 728 + }, + { + "epoch": 0.06, + "learning_rate": 1.9959696923374113e-05, + "loss": 0.3875, + "step": 729 + }, + { + "epoch": 0.06, + "learning_rate": 1.995946644700627e-05, + "loss": 0.2918, + "step": 730 + }, + { + "epoch": 0.06, + "learning_rate": 1.9959235314855485e-05, + "loss": 0.4267, + "step": 731 + }, + { + "epoch": 0.06, + "learning_rate": 1.9959003526936972e-05, + "loss": 0.5619, + "step": 732 + }, + { + "epoch": 0.06, + "learning_rate": 1.9958771083266e-05, + "loss": 0.3437, + "step": 733 + }, + { + "epoch": 0.06, + "learning_rate": 1.995853798385787e-05, + "loss": 0.5347, + "step": 734 + }, + { + "epoch": 0.06, + "learning_rate": 1.9958304228727928e-05, + "loss": 0.4052, + "step": 735 + }, + { + "epoch": 0.06, + "learning_rate": 1.995806981789157e-05, + "loss": 0.3675, + "step": 736 + }, + { + "epoch": 0.06, + "learning_rate": 1.9957834751364232e-05, + "loss": 0.503, + "step": 737 + }, + { + "epoch": 0.06, + "learning_rate": 1.995759902916139e-05, + "loss": 0.4866, + "step": 738 + }, + { + "epoch": 0.06, + "learning_rate": 1.995736265129856e-05, + "loss": 0.3346, + "step": 739 + }, + { + "epoch": 0.06, + "learning_rate": 1.9957125617791314e-05, + "loss": 0.4416, + "step": 740 + }, + { + "epoch": 0.06, + "learning_rate": 1.995688792865526e-05, + "loss": 0.4191, + "step": 741 + }, + { + "epoch": 0.06, + "learning_rate": 1.995664958390604e-05, + "loss": 0.5843, + "step": 742 + }, + { + "epoch": 0.06, + "learning_rate": 1.995641058355936e-05, + "loss": 0.3984, + "step": 743 + }, + { + "epoch": 0.06, + "learning_rate": 1.9956170927630946e-05, + "loss": 0.3649, + "step": 744 + }, + { + "epoch": 0.06, + "learning_rate": 1.9955930616136582e-05, + "loss": 0.411, + "step": 745 + }, + { + "epoch": 0.06, + "learning_rate": 1.995568964909209e-05, + "loss": 0.4808, + "step": 746 + }, + { + "epoch": 0.06, + "learning_rate": 1.995544802651334e-05, + "loss": 0.4679, + "step": 747 + }, + { + "epoch": 0.06, + "learning_rate": 1.995520574841624e-05, + "loss": 0.4748, + "step": 748 + }, + { + "epoch": 0.06, + "learning_rate": 1.9954962814816744e-05, + "loss": 0.445, + "step": 749 + }, + { + "epoch": 0.06, + "learning_rate": 1.9954719225730847e-05, + "loss": 0.422, + "step": 750 + }, + { + "epoch": 0.06, + "learning_rate": 1.995447498117459e-05, + "loss": 0.3799, + "step": 751 + }, + { + "epoch": 0.06, + "learning_rate": 1.9954230081164047e-05, + "loss": 0.4669, + "step": 752 + }, + { + "epoch": 0.06, + "learning_rate": 1.9953984525715354e-05, + "loss": 0.4219, + "step": 753 + }, + { + "epoch": 0.06, + "learning_rate": 1.9953738314844676e-05, + "loss": 0.4049, + "step": 754 + }, + { + "epoch": 0.06, + "learning_rate": 1.9953491448568222e-05, + "loss": 0.5216, + "step": 755 + }, + { + "epoch": 0.06, + "learning_rate": 1.9953243926902254e-05, + "loss": 0.4504, + "step": 756 + }, + { + "epoch": 0.06, + "learning_rate": 1.995299574986306e-05, + "loss": 0.4779, + "step": 757 + }, + { + "epoch": 0.06, + "learning_rate": 1.9952746917466988e-05, + "loss": 0.4131, + "step": 758 + }, + { + "epoch": 0.06, + "learning_rate": 1.9952497429730423e-05, + "loss": 0.453, + "step": 759 + }, + { + "epoch": 0.06, + "learning_rate": 1.9952247286669787e-05, + "loss": 0.4649, + "step": 760 + }, + { + "epoch": 0.06, + "learning_rate": 1.995199648830156e-05, + "loss": 0.4805, + "step": 761 + }, + { + "epoch": 0.06, + "learning_rate": 1.9951745034642245e-05, + "loss": 0.4835, + "step": 762 + }, + { + "epoch": 0.06, + "learning_rate": 1.995149292570841e-05, + "loss": 0.5703, + "step": 763 + }, + { + "epoch": 0.06, + "learning_rate": 1.9951240161516643e-05, + "loss": 0.3692, + "step": 764 + }, + { + "epoch": 0.06, + "learning_rate": 1.9950986742083594e-05, + "loss": 0.7688, + "step": 765 + }, + { + "epoch": 0.06, + "learning_rate": 1.9950732667425953e-05, + "loss": 0.5639, + "step": 766 + }, + { + "epoch": 0.06, + "learning_rate": 1.9950477937560442e-05, + "loss": 0.4514, + "step": 767 + }, + { + "epoch": 0.06, + "learning_rate": 1.995022255250384e-05, + "loss": 0.5004, + "step": 768 + }, + { + "epoch": 0.06, + "learning_rate": 1.9949966512272964e-05, + "loss": 0.4437, + "step": 769 + }, + { + "epoch": 0.06, + "learning_rate": 1.994970981688466e-05, + "loss": 0.5558, + "step": 770 + }, + { + "epoch": 0.06, + "learning_rate": 1.9949452466355847e-05, + "loss": 0.485, + "step": 771 + }, + { + "epoch": 0.06, + "learning_rate": 1.9949194460703462e-05, + "loss": 0.4279, + "step": 772 + }, + { + "epoch": 0.06, + "learning_rate": 1.9948935799944492e-05, + "loss": 0.4137, + "step": 773 + }, + { + "epoch": 0.06, + "learning_rate": 1.994867648409597e-05, + "loss": 0.3936, + "step": 774 + }, + { + "epoch": 0.06, + "learning_rate": 1.9948416513174976e-05, + "loss": 0.4801, + "step": 775 + }, + { + "epoch": 0.06, + "learning_rate": 1.994815588719862e-05, + "loss": 0.5287, + "step": 776 + }, + { + "epoch": 0.06, + "learning_rate": 1.9947894606184065e-05, + "loss": 0.4514, + "step": 777 + }, + { + "epoch": 0.06, + "learning_rate": 1.9947632670148517e-05, + "loss": 0.4955, + "step": 778 + }, + { + "epoch": 0.06, + "learning_rate": 1.9947370079109224e-05, + "loss": 0.556, + "step": 779 + }, + { + "epoch": 0.06, + "learning_rate": 1.9947106833083474e-05, + "loss": 0.4515, + "step": 780 + }, + { + "epoch": 0.06, + "learning_rate": 1.9946842932088603e-05, + "loss": 0.4997, + "step": 781 + }, + { + "epoch": 0.06, + "learning_rate": 1.9946578376141985e-05, + "loss": 0.4379, + "step": 782 + }, + { + "epoch": 0.06, + "learning_rate": 1.9946313165261042e-05, + "loss": 0.3184, + "step": 783 + }, + { + "epoch": 0.06, + "learning_rate": 1.9946047299463234e-05, + "loss": 0.4418, + "step": 784 + }, + { + "epoch": 0.06, + "learning_rate": 1.994578077876607e-05, + "loss": 0.4426, + "step": 785 + }, + { + "epoch": 0.06, + "learning_rate": 1.9945513603187096e-05, + "loss": 0.4197, + "step": 786 + }, + { + "epoch": 0.06, + "learning_rate": 1.994524577274391e-05, + "loss": 0.371, + "step": 787 + }, + { + "epoch": 0.06, + "learning_rate": 1.994497728745414e-05, + "loss": 0.4312, + "step": 788 + }, + { + "epoch": 0.06, + "learning_rate": 1.9944708147335466e-05, + "loss": 0.491, + "step": 789 + }, + { + "epoch": 0.06, + "learning_rate": 1.9944438352405614e-05, + "loss": 0.5961, + "step": 790 + }, + { + "epoch": 0.06, + "learning_rate": 1.9944167902682345e-05, + "loss": 0.4977, + "step": 791 + }, + { + "epoch": 0.06, + "learning_rate": 1.994389679818347e-05, + "loss": 0.4404, + "step": 792 + }, + { + "epoch": 0.06, + "learning_rate": 1.9943625038926834e-05, + "loss": 0.5013, + "step": 793 + }, + { + "epoch": 0.06, + "learning_rate": 1.9943352624930336e-05, + "loss": 0.4016, + "step": 794 + }, + { + "epoch": 0.06, + "learning_rate": 1.9943079556211915e-05, + "loss": 0.4955, + "step": 795 + }, + { + "epoch": 0.06, + "learning_rate": 1.9942805832789548e-05, + "loss": 0.4708, + "step": 796 + }, + { + "epoch": 0.06, + "learning_rate": 1.9942531454681254e-05, + "loss": 0.4092, + "step": 797 + }, + { + "epoch": 0.06, + "learning_rate": 1.994225642190511e-05, + "loss": 0.6157, + "step": 798 + }, + { + "epoch": 0.06, + "learning_rate": 1.9941980734479214e-05, + "loss": 0.4468, + "step": 799 + }, + { + "epoch": 0.06, + "learning_rate": 1.994170439242173e-05, + "loss": 0.4379, + "step": 800 + }, + { + "epoch": 0.06, + "learning_rate": 1.9941427395750844e-05, + "loss": 0.4908, + "step": 801 + }, + { + "epoch": 0.06, + "learning_rate": 1.99411497444848e-05, + "loss": 0.4329, + "step": 802 + }, + { + "epoch": 0.06, + "learning_rate": 1.994087143864188e-05, + "loss": 0.4329, + "step": 803 + }, + { + "epoch": 0.06, + "learning_rate": 1.994059247824041e-05, + "loss": 0.4963, + "step": 804 + }, + { + "epoch": 0.06, + "learning_rate": 1.994031286329875e-05, + "loss": 0.3448, + "step": 805 + }, + { + "epoch": 0.06, + "learning_rate": 1.9940032593835324e-05, + "loss": 0.2984, + "step": 806 + }, + { + "epoch": 0.06, + "learning_rate": 1.993975166986858e-05, + "loss": 0.4799, + "step": 807 + }, + { + "epoch": 0.06, + "learning_rate": 1.9939470091417012e-05, + "loss": 0.3905, + "step": 808 + }, + { + "epoch": 0.06, + "learning_rate": 1.9939187858499166e-05, + "loss": 0.4737, + "step": 809 + }, + { + "epoch": 0.06, + "learning_rate": 1.9938904971133626e-05, + "loss": 0.4197, + "step": 810 + }, + { + "epoch": 0.06, + "learning_rate": 1.9938621429339012e-05, + "loss": 0.4573, + "step": 811 + }, + { + "epoch": 0.06, + "learning_rate": 1.9938337233134e-05, + "loss": 0.3659, + "step": 812 + }, + { + "epoch": 0.06, + "learning_rate": 1.9938052382537304e-05, + "loss": 0.4065, + "step": 813 + }, + { + "epoch": 0.06, + "learning_rate": 1.9937766877567676e-05, + "loss": 0.4472, + "step": 814 + }, + { + "epoch": 0.06, + "learning_rate": 1.9937480718243914e-05, + "loss": 0.5199, + "step": 815 + }, + { + "epoch": 0.06, + "learning_rate": 1.9937193904584865e-05, + "loss": 0.4744, + "step": 816 + }, + { + "epoch": 0.06, + "learning_rate": 1.9936906436609413e-05, + "loss": 0.4348, + "step": 817 + }, + { + "epoch": 0.06, + "learning_rate": 1.9936618314336486e-05, + "loss": 0.5031, + "step": 818 + }, + { + "epoch": 0.06, + "learning_rate": 1.9936329537785054e-05, + "loss": 0.3342, + "step": 819 + }, + { + "epoch": 0.06, + "learning_rate": 1.9936040106974132e-05, + "loss": 0.5404, + "step": 820 + }, + { + "epoch": 0.07, + "learning_rate": 1.9935750021922778e-05, + "loss": 0.5728, + "step": 821 + }, + { + "epoch": 0.07, + "learning_rate": 1.993545928265009e-05, + "loss": 0.4295, + "step": 822 + }, + { + "epoch": 0.07, + "learning_rate": 1.993516788917522e-05, + "loss": 0.5043, + "step": 823 + }, + { + "epoch": 0.07, + "learning_rate": 1.9934875841517346e-05, + "loss": 0.3355, + "step": 824 + }, + { + "epoch": 0.07, + "learning_rate": 1.9934583139695703e-05, + "loss": 0.4884, + "step": 825 + }, + { + "epoch": 0.07, + "learning_rate": 1.9934289783729564e-05, + "loss": 0.517, + "step": 826 + }, + { + "epoch": 0.07, + "learning_rate": 1.993399577363824e-05, + "loss": 0.363, + "step": 827 + }, + { + "epoch": 0.07, + "learning_rate": 1.9933701109441093e-05, + "loss": 0.4575, + "step": 828 + }, + { + "epoch": 0.07, + "learning_rate": 1.993340579115753e-05, + "loss": 0.4805, + "step": 829 + }, + { + "epoch": 0.07, + "learning_rate": 1.993310981880699e-05, + "loss": 0.4646, + "step": 830 + }, + { + "epoch": 0.07, + "learning_rate": 1.9932813192408964e-05, + "loss": 0.4352, + "step": 831 + }, + { + "epoch": 0.07, + "learning_rate": 1.9932515911982983e-05, + "loss": 0.4523, + "step": 832 + }, + { + "epoch": 0.07, + "learning_rate": 1.993221797754862e-05, + "loss": 0.5781, + "step": 833 + }, + { + "epoch": 0.07, + "learning_rate": 1.9931919389125496e-05, + "loss": 0.3761, + "step": 834 + }, + { + "epoch": 0.07, + "learning_rate": 1.9931620146733264e-05, + "loss": 0.5403, + "step": 835 + }, + { + "epoch": 0.07, + "learning_rate": 1.993132025039164e-05, + "loss": 0.4394, + "step": 836 + }, + { + "epoch": 0.07, + "learning_rate": 1.9931019700120363e-05, + "loss": 0.55, + "step": 837 + }, + { + "epoch": 0.07, + "learning_rate": 1.9930718495939222e-05, + "loss": 0.4037, + "step": 838 + }, + { + "epoch": 0.07, + "learning_rate": 1.9930416637868053e-05, + "loss": 0.4212, + "step": 839 + }, + { + "epoch": 0.07, + "learning_rate": 1.993011412592673e-05, + "loss": 0.4537, + "step": 840 + }, + { + "epoch": 0.07, + "learning_rate": 1.992981096013517e-05, + "loss": 0.4889, + "step": 841 + }, + { + "epoch": 0.07, + "learning_rate": 1.9929507140513342e-05, + "loss": 0.478, + "step": 842 + }, + { + "epoch": 0.07, + "learning_rate": 1.9929202667081246e-05, + "loss": 0.447, + "step": 843 + }, + { + "epoch": 0.07, + "learning_rate": 1.9928897539858926e-05, + "loss": 0.4269, + "step": 844 + }, + { + "epoch": 0.07, + "learning_rate": 1.992859175886648e-05, + "loss": 0.4166, + "step": 845 + }, + { + "epoch": 0.07, + "learning_rate": 1.9928285324124038e-05, + "loss": 0.4716, + "step": 846 + }, + { + "epoch": 0.07, + "learning_rate": 1.9927978235651782e-05, + "loss": 0.4598, + "step": 847 + }, + { + "epoch": 0.07, + "learning_rate": 1.992767049346993e-05, + "loss": 0.4479, + "step": 848 + }, + { + "epoch": 0.07, + "learning_rate": 1.9927362097598746e-05, + "loss": 0.3856, + "step": 849 + }, + { + "epoch": 0.07, + "learning_rate": 1.9927053048058534e-05, + "loss": 0.4764, + "step": 850 + }, + { + "epoch": 0.07, + "learning_rate": 1.9926743344869645e-05, + "loss": 0.3989, + "step": 851 + }, + { + "epoch": 0.07, + "learning_rate": 1.992643298805247e-05, + "loss": 0.3926, + "step": 852 + }, + { + "epoch": 0.07, + "learning_rate": 1.9926121977627447e-05, + "loss": 0.4304, + "step": 853 + }, + { + "epoch": 0.07, + "learning_rate": 1.9925810313615052e-05, + "loss": 0.4521, + "step": 854 + }, + { + "epoch": 0.07, + "learning_rate": 1.9925497996035807e-05, + "loss": 0.4067, + "step": 855 + }, + { + "epoch": 0.07, + "learning_rate": 1.992518502491028e-05, + "loss": 0.5512, + "step": 856 + }, + { + "epoch": 0.07, + "learning_rate": 1.9924871400259074e-05, + "loss": 0.5328, + "step": 857 + }, + { + "epoch": 0.07, + "learning_rate": 1.9924557122102843e-05, + "loss": 0.5436, + "step": 858 + }, + { + "epoch": 0.07, + "learning_rate": 1.9924242190462276e-05, + "loss": 0.5301, + "step": 859 + }, + { + "epoch": 0.07, + "learning_rate": 1.992392660535812e-05, + "loss": 0.535, + "step": 860 + }, + { + "epoch": 0.07, + "learning_rate": 1.9923610366811142e-05, + "loss": 0.7168, + "step": 861 + }, + { + "epoch": 0.07, + "learning_rate": 1.9923293474842175e-05, + "loss": 0.5642, + "step": 862 + }, + { + "epoch": 0.07, + "learning_rate": 1.9922975929472076e-05, + "loss": 0.4754, + "step": 863 + }, + { + "epoch": 0.07, + "learning_rate": 1.9922657730721758e-05, + "loss": 0.4715, + "step": 864 + }, + { + "epoch": 0.07, + "learning_rate": 1.9922338878612177e-05, + "loss": 0.5377, + "step": 865 + }, + { + "epoch": 0.07, + "learning_rate": 1.9922019373164324e-05, + "loss": 0.374, + "step": 866 + }, + { + "epoch": 0.07, + "learning_rate": 1.9921699214399238e-05, + "loss": 0.5085, + "step": 867 + }, + { + "epoch": 0.07, + "learning_rate": 1.9921378402337996e-05, + "loss": 0.4323, + "step": 868 + }, + { + "epoch": 0.07, + "learning_rate": 1.9921056937001725e-05, + "loss": 0.505, + "step": 869 + }, + { + "epoch": 0.07, + "learning_rate": 1.9920734818411592e-05, + "loss": 0.4788, + "step": 870 + }, + { + "epoch": 0.07, + "learning_rate": 1.9920412046588807e-05, + "loss": 0.5267, + "step": 871 + }, + { + "epoch": 0.07, + "learning_rate": 1.992008862155462e-05, + "loss": 0.3955, + "step": 872 + }, + { + "epoch": 0.07, + "learning_rate": 1.9919764543330334e-05, + "loss": 0.3927, + "step": 873 + }, + { + "epoch": 0.07, + "learning_rate": 1.9919439811937283e-05, + "loss": 0.5036, + "step": 874 + }, + { + "epoch": 0.07, + "learning_rate": 1.991911442739685e-05, + "loss": 0.566, + "step": 875 + }, + { + "epoch": 0.07, + "learning_rate": 1.9918788389730457e-05, + "loss": 0.3908, + "step": 876 + }, + { + "epoch": 0.07, + "learning_rate": 1.9918461698959576e-05, + "loss": 0.5324, + "step": 877 + }, + { + "epoch": 0.07, + "learning_rate": 1.9918134355105717e-05, + "loss": 0.4176, + "step": 878 + }, + { + "epoch": 0.07, + "learning_rate": 1.9917806358190434e-05, + "loss": 0.3384, + "step": 879 + }, + { + "epoch": 0.07, + "learning_rate": 1.9917477708235324e-05, + "loss": 0.4873, + "step": 880 + }, + { + "epoch": 0.07, + "learning_rate": 1.9917148405262027e-05, + "loss": 0.5392, + "step": 881 + }, + { + "epoch": 0.07, + "learning_rate": 1.9916818449292223e-05, + "loss": 0.4869, + "step": 882 + }, + { + "epoch": 0.07, + "learning_rate": 1.9916487840347644e-05, + "loss": 0.5101, + "step": 883 + }, + { + "epoch": 0.07, + "learning_rate": 1.9916156578450052e-05, + "loss": 0.5067, + "step": 884 + }, + { + "epoch": 0.07, + "learning_rate": 1.9915824663621267e-05, + "loss": 0.4471, + "step": 885 + }, + { + "epoch": 0.07, + "learning_rate": 1.991549209588314e-05, + "loss": 0.3273, + "step": 886 + }, + { + "epoch": 0.07, + "learning_rate": 1.9915158875257566e-05, + "loss": 0.4278, + "step": 887 + }, + { + "epoch": 0.07, + "learning_rate": 1.991482500176649e-05, + "loss": 0.4191, + "step": 888 + }, + { + "epoch": 0.07, + "learning_rate": 1.9914490475431892e-05, + "loss": 0.4937, + "step": 889 + }, + { + "epoch": 0.07, + "learning_rate": 1.9914155296275804e-05, + "loss": 0.4904, + "step": 890 + }, + { + "epoch": 0.07, + "learning_rate": 1.9913819464320295e-05, + "loss": 0.4784, + "step": 891 + }, + { + "epoch": 0.07, + "learning_rate": 1.9913482979587473e-05, + "loss": 0.3482, + "step": 892 + }, + { + "epoch": 0.07, + "learning_rate": 1.9913145842099503e-05, + "loss": 0.5072, + "step": 893 + }, + { + "epoch": 0.07, + "learning_rate": 1.9912808051878575e-05, + "loss": 0.4337, + "step": 894 + }, + { + "epoch": 0.07, + "learning_rate": 1.9912469608946932e-05, + "loss": 0.3934, + "step": 895 + }, + { + "epoch": 0.07, + "learning_rate": 1.9912130513326863e-05, + "loss": 0.4283, + "step": 896 + }, + { + "epoch": 0.07, + "learning_rate": 1.9911790765040697e-05, + "loss": 0.5822, + "step": 897 + }, + { + "epoch": 0.07, + "learning_rate": 1.9911450364110798e-05, + "loss": 0.5106, + "step": 898 + }, + { + "epoch": 0.07, + "learning_rate": 1.9911109310559583e-05, + "loss": 0.3672, + "step": 899 + }, + { + "epoch": 0.07, + "learning_rate": 1.991076760440951e-05, + "loss": 0.4487, + "step": 900 + }, + { + "epoch": 0.07, + "learning_rate": 1.991042524568308e-05, + "loss": 0.5004, + "step": 901 + }, + { + "epoch": 0.07, + "learning_rate": 1.991008223440283e-05, + "loss": 0.5932, + "step": 902 + }, + { + "epoch": 0.07, + "learning_rate": 1.9909738570591352e-05, + "loss": 0.3571, + "step": 903 + }, + { + "epoch": 0.07, + "learning_rate": 1.990939425427127e-05, + "loss": 0.4513, + "step": 904 + }, + { + "epoch": 0.07, + "learning_rate": 1.9909049285465258e-05, + "loss": 0.4776, + "step": 905 + }, + { + "epoch": 0.07, + "learning_rate": 1.990870366419603e-05, + "loss": 0.4842, + "step": 906 + }, + { + "epoch": 0.07, + "learning_rate": 1.9908357390486342e-05, + "loss": 0.4522, + "step": 907 + }, + { + "epoch": 0.07, + "learning_rate": 1.9908010464358997e-05, + "loss": 0.3464, + "step": 908 + }, + { + "epoch": 0.07, + "learning_rate": 1.9907662885836836e-05, + "loss": 0.5185, + "step": 909 + }, + { + "epoch": 0.07, + "learning_rate": 1.9907314654942748e-05, + "loss": 0.3878, + "step": 910 + }, + { + "epoch": 0.07, + "learning_rate": 1.990696577169966e-05, + "loss": 0.5181, + "step": 911 + }, + { + "epoch": 0.07, + "learning_rate": 1.9906616236130543e-05, + "loss": 0.3134, + "step": 912 + }, + { + "epoch": 0.07, + "learning_rate": 1.990626604825842e-05, + "loss": 0.5083, + "step": 913 + }, + { + "epoch": 0.07, + "learning_rate": 1.9905915208106342e-05, + "loss": 0.3633, + "step": 914 + }, + { + "epoch": 0.07, + "learning_rate": 1.990556371569741e-05, + "loss": 0.5387, + "step": 915 + }, + { + "epoch": 0.07, + "learning_rate": 1.990521157105477e-05, + "loss": 0.3559, + "step": 916 + }, + { + "epoch": 0.07, + "learning_rate": 1.990485877420161e-05, + "loss": 0.4421, + "step": 917 + }, + { + "epoch": 0.07, + "learning_rate": 1.990450532516116e-05, + "loss": 0.4673, + "step": 918 + }, + { + "epoch": 0.07, + "learning_rate": 1.9904151223956688e-05, + "loss": 0.511, + "step": 919 + }, + { + "epoch": 0.07, + "learning_rate": 1.9903796470611515e-05, + "loss": 0.3782, + "step": 920 + }, + { + "epoch": 0.07, + "learning_rate": 1.9903441065149e-05, + "loss": 0.5179, + "step": 921 + }, + { + "epoch": 0.07, + "learning_rate": 1.990308500759254e-05, + "loss": 0.5039, + "step": 922 + }, + { + "epoch": 0.07, + "learning_rate": 1.9902728297965586e-05, + "loss": 0.5464, + "step": 923 + }, + { + "epoch": 0.07, + "learning_rate": 1.990237093629162e-05, + "loss": 0.547, + "step": 924 + }, + { + "epoch": 0.07, + "learning_rate": 1.9902012922594178e-05, + "loss": 0.5008, + "step": 925 + }, + { + "epoch": 0.07, + "learning_rate": 1.990165425689683e-05, + "loss": 0.4807, + "step": 926 + }, + { + "epoch": 0.07, + "learning_rate": 1.9901294939223192e-05, + "loss": 0.5374, + "step": 927 + }, + { + "epoch": 0.07, + "learning_rate": 1.9900934969596925e-05, + "loss": 0.4831, + "step": 928 + }, + { + "epoch": 0.07, + "learning_rate": 1.9900574348041728e-05, + "loss": 0.3967, + "step": 929 + }, + { + "epoch": 0.07, + "learning_rate": 1.990021307458135e-05, + "loss": 0.4375, + "step": 930 + }, + { + "epoch": 0.07, + "learning_rate": 1.989985114923958e-05, + "loss": 0.5318, + "step": 931 + }, + { + "epoch": 0.07, + "learning_rate": 1.9899488572040244e-05, + "loss": 0.3767, + "step": 932 + }, + { + "epoch": 0.07, + "learning_rate": 1.989912534300722e-05, + "loss": 0.468, + "step": 933 + }, + { + "epoch": 0.07, + "learning_rate": 1.9898761462164425e-05, + "loss": 0.6273, + "step": 934 + }, + { + "epoch": 0.07, + "learning_rate": 1.989839692953581e-05, + "loss": 0.452, + "step": 935 + }, + { + "epoch": 0.07, + "learning_rate": 1.9898031745145397e-05, + "loss": 0.4089, + "step": 936 + }, + { + "epoch": 0.07, + "learning_rate": 1.989766590901721e-05, + "loss": 0.5847, + "step": 937 + }, + { + "epoch": 0.07, + "learning_rate": 1.9897299421175353e-05, + "loss": 0.5081, + "step": 938 + }, + { + "epoch": 0.07, + "learning_rate": 1.989693228164395e-05, + "loss": 0.5609, + "step": 939 + }, + { + "epoch": 0.07, + "learning_rate": 1.989656449044718e-05, + "loss": 0.4695, + "step": 940 + }, + { + "epoch": 0.07, + "learning_rate": 1.9896196047609255e-05, + "loss": 0.6024, + "step": 941 + }, + { + "epoch": 0.07, + "learning_rate": 1.9895826953154437e-05, + "loss": 0.4075, + "step": 942 + }, + { + "epoch": 0.07, + "learning_rate": 1.9895457207107032e-05, + "loss": 0.4401, + "step": 943 + }, + { + "epoch": 0.07, + "learning_rate": 1.9895086809491384e-05, + "loss": 0.5136, + "step": 944 + }, + { + "epoch": 0.07, + "learning_rate": 1.989471576033188e-05, + "loss": 0.5483, + "step": 945 + }, + { + "epoch": 0.07, + "learning_rate": 1.9894344059652953e-05, + "loss": 0.3195, + "step": 946 + }, + { + "epoch": 0.08, + "learning_rate": 1.989397170747908e-05, + "loss": 0.5379, + "step": 947 + }, + { + "epoch": 0.08, + "learning_rate": 1.9893598703834773e-05, + "loss": 0.479, + "step": 948 + }, + { + "epoch": 0.08, + "learning_rate": 1.98932250487446e-05, + "loss": 0.4554, + "step": 949 + }, + { + "epoch": 0.08, + "learning_rate": 1.989285074223316e-05, + "loss": 0.3892, + "step": 950 + }, + { + "epoch": 0.08, + "learning_rate": 1.98924757843251e-05, + "loss": 0.5258, + "step": 951 + }, + { + "epoch": 0.08, + "learning_rate": 1.989210017504511e-05, + "loss": 0.3411, + "step": 952 + }, + { + "epoch": 0.08, + "learning_rate": 1.989172391441792e-05, + "loss": 0.4077, + "step": 953 + }, + { + "epoch": 0.08, + "learning_rate": 1.9891347002468307e-05, + "loss": 0.4862, + "step": 954 + }, + { + "epoch": 0.08, + "learning_rate": 1.9890969439221086e-05, + "loss": 0.2532, + "step": 955 + }, + { + "epoch": 0.08, + "learning_rate": 1.989059122470112e-05, + "loss": 0.3903, + "step": 956 + }, + { + "epoch": 0.08, + "learning_rate": 1.9890212358933316e-05, + "loss": 0.4934, + "step": 957 + }, + { + "epoch": 0.08, + "learning_rate": 1.9889832841942613e-05, + "loss": 0.4672, + "step": 958 + }, + { + "epoch": 0.08, + "learning_rate": 1.988945267375401e-05, + "loss": 0.51, + "step": 959 + }, + { + "epoch": 0.08, + "learning_rate": 1.9889071854392528e-05, + "loss": 0.3747, + "step": 960 + }, + { + "epoch": 0.08, + "learning_rate": 1.9888690383883247e-05, + "loss": 0.3955, + "step": 961 + }, + { + "epoch": 0.08, + "learning_rate": 1.9888308262251286e-05, + "loss": 0.4242, + "step": 962 + }, + { + "epoch": 0.08, + "learning_rate": 1.988792548952181e-05, + "loss": 0.4078, + "step": 963 + }, + { + "epoch": 0.08, + "learning_rate": 1.9887542065720013e-05, + "loss": 0.4761, + "step": 964 + }, + { + "epoch": 0.08, + "learning_rate": 1.988715799087115e-05, + "loss": 0.4656, + "step": 965 + }, + { + "epoch": 0.08, + "learning_rate": 1.9886773265000502e-05, + "loss": 0.4304, + "step": 966 + }, + { + "epoch": 0.08, + "learning_rate": 1.9886387888133413e-05, + "loss": 0.3639, + "step": 967 + }, + { + "epoch": 0.08, + "learning_rate": 1.988600186029525e-05, + "loss": 0.3599, + "step": 968 + }, + { + "epoch": 0.08, + "learning_rate": 1.988561518151143e-05, + "loss": 0.4618, + "step": 969 + }, + { + "epoch": 0.08, + "learning_rate": 1.988522785180742e-05, + "loss": 0.4133, + "step": 970 + }, + { + "epoch": 0.08, + "learning_rate": 1.9884839871208717e-05, + "loss": 0.477, + "step": 971 + }, + { + "epoch": 0.08, + "learning_rate": 1.9884451239740877e-05, + "loss": 0.4136, + "step": 972 + }, + { + "epoch": 0.08, + "learning_rate": 1.988406195742948e-05, + "loss": 0.4663, + "step": 973 + }, + { + "epoch": 0.08, + "learning_rate": 1.9883672024300163e-05, + "loss": 0.4593, + "step": 974 + }, + { + "epoch": 0.08, + "learning_rate": 1.98832814403786e-05, + "loss": 0.4803, + "step": 975 + }, + { + "epoch": 0.08, + "learning_rate": 1.988289020569051e-05, + "loss": 0.5636, + "step": 976 + }, + { + "epoch": 0.08, + "learning_rate": 1.9882498320261652e-05, + "loss": 0.4854, + "step": 977 + }, + { + "epoch": 0.08, + "learning_rate": 1.9882105784117835e-05, + "loss": 0.4589, + "step": 978 + }, + { + "epoch": 0.08, + "learning_rate": 1.98817125972849e-05, + "loss": 0.5366, + "step": 979 + }, + { + "epoch": 0.08, + "learning_rate": 1.9881318759788738e-05, + "loss": 0.522, + "step": 980 + }, + { + "epoch": 0.08, + "learning_rate": 1.988092427165528e-05, + "loss": 0.439, + "step": 981 + }, + { + "epoch": 0.08, + "learning_rate": 1.98805291329105e-05, + "loss": 0.4767, + "step": 982 + }, + { + "epoch": 0.08, + "learning_rate": 1.9880133343580423e-05, + "loss": 0.4342, + "step": 983 + }, + { + "epoch": 0.08, + "learning_rate": 1.9879736903691107e-05, + "loss": 0.5902, + "step": 984 + }, + { + "epoch": 0.08, + "learning_rate": 1.9879339813268653e-05, + "loss": 0.6177, + "step": 985 + }, + { + "epoch": 0.08, + "learning_rate": 1.9878942072339208e-05, + "loss": 0.3866, + "step": 986 + }, + { + "epoch": 0.08, + "learning_rate": 1.987854368092896e-05, + "loss": 0.5521, + "step": 987 + }, + { + "epoch": 0.08, + "learning_rate": 1.9878144639064145e-05, + "loss": 0.3939, + "step": 988 + }, + { + "epoch": 0.08, + "learning_rate": 1.9877744946771034e-05, + "loss": 0.3063, + "step": 989 + }, + { + "epoch": 0.08, + "learning_rate": 1.987734460407595e-05, + "loss": 0.4149, + "step": 990 + }, + { + "epoch": 0.08, + "learning_rate": 1.9876943611005252e-05, + "loss": 0.4289, + "step": 991 + }, + { + "epoch": 0.08, + "learning_rate": 1.9876541967585337e-05, + "loss": 0.487, + "step": 992 + }, + { + "epoch": 0.08, + "learning_rate": 1.987613967384266e-05, + "loss": 0.3878, + "step": 993 + }, + { + "epoch": 0.08, + "learning_rate": 1.9875736729803705e-05, + "loss": 0.5315, + "step": 994 + }, + { + "epoch": 0.08, + "learning_rate": 1.9875333135495e-05, + "loss": 0.5275, + "step": 995 + }, + { + "epoch": 0.08, + "learning_rate": 1.9874928890943134e-05, + "loss": 0.535, + "step": 996 + }, + { + "epoch": 0.08, + "learning_rate": 1.9874523996174714e-05, + "loss": 0.4141, + "step": 997 + }, + { + "epoch": 0.08, + "learning_rate": 1.98741184512164e-05, + "loss": 0.5013, + "step": 998 + }, + { + "epoch": 0.08, + "learning_rate": 1.9873712256094898e-05, + "loss": 0.5735, + "step": 999 + }, + { + "epoch": 0.08, + "learning_rate": 1.987330541083695e-05, + "loss": 0.4808, + "step": 1000 + }, + { + "epoch": 0.08, + "learning_rate": 1.9872897915469353e-05, + "loss": 0.3514, + "step": 1001 + }, + { + "epoch": 0.08, + "learning_rate": 1.987248977001893e-05, + "loss": 0.3986, + "step": 1002 + }, + { + "epoch": 0.08, + "learning_rate": 1.987208097451256e-05, + "loss": 0.4759, + "step": 1003 + }, + { + "epoch": 0.08, + "learning_rate": 1.987167152897716e-05, + "loss": 0.459, + "step": 1004 + }, + { + "epoch": 0.08, + "learning_rate": 1.987126143343969e-05, + "loss": 0.3672, + "step": 1005 + }, + { + "epoch": 0.08, + "learning_rate": 1.987085068792715e-05, + "loss": 0.4867, + "step": 1006 + }, + { + "epoch": 0.08, + "learning_rate": 1.9870439292466587e-05, + "loss": 0.5051, + "step": 1007 + }, + { + "epoch": 0.08, + "learning_rate": 1.9870027247085093e-05, + "loss": 0.5399, + "step": 1008 + }, + { + "epoch": 0.08, + "learning_rate": 1.9869614551809793e-05, + "loss": 0.4489, + "step": 1009 + }, + { + "epoch": 0.08, + "learning_rate": 1.986920120666787e-05, + "loss": 0.4505, + "step": 1010 + }, + { + "epoch": 0.08, + "learning_rate": 1.986878721168653e-05, + "loss": 0.4669, + "step": 1011 + }, + { + "epoch": 0.08, + "learning_rate": 1.986837256689304e-05, + "loss": 0.4623, + "step": 1012 + }, + { + "epoch": 0.08, + "learning_rate": 1.98679572723147e-05, + "loss": 0.4532, + "step": 1013 + }, + { + "epoch": 0.08, + "learning_rate": 1.9867541327978853e-05, + "loss": 0.5368, + "step": 1014 + }, + { + "epoch": 0.08, + "learning_rate": 1.986712473391289e-05, + "loss": 0.3928, + "step": 1015 + }, + { + "epoch": 0.08, + "learning_rate": 1.986670749014424e-05, + "loss": 0.4643, + "step": 1016 + }, + { + "epoch": 0.08, + "learning_rate": 1.9866289596700383e-05, + "loss": 0.3954, + "step": 1017 + }, + { + "epoch": 0.08, + "learning_rate": 1.9865871053608823e-05, + "loss": 0.4276, + "step": 1018 + }, + { + "epoch": 0.08, + "learning_rate": 1.9865451860897126e-05, + "loss": 0.4448, + "step": 1019 + }, + { + "epoch": 0.08, + "learning_rate": 1.98650320185929e-05, + "loss": 0.4241, + "step": 1020 + }, + { + "epoch": 0.08, + "learning_rate": 1.986461152672378e-05, + "loss": 0.4977, + "step": 1021 + }, + { + "epoch": 0.08, + "learning_rate": 1.986419038531745e-05, + "loss": 0.4437, + "step": 1022 + }, + { + "epoch": 0.08, + "learning_rate": 1.9863768594401654e-05, + "loss": 0.3896, + "step": 1023 + }, + { + "epoch": 0.08, + "learning_rate": 1.9863346154004155e-05, + "loss": 0.4031, + "step": 1024 + }, + { + "epoch": 0.08, + "learning_rate": 1.986292306415277e-05, + "loss": 0.38, + "step": 1025 + }, + { + "epoch": 0.08, + "learning_rate": 1.9862499324875362e-05, + "loss": 0.3601, + "step": 1026 + }, + { + "epoch": 0.08, + "learning_rate": 1.9862074936199827e-05, + "loss": 0.3944, + "step": 1027 + }, + { + "epoch": 0.08, + "learning_rate": 1.9861649898154107e-05, + "loss": 0.4822, + "step": 1028 + }, + { + "epoch": 0.08, + "learning_rate": 1.98612242107662e-05, + "loss": 0.4246, + "step": 1029 + }, + { + "epoch": 0.08, + "learning_rate": 1.9860797874064123e-05, + "loss": 0.3107, + "step": 1030 + }, + { + "epoch": 0.08, + "learning_rate": 1.9860370888075954e-05, + "loss": 0.4464, + "step": 1031 + }, + { + "epoch": 0.08, + "learning_rate": 1.9859943252829804e-05, + "loss": 0.4818, + "step": 1032 + }, + { + "epoch": 0.08, + "learning_rate": 1.9859514968353836e-05, + "loss": 0.5699, + "step": 1033 + }, + { + "epoch": 0.08, + "learning_rate": 1.985908603467625e-05, + "loss": 0.3822, + "step": 1034 + }, + { + "epoch": 0.08, + "learning_rate": 1.985865645182529e-05, + "loss": 0.4071, + "step": 1035 + }, + { + "epoch": 0.08, + "learning_rate": 1.9858226219829234e-05, + "loss": 0.4459, + "step": 1036 + }, + { + "epoch": 0.08, + "learning_rate": 1.985779533871642e-05, + "loss": 0.4498, + "step": 1037 + }, + { + "epoch": 0.08, + "learning_rate": 1.985736380851521e-05, + "loss": 0.4545, + "step": 1038 + }, + { + "epoch": 0.08, + "learning_rate": 1.9856931629254032e-05, + "loss": 0.3547, + "step": 1039 + }, + { + "epoch": 0.08, + "learning_rate": 1.9856498800961328e-05, + "loss": 0.3279, + "step": 1040 + }, + { + "epoch": 0.08, + "learning_rate": 1.9856065323665606e-05, + "loss": 0.4389, + "step": 1041 + }, + { + "epoch": 0.08, + "learning_rate": 1.9855631197395406e-05, + "loss": 0.4721, + "step": 1042 + }, + { + "epoch": 0.08, + "learning_rate": 1.985519642217932e-05, + "loss": 0.4259, + "step": 1043 + }, + { + "epoch": 0.08, + "learning_rate": 1.9854760998045964e-05, + "loss": 0.5126, + "step": 1044 + }, + { + "epoch": 0.08, + "learning_rate": 1.9854324925024017e-05, + "loss": 0.5823, + "step": 1045 + }, + { + "epoch": 0.08, + "learning_rate": 1.9853888203142184e-05, + "loss": 0.4594, + "step": 1046 + }, + { + "epoch": 0.08, + "learning_rate": 1.9853450832429234e-05, + "loss": 0.3902, + "step": 1047 + }, + { + "epoch": 0.08, + "learning_rate": 1.9853012812913956e-05, + "loss": 0.3963, + "step": 1048 + }, + { + "epoch": 0.08, + "learning_rate": 1.9852574144625193e-05, + "loss": 0.4736, + "step": 1049 + }, + { + "epoch": 0.08, + "learning_rate": 1.985213482759183e-05, + "loss": 0.4286, + "step": 1050 + }, + { + "epoch": 0.08, + "learning_rate": 1.9851694861842795e-05, + "loss": 0.6268, + "step": 1051 + }, + { + "epoch": 0.08, + "learning_rate": 1.9851254247407053e-05, + "loss": 0.3583, + "step": 1052 + }, + { + "epoch": 0.08, + "learning_rate": 1.9850812984313626e-05, + "loss": 0.4852, + "step": 1053 + }, + { + "epoch": 0.08, + "learning_rate": 1.985037107259156e-05, + "loss": 0.45, + "step": 1054 + }, + { + "epoch": 0.08, + "learning_rate": 1.984992851226996e-05, + "loss": 0.4733, + "step": 1055 + }, + { + "epoch": 0.08, + "learning_rate": 1.9849485303377955e-05, + "loss": 0.4186, + "step": 1056 + }, + { + "epoch": 0.08, + "learning_rate": 1.984904144594474e-05, + "loss": 0.5814, + "step": 1057 + }, + { + "epoch": 0.08, + "learning_rate": 1.9848596939999534e-05, + "loss": 0.56, + "step": 1058 + }, + { + "epoch": 0.08, + "learning_rate": 1.984815178557161e-05, + "loss": 0.4013, + "step": 1059 + }, + { + "epoch": 0.08, + "learning_rate": 1.9847705982690275e-05, + "loss": 0.4889, + "step": 1060 + }, + { + "epoch": 0.08, + "learning_rate": 1.984725953138489e-05, + "loss": 0.5575, + "step": 1061 + }, + { + "epoch": 0.08, + "learning_rate": 1.9846812431684843e-05, + "loss": 0.388, + "step": 1062 + }, + { + "epoch": 0.08, + "learning_rate": 1.9846364683619575e-05, + "loss": 0.4897, + "step": 1063 + }, + { + "epoch": 0.08, + "learning_rate": 1.9845916287218575e-05, + "loss": 0.4974, + "step": 1064 + }, + { + "epoch": 0.08, + "learning_rate": 1.9845467242511362e-05, + "loss": 0.4499, + "step": 1065 + }, + { + "epoch": 0.08, + "learning_rate": 1.9845017549527502e-05, + "loss": 0.4037, + "step": 1066 + }, + { + "epoch": 0.08, + "learning_rate": 1.984456720829661e-05, + "loss": 0.4255, + "step": 1067 + }, + { + "epoch": 0.08, + "learning_rate": 1.9844116218848335e-05, + "loss": 0.4426, + "step": 1068 + }, + { + "epoch": 0.08, + "learning_rate": 1.9843664581212374e-05, + "loss": 0.388, + "step": 1069 + }, + { + "epoch": 0.08, + "learning_rate": 1.9843212295418464e-05, + "loss": 0.4205, + "step": 1070 + }, + { + "epoch": 0.08, + "learning_rate": 1.984275936149639e-05, + "loss": 0.4468, + "step": 1071 + }, + { + "epoch": 0.08, + "learning_rate": 1.984230577947597e-05, + "loss": 0.4729, + "step": 1072 + }, + { + "epoch": 0.09, + "learning_rate": 1.9841851549387074e-05, + "loss": 0.4749, + "step": 1073 + }, + { + "epoch": 0.09, + "learning_rate": 1.9841396671259606e-05, + "loss": 0.4433, + "step": 1074 + }, + { + "epoch": 0.09, + "learning_rate": 1.9840941145123524e-05, + "loss": 0.4118, + "step": 1075 + }, + { + "epoch": 0.09, + "learning_rate": 1.984048497100882e-05, + "loss": 0.5209, + "step": 1076 + }, + { + "epoch": 0.09, + "learning_rate": 1.9840028148945526e-05, + "loss": 0.4258, + "step": 1077 + }, + { + "epoch": 0.09, + "learning_rate": 1.983957067896373e-05, + "loss": 0.3285, + "step": 1078 + }, + { + "epoch": 0.09, + "learning_rate": 1.9839112561093548e-05, + "loss": 0.3204, + "step": 1079 + }, + { + "epoch": 0.09, + "learning_rate": 1.983865379536515e-05, + "loss": 0.5883, + "step": 1080 + }, + { + "epoch": 0.09, + "learning_rate": 1.9838194381808737e-05, + "loss": 0.5709, + "step": 1081 + }, + { + "epoch": 0.09, + "learning_rate": 1.983773432045456e-05, + "loss": 0.399, + "step": 1082 + }, + { + "epoch": 0.09, + "learning_rate": 1.9837273611332918e-05, + "loss": 0.578, + "step": 1083 + }, + { + "epoch": 0.09, + "learning_rate": 1.983681225447414e-05, + "loss": 0.5967, + "step": 1084 + }, + { + "epoch": 0.09, + "learning_rate": 1.9836350249908606e-05, + "loss": 0.5742, + "step": 1085 + }, + { + "epoch": 0.09, + "learning_rate": 1.983588759766674e-05, + "loss": 0.2579, + "step": 1086 + }, + { + "epoch": 0.09, + "learning_rate": 1.9835424297779002e-05, + "loss": 0.4343, + "step": 1087 + }, + { + "epoch": 0.09, + "learning_rate": 1.98349603502759e-05, + "loss": 0.3416, + "step": 1088 + }, + { + "epoch": 0.09, + "learning_rate": 1.983449575518798e-05, + "loss": 0.3007, + "step": 1089 + }, + { + "epoch": 0.09, + "learning_rate": 1.983403051254584e-05, + "loss": 0.3259, + "step": 1090 + }, + { + "epoch": 0.09, + "learning_rate": 1.9833564622380105e-05, + "loss": 0.4087, + "step": 1091 + }, + { + "epoch": 0.09, + "learning_rate": 1.9833098084721455e-05, + "loss": 0.3859, + "step": 1092 + }, + { + "epoch": 0.09, + "learning_rate": 1.9832630899600607e-05, + "loss": 0.5566, + "step": 1093 + }, + { + "epoch": 0.09, + "learning_rate": 1.9832163067048335e-05, + "loss": 0.4857, + "step": 1094 + }, + { + "epoch": 0.09, + "learning_rate": 1.9831694587095428e-05, + "loss": 0.434, + "step": 1095 + }, + { + "epoch": 0.09, + "learning_rate": 1.983122545977274e-05, + "loss": 0.5178, + "step": 1096 + }, + { + "epoch": 0.09, + "learning_rate": 1.983075568511116e-05, + "loss": 0.4996, + "step": 1097 + }, + { + "epoch": 0.09, + "learning_rate": 1.983028526314162e-05, + "loss": 0.4909, + "step": 1098 + }, + { + "epoch": 0.09, + "learning_rate": 1.98298141938951e-05, + "loss": 0.516, + "step": 1099 + }, + { + "epoch": 0.09, + "learning_rate": 1.982934247740261e-05, + "loss": 0.3652, + "step": 1100 + }, + { + "epoch": 0.09, + "learning_rate": 1.9828870113695217e-05, + "loss": 0.5489, + "step": 1101 + }, + { + "epoch": 0.09, + "learning_rate": 1.9828397102804016e-05, + "loss": 0.3523, + "step": 1102 + }, + { + "epoch": 0.09, + "learning_rate": 1.982792344476016e-05, + "loss": 0.3894, + "step": 1103 + }, + { + "epoch": 0.09, + "learning_rate": 1.982744913959483e-05, + "loss": 0.5416, + "step": 1104 + }, + { + "epoch": 0.09, + "learning_rate": 1.9826974187339267e-05, + "loss": 0.5548, + "step": 1105 + }, + { + "epoch": 0.09, + "learning_rate": 1.9826498588024738e-05, + "loss": 0.3728, + "step": 1106 + }, + { + "epoch": 0.09, + "learning_rate": 1.982602234168255e-05, + "loss": 0.4828, + "step": 1107 + }, + { + "epoch": 0.09, + "learning_rate": 1.9825545448344078e-05, + "loss": 0.4501, + "step": 1108 + }, + { + "epoch": 0.09, + "learning_rate": 1.9825067908040716e-05, + "loss": 0.5197, + "step": 1109 + }, + { + "epoch": 0.09, + "learning_rate": 1.9824589720803906e-05, + "loss": 0.4577, + "step": 1110 + }, + { + "epoch": 0.09, + "learning_rate": 1.9824110886665137e-05, + "loss": 0.4475, + "step": 1111 + }, + { + "epoch": 0.09, + "learning_rate": 1.9823631405655933e-05, + "loss": 0.459, + "step": 1112 + }, + { + "epoch": 0.09, + "learning_rate": 1.9823151277807873e-05, + "loss": 0.3884, + "step": 1113 + }, + { + "epoch": 0.09, + "learning_rate": 1.9822670503152567e-05, + "loss": 0.362, + "step": 1114 + }, + { + "epoch": 0.09, + "learning_rate": 1.982218908172167e-05, + "loss": 0.37, + "step": 1115 + }, + { + "epoch": 0.09, + "learning_rate": 1.9821707013546885e-05, + "loss": 0.6234, + "step": 1116 + }, + { + "epoch": 0.09, + "learning_rate": 1.9821224298659953e-05, + "loss": 0.4824, + "step": 1117 + }, + { + "epoch": 0.09, + "learning_rate": 1.9820740937092656e-05, + "loss": 0.3945, + "step": 1118 + }, + { + "epoch": 0.09, + "learning_rate": 1.982025692887682e-05, + "loss": 0.5784, + "step": 1119 + }, + { + "epoch": 0.09, + "learning_rate": 1.9819772274044323e-05, + "loss": 0.4242, + "step": 1120 + }, + { + "epoch": 0.09, + "learning_rate": 1.9819286972627066e-05, + "loss": 0.3683, + "step": 1121 + }, + { + "epoch": 0.09, + "learning_rate": 1.9818801024657014e-05, + "loss": 0.4464, + "step": 1122 + }, + { + "epoch": 0.09, + "learning_rate": 1.9818314430166158e-05, + "loss": 0.4628, + "step": 1123 + }, + { + "epoch": 0.09, + "learning_rate": 1.981782718918654e-05, + "loss": 0.4451, + "step": 1124 + }, + { + "epoch": 0.09, + "learning_rate": 1.981733930175024e-05, + "loss": 0.4066, + "step": 1125 + }, + { + "epoch": 0.09, + "learning_rate": 1.9816850767889387e-05, + "loss": 0.4074, + "step": 1126 + }, + { + "epoch": 0.09, + "learning_rate": 1.9816361587636143e-05, + "loss": 0.4966, + "step": 1127 + }, + { + "epoch": 0.09, + "learning_rate": 1.9815871761022727e-05, + "loss": 0.5281, + "step": 1128 + }, + { + "epoch": 0.09, + "learning_rate": 1.9815381288081382e-05, + "loss": 0.34, + "step": 1129 + }, + { + "epoch": 0.09, + "learning_rate": 1.9814890168844412e-05, + "loss": 0.4947, + "step": 1130 + }, + { + "epoch": 0.09, + "learning_rate": 1.981439840334415e-05, + "loss": 0.4474, + "step": 1131 + }, + { + "epoch": 0.09, + "learning_rate": 1.9813905991612974e-05, + "loss": 0.5167, + "step": 1132 + }, + { + "epoch": 0.09, + "learning_rate": 1.9813412933683312e-05, + "loss": 0.4204, + "step": 1133 + }, + { + "epoch": 0.09, + "learning_rate": 1.9812919229587626e-05, + "loss": 0.3291, + "step": 1134 + }, + { + "epoch": 0.09, + "learning_rate": 1.9812424879358424e-05, + "loss": 0.4281, + "step": 1135 + }, + { + "epoch": 0.09, + "learning_rate": 1.981192988302826e-05, + "loss": 0.5149, + "step": 1136 + }, + { + "epoch": 0.09, + "learning_rate": 1.981143424062973e-05, + "loss": 0.3662, + "step": 1137 + }, + { + "epoch": 0.09, + "learning_rate": 1.981093795219546e-05, + "loss": 0.537, + "step": 1138 + }, + { + "epoch": 0.09, + "learning_rate": 1.9810441017758132e-05, + "loss": 0.4752, + "step": 1139 + }, + { + "epoch": 0.09, + "learning_rate": 1.980994343735047e-05, + "loss": 0.3718, + "step": 1140 + }, + { + "epoch": 0.09, + "learning_rate": 1.9809445211005235e-05, + "loss": 0.442, + "step": 1141 + }, + { + "epoch": 0.09, + "learning_rate": 1.980894633875523e-05, + "loss": 0.5671, + "step": 1142 + }, + { + "epoch": 0.09, + "learning_rate": 1.980844682063331e-05, + "loss": 0.4499, + "step": 1143 + }, + { + "epoch": 0.09, + "learning_rate": 1.980794665667236e-05, + "loss": 0.4796, + "step": 1144 + }, + { + "epoch": 0.09, + "learning_rate": 1.9807445846905316e-05, + "loss": 0.4985, + "step": 1145 + }, + { + "epoch": 0.09, + "learning_rate": 1.980694439136515e-05, + "loss": 0.4844, + "step": 1146 + }, + { + "epoch": 0.09, + "learning_rate": 1.980644229008489e-05, + "loss": 0.4222, + "step": 1147 + }, + { + "epoch": 0.09, + "learning_rate": 1.9805939543097586e-05, + "loss": 0.5203, + "step": 1148 + }, + { + "epoch": 0.09, + "learning_rate": 1.9805436150436352e-05, + "loss": 0.4981, + "step": 1149 + }, + { + "epoch": 0.09, + "learning_rate": 1.9804932112134323e-05, + "loss": 0.4213, + "step": 1150 + }, + { + "epoch": 0.09, + "learning_rate": 1.9804427428224696e-05, + "loss": 0.4543, + "step": 1151 + }, + { + "epoch": 0.09, + "learning_rate": 1.9803922098740696e-05, + "loss": 0.3829, + "step": 1152 + }, + { + "epoch": 0.09, + "learning_rate": 1.98034161237156e-05, + "loss": 0.4776, + "step": 1153 + }, + { + "epoch": 0.09, + "learning_rate": 1.9802909503182722e-05, + "loss": 0.3998, + "step": 1154 + }, + { + "epoch": 0.09, + "learning_rate": 1.9802402237175426e-05, + "loss": 0.4179, + "step": 1155 + }, + { + "epoch": 0.09, + "learning_rate": 1.9801894325727104e-05, + "loss": 0.3706, + "step": 1156 + }, + { + "epoch": 0.09, + "learning_rate": 1.980138576887121e-05, + "loss": 0.5547, + "step": 1157 + }, + { + "epoch": 0.09, + "learning_rate": 1.980087656664122e-05, + "loss": 0.32, + "step": 1158 + }, + { + "epoch": 0.09, + "learning_rate": 1.9800366719070668e-05, + "loss": 0.4585, + "step": 1159 + }, + { + "epoch": 0.09, + "learning_rate": 1.9799856226193125e-05, + "loss": 0.4255, + "step": 1160 + }, + { + "epoch": 0.09, + "learning_rate": 1.97993450880422e-05, + "loss": 0.4275, + "step": 1161 + }, + { + "epoch": 0.09, + "learning_rate": 1.9798833304651555e-05, + "loss": 0.4841, + "step": 1162 + }, + { + "epoch": 0.09, + "learning_rate": 1.9798320876054882e-05, + "loss": 0.4311, + "step": 1163 + }, + { + "epoch": 0.09, + "learning_rate": 1.9797807802285933e-05, + "loss": 0.468, + "step": 1164 + }, + { + "epoch": 0.09, + "learning_rate": 1.979729408337848e-05, + "loss": 0.3709, + "step": 1165 + }, + { + "epoch": 0.09, + "learning_rate": 1.9796779719366355e-05, + "loss": 0.4043, + "step": 1166 + }, + { + "epoch": 0.09, + "learning_rate": 1.9796264710283425e-05, + "loss": 0.5366, + "step": 1167 + }, + { + "epoch": 0.09, + "learning_rate": 1.9795749056163595e-05, + "loss": 0.4181, + "step": 1168 + }, + { + "epoch": 0.09, + "learning_rate": 1.9795232757040827e-05, + "loss": 0.2701, + "step": 1169 + }, + { + "epoch": 0.09, + "learning_rate": 1.9794715812949117e-05, + "loss": 0.3383, + "step": 1170 + }, + { + "epoch": 0.09, + "learning_rate": 1.9794198223922496e-05, + "loss": 0.4139, + "step": 1171 + }, + { + "epoch": 0.09, + "learning_rate": 1.979367998999505e-05, + "loss": 0.3547, + "step": 1172 + }, + { + "epoch": 0.09, + "learning_rate": 1.97931611112009e-05, + "loss": 0.3509, + "step": 1173 + }, + { + "epoch": 0.09, + "learning_rate": 1.9792641587574212e-05, + "loss": 0.4078, + "step": 1174 + }, + { + "epoch": 0.09, + "learning_rate": 1.9792121419149196e-05, + "loss": 0.4896, + "step": 1175 + }, + { + "epoch": 0.09, + "learning_rate": 1.97916006059601e-05, + "loss": 0.3662, + "step": 1176 + }, + { + "epoch": 0.09, + "learning_rate": 1.979107914804122e-05, + "loss": 0.4445, + "step": 1177 + }, + { + "epoch": 0.09, + "learning_rate": 1.979055704542689e-05, + "loss": 0.5803, + "step": 1178 + }, + { + "epoch": 0.09, + "learning_rate": 1.9790034298151486e-05, + "loss": 0.3698, + "step": 1179 + }, + { + "epoch": 0.09, + "learning_rate": 1.9789510906249432e-05, + "loss": 0.3472, + "step": 1180 + }, + { + "epoch": 0.09, + "learning_rate": 1.9788986869755187e-05, + "loss": 0.5013, + "step": 1181 + }, + { + "epoch": 0.09, + "learning_rate": 1.978846218870326e-05, + "loss": 0.6103, + "step": 1182 + }, + { + "epoch": 0.09, + "learning_rate": 1.9787936863128195e-05, + "loss": 0.3604, + "step": 1183 + }, + { + "epoch": 0.09, + "learning_rate": 1.9787410893064584e-05, + "loss": 0.5179, + "step": 1184 + }, + { + "epoch": 0.09, + "learning_rate": 1.978688427854706e-05, + "loss": 0.4062, + "step": 1185 + }, + { + "epoch": 0.09, + "learning_rate": 1.97863570196103e-05, + "loss": 0.4319, + "step": 1186 + }, + { + "epoch": 0.09, + "learning_rate": 1.9785829116289017e-05, + "loss": 0.4197, + "step": 1187 + }, + { + "epoch": 0.09, + "learning_rate": 1.9785300568617973e-05, + "loss": 0.4089, + "step": 1188 + }, + { + "epoch": 0.09, + "learning_rate": 1.978477137663197e-05, + "loss": 0.4835, + "step": 1189 + }, + { + "epoch": 0.09, + "learning_rate": 1.9784241540365856e-05, + "loss": 0.4701, + "step": 1190 + }, + { + "epoch": 0.09, + "learning_rate": 1.9783711059854514e-05, + "loss": 0.3796, + "step": 1191 + }, + { + "epoch": 0.09, + "learning_rate": 1.9783179935132874e-05, + "loss": 0.4592, + "step": 1192 + }, + { + "epoch": 0.09, + "learning_rate": 1.978264816623591e-05, + "loss": 0.4031, + "step": 1193 + }, + { + "epoch": 0.09, + "learning_rate": 1.9782115753198633e-05, + "loss": 0.496, + "step": 1194 + }, + { + "epoch": 0.09, + "learning_rate": 1.9781582696056105e-05, + "loss": 0.4183, + "step": 1195 + }, + { + "epoch": 0.09, + "learning_rate": 1.9781048994843423e-05, + "loss": 0.5047, + "step": 1196 + }, + { + "epoch": 0.09, + "learning_rate": 1.9780514649595727e-05, + "loss": 0.3336, + "step": 1197 + }, + { + "epoch": 0.09, + "learning_rate": 1.97799796603482e-05, + "loss": 0.5387, + "step": 1198 + }, + { + "epoch": 0.09, + "learning_rate": 1.9779444027136075e-05, + "loss": 0.4606, + "step": 1199 + }, + { + "epoch": 0.1, + "learning_rate": 1.977890774999461e-05, + "loss": 0.4605, + "step": 1200 + }, + { + "epoch": 0.1, + "learning_rate": 1.977837082895913e-05, + "loss": 0.495, + "step": 1201 + }, + { + "epoch": 0.1, + "learning_rate": 1.9777833264064977e-05, + "loss": 0.3635, + "step": 1202 + }, + { + "epoch": 0.1, + "learning_rate": 1.9777295055347553e-05, + "loss": 0.4142, + "step": 1203 + }, + { + "epoch": 0.1, + "learning_rate": 1.9776756202842297e-05, + "loss": 0.3457, + "step": 1204 + }, + { + "epoch": 0.1, + "learning_rate": 1.9776216706584682e-05, + "loss": 0.5133, + "step": 1205 + }, + { + "epoch": 0.1, + "learning_rate": 1.977567656661024e-05, + "loss": 0.4657, + "step": 1206 + }, + { + "epoch": 0.1, + "learning_rate": 1.9775135782954534e-05, + "loss": 0.4199, + "step": 1207 + }, + { + "epoch": 0.1, + "learning_rate": 1.9774594355653175e-05, + "loss": 0.427, + "step": 1208 + }, + { + "epoch": 0.1, + "learning_rate": 1.9774052284741804e-05, + "loss": 0.3908, + "step": 1209 + }, + { + "epoch": 0.1, + "learning_rate": 1.9773509570256124e-05, + "loss": 0.5115, + "step": 1210 + }, + { + "epoch": 0.1, + "learning_rate": 1.9772966212231863e-05, + "loss": 0.59, + "step": 1211 + }, + { + "epoch": 0.1, + "learning_rate": 1.9772422210704803e-05, + "loss": 0.4842, + "step": 1212 + }, + { + "epoch": 0.1, + "learning_rate": 1.977187756571076e-05, + "loss": 0.4459, + "step": 1213 + }, + { + "epoch": 0.1, + "learning_rate": 1.9771332277285603e-05, + "loss": 0.4164, + "step": 1214 + }, + { + "epoch": 0.1, + "learning_rate": 1.977078634546523e-05, + "loss": 0.5567, + "step": 1215 + }, + { + "epoch": 0.1, + "learning_rate": 1.977023977028559e-05, + "loss": 0.4697, + "step": 1216 + }, + { + "epoch": 0.1, + "learning_rate": 1.9769692551782672e-05, + "loss": 0.5447, + "step": 1217 + }, + { + "epoch": 0.1, + "learning_rate": 1.976914468999251e-05, + "loss": 0.3813, + "step": 1218 + }, + { + "epoch": 0.1, + "learning_rate": 1.9768596184951174e-05, + "loss": 0.4155, + "step": 1219 + }, + { + "epoch": 0.1, + "learning_rate": 1.9768047036694785e-05, + "loss": 0.4639, + "step": 1220 + }, + { + "epoch": 0.1, + "learning_rate": 1.9767497245259496e-05, + "loss": 0.3676, + "step": 1221 + }, + { + "epoch": 0.1, + "learning_rate": 1.9766946810681517e-05, + "loss": 0.3927, + "step": 1222 + }, + { + "epoch": 0.1, + "learning_rate": 1.9766395732997082e-05, + "loss": 0.3933, + "step": 1223 + }, + { + "epoch": 0.1, + "learning_rate": 1.9765844012242482e-05, + "loss": 0.4179, + "step": 1224 + }, + { + "epoch": 0.1, + "learning_rate": 1.9765291648454042e-05, + "loss": 0.379, + "step": 1225 + }, + { + "epoch": 0.1, + "learning_rate": 1.9764738641668137e-05, + "loss": 0.4625, + "step": 1226 + }, + { + "epoch": 0.1, + "learning_rate": 1.9764184991921178e-05, + "loss": 0.4501, + "step": 1227 + }, + { + "epoch": 0.1, + "learning_rate": 1.9763630699249615e-05, + "loss": 0.3815, + "step": 1228 + }, + { + "epoch": 0.1, + "learning_rate": 1.9763075763689956e-05, + "loss": 0.4352, + "step": 1229 + }, + { + "epoch": 0.1, + "learning_rate": 1.9762520185278734e-05, + "loss": 0.414, + "step": 1230 + }, + { + "epoch": 0.1, + "learning_rate": 1.9761963964052528e-05, + "loss": 0.4829, + "step": 1231 + }, + { + "epoch": 0.1, + "learning_rate": 1.976140710004797e-05, + "loss": 0.55, + "step": 1232 + }, + { + "epoch": 0.1, + "learning_rate": 1.976084959330172e-05, + "loss": 0.4511, + "step": 1233 + }, + { + "epoch": 0.1, + "learning_rate": 1.9760291443850496e-05, + "loss": 0.4538, + "step": 1234 + }, + { + "epoch": 0.1, + "learning_rate": 1.9759732651731037e-05, + "loss": 0.3933, + "step": 1235 + }, + { + "epoch": 0.1, + "learning_rate": 1.975917321698015e-05, + "loss": 0.4289, + "step": 1236 + }, + { + "epoch": 0.1, + "learning_rate": 1.9758613139634662e-05, + "loss": 0.5142, + "step": 1237 + }, + { + "epoch": 0.1, + "learning_rate": 1.975805241973145e-05, + "loss": 0.5235, + "step": 1238 + }, + { + "epoch": 0.1, + "learning_rate": 1.9757491057307448e-05, + "loss": 0.4736, + "step": 1239 + }, + { + "epoch": 0.1, + "learning_rate": 1.9756929052399606e-05, + "loss": 0.4585, + "step": 1240 + }, + { + "epoch": 0.1, + "learning_rate": 1.9756366405044928e-05, + "loss": 0.4713, + "step": 1241 + }, + { + "epoch": 0.1, + "learning_rate": 1.9755803115280476e-05, + "loss": 0.4261, + "step": 1242 + }, + { + "epoch": 0.1, + "learning_rate": 1.9755239183143323e-05, + "loss": 0.3687, + "step": 1243 + }, + { + "epoch": 0.1, + "learning_rate": 1.9754674608670613e-05, + "loss": 0.508, + "step": 1244 + }, + { + "epoch": 0.1, + "learning_rate": 1.9754109391899514e-05, + "loss": 0.514, + "step": 1245 + }, + { + "epoch": 0.1, + "learning_rate": 1.975354353286725e-05, + "loss": 0.4466, + "step": 1246 + }, + { + "epoch": 0.1, + "learning_rate": 1.9752977031611072e-05, + "loss": 0.4878, + "step": 1247 + }, + { + "epoch": 0.1, + "learning_rate": 1.9752409888168285e-05, + "loss": 0.4143, + "step": 1248 + }, + { + "epoch": 0.1, + "learning_rate": 1.975184210257623e-05, + "loss": 0.4909, + "step": 1249 + }, + { + "epoch": 0.1, + "learning_rate": 1.97512736748723e-05, + "loss": 0.4131, + "step": 1250 + }, + { + "epoch": 0.1, + "learning_rate": 1.975070460509392e-05, + "loss": 0.4785, + "step": 1251 + }, + { + "epoch": 0.1, + "learning_rate": 1.9750134893278553e-05, + "loss": 0.4097, + "step": 1252 + }, + { + "epoch": 0.1, + "learning_rate": 1.974956453946372e-05, + "loss": 0.3688, + "step": 1253 + }, + { + "epoch": 0.1, + "learning_rate": 1.9748993543686973e-05, + "loss": 0.4027, + "step": 1254 + }, + { + "epoch": 0.1, + "learning_rate": 1.9748421905985915e-05, + "loss": 0.5024, + "step": 1255 + }, + { + "epoch": 0.1, + "learning_rate": 1.9747849626398176e-05, + "loss": 0.4286, + "step": 1256 + }, + { + "epoch": 0.1, + "learning_rate": 1.9747276704961447e-05, + "loss": 0.351, + "step": 1257 + }, + { + "epoch": 0.1, + "learning_rate": 1.9746703141713444e-05, + "loss": 0.4535, + "step": 1258 + }, + { + "epoch": 0.1, + "learning_rate": 1.974612893669194e-05, + "loss": 0.4548, + "step": 1259 + }, + { + "epoch": 0.1, + "learning_rate": 1.974555408993474e-05, + "loss": 0.493, + "step": 1260 + }, + { + "epoch": 0.1, + "learning_rate": 1.9744978601479693e-05, + "loss": 0.4557, + "step": 1261 + }, + { + "epoch": 0.1, + "learning_rate": 1.97444024713647e-05, + "loss": 0.497, + "step": 1262 + }, + { + "epoch": 0.1, + "learning_rate": 1.9743825699627687e-05, + "loss": 0.5231, + "step": 1263 + }, + { + "epoch": 0.1, + "learning_rate": 1.974324828630664e-05, + "loss": 0.5269, + "step": 1264 + }, + { + "epoch": 0.1, + "learning_rate": 1.974267023143957e-05, + "loss": 0.4373, + "step": 1265 + }, + { + "epoch": 0.1, + "learning_rate": 1.974209153506455e-05, + "loss": 0.6751, + "step": 1266 + }, + { + "epoch": 0.1, + "learning_rate": 1.9741512197219675e-05, + "loss": 0.4119, + "step": 1267 + }, + { + "epoch": 0.1, + "learning_rate": 1.9740932217943095e-05, + "loss": 0.3822, + "step": 1268 + }, + { + "epoch": 0.1, + "learning_rate": 1.9740351597272998e-05, + "loss": 0.3713, + "step": 1269 + }, + { + "epoch": 0.1, + "learning_rate": 1.9739770335247616e-05, + "loss": 0.5091, + "step": 1270 + }, + { + "epoch": 0.1, + "learning_rate": 1.9739188431905223e-05, + "loss": 0.5587, + "step": 1271 + }, + { + "epoch": 0.1, + "learning_rate": 1.9738605887284134e-05, + "loss": 0.4384, + "step": 1272 + }, + { + "epoch": 0.1, + "learning_rate": 1.9738022701422705e-05, + "loss": 0.5007, + "step": 1273 + }, + { + "epoch": 0.1, + "learning_rate": 1.973743887435934e-05, + "loss": 0.4024, + "step": 1274 + }, + { + "epoch": 0.1, + "learning_rate": 1.9736854406132476e-05, + "loss": 0.3731, + "step": 1275 + }, + { + "epoch": 0.1, + "learning_rate": 1.9736269296780603e-05, + "loss": 0.4056, + "step": 1276 + }, + { + "epoch": 0.1, + "learning_rate": 1.9735683546342243e-05, + "loss": 0.5726, + "step": 1277 + }, + { + "epoch": 0.1, + "learning_rate": 1.9735097154855968e-05, + "loss": 0.4579, + "step": 1278 + }, + { + "epoch": 0.1, + "learning_rate": 1.9734510122360383e-05, + "loss": 0.6147, + "step": 1279 + }, + { + "epoch": 0.1, + "learning_rate": 1.973392244889415e-05, + "loss": 0.4665, + "step": 1280 + }, + { + "epoch": 0.1, + "learning_rate": 1.9733334134495963e-05, + "loss": 0.4923, + "step": 1281 + }, + { + "epoch": 0.1, + "learning_rate": 1.9732745179204553e-05, + "loss": 0.4753, + "step": 1282 + }, + { + "epoch": 0.1, + "learning_rate": 1.9732155583058705e-05, + "loss": 0.5242, + "step": 1283 + }, + { + "epoch": 0.1, + "learning_rate": 1.973156534609724e-05, + "loss": 0.466, + "step": 1284 + }, + { + "epoch": 0.1, + "learning_rate": 1.973097446835902e-05, + "loss": 0.5001, + "step": 1285 + }, + { + "epoch": 0.1, + "learning_rate": 1.9730382949882955e-05, + "loss": 0.3944, + "step": 1286 + }, + { + "epoch": 0.1, + "learning_rate": 1.9729790790707995e-05, + "loss": 0.4907, + "step": 1287 + }, + { + "epoch": 0.1, + "learning_rate": 1.9729197990873127e-05, + "loss": 0.3944, + "step": 1288 + }, + { + "epoch": 0.1, + "learning_rate": 1.9728604550417385e-05, + "loss": 0.4432, + "step": 1289 + }, + { + "epoch": 0.1, + "learning_rate": 1.9728010469379844e-05, + "loss": 0.4358, + "step": 1290 + }, + { + "epoch": 0.1, + "learning_rate": 1.972741574779962e-05, + "loss": 0.531, + "step": 1291 + }, + { + "epoch": 0.1, + "learning_rate": 1.9726820385715877e-05, + "loss": 0.4573, + "step": 1292 + }, + { + "epoch": 0.1, + "learning_rate": 1.9726224383167815e-05, + "loss": 0.3515, + "step": 1293 + }, + { + "epoch": 0.1, + "learning_rate": 1.9725627740194673e-05, + "loss": 0.3772, + "step": 1294 + }, + { + "epoch": 0.1, + "learning_rate": 1.9725030456835745e-05, + "loss": 0.3064, + "step": 1295 + }, + { + "epoch": 0.1, + "learning_rate": 1.9724432533130355e-05, + "loss": 0.5013, + "step": 1296 + }, + { + "epoch": 0.1, + "learning_rate": 1.972383396911787e-05, + "loss": 0.4621, + "step": 1297 + }, + { + "epoch": 0.1, + "learning_rate": 1.9723234764837708e-05, + "loss": 0.3751, + "step": 1298 + }, + { + "epoch": 0.1, + "learning_rate": 1.9722634920329323e-05, + "loss": 0.3972, + "step": 1299 + }, + { + "epoch": 0.1, + "learning_rate": 1.9722034435632207e-05, + "loss": 0.5768, + "step": 1300 + }, + { + "epoch": 0.1, + "learning_rate": 1.972143331078591e-05, + "loss": 0.4982, + "step": 1301 + }, + { + "epoch": 0.1, + "learning_rate": 1.972083154583e-05, + "loss": 0.4241, + "step": 1302 + }, + { + "epoch": 0.1, + "learning_rate": 1.972022914080411e-05, + "loss": 0.3216, + "step": 1303 + }, + { + "epoch": 0.1, + "learning_rate": 1.9719626095747897e-05, + "loss": 0.5108, + "step": 1304 + }, + { + "epoch": 0.1, + "learning_rate": 1.971902241070108e-05, + "loss": 0.4501, + "step": 1305 + }, + { + "epoch": 0.1, + "learning_rate": 1.9718418085703397e-05, + "loss": 0.481, + "step": 1306 + }, + { + "epoch": 0.1, + "learning_rate": 1.971781312079465e-05, + "loss": 0.3216, + "step": 1307 + }, + { + "epoch": 0.1, + "learning_rate": 1.9717207516014664e-05, + "loss": 0.4592, + "step": 1308 + }, + { + "epoch": 0.1, + "learning_rate": 1.9716601271403322e-05, + "loss": 0.4164, + "step": 1309 + }, + { + "epoch": 0.1, + "learning_rate": 1.9715994387000537e-05, + "loss": 0.5396, + "step": 1310 + }, + { + "epoch": 0.1, + "learning_rate": 1.9715386862846272e-05, + "loss": 0.4403, + "step": 1311 + }, + { + "epoch": 0.1, + "learning_rate": 1.971477869898053e-05, + "loss": 0.3807, + "step": 1312 + }, + { + "epoch": 0.1, + "learning_rate": 1.9714169895443357e-05, + "loss": 0.3965, + "step": 1313 + }, + { + "epoch": 0.1, + "learning_rate": 1.971356045227484e-05, + "loss": 0.534, + "step": 1314 + }, + { + "epoch": 0.1, + "learning_rate": 1.97129503695151e-05, + "loss": 0.4512, + "step": 1315 + }, + { + "epoch": 0.1, + "learning_rate": 1.9712339647204313e-05, + "loss": 0.458, + "step": 1316 + }, + { + "epoch": 0.1, + "learning_rate": 1.97117282853827e-05, + "loss": 0.2889, + "step": 1317 + }, + { + "epoch": 0.1, + "learning_rate": 1.9711116284090506e-05, + "loss": 0.4503, + "step": 1318 + }, + { + "epoch": 0.1, + "learning_rate": 1.971050364336803e-05, + "loss": 0.4798, + "step": 1319 + }, + { + "epoch": 0.1, + "learning_rate": 1.9709890363255617e-05, + "loss": 0.5163, + "step": 1320 + }, + { + "epoch": 0.1, + "learning_rate": 1.9709276443793638e-05, + "loss": 0.4998, + "step": 1321 + }, + { + "epoch": 0.1, + "learning_rate": 1.970866188502253e-05, + "loss": 0.5327, + "step": 1322 + }, + { + "epoch": 0.1, + "learning_rate": 1.970804668698275e-05, + "loss": 0.4054, + "step": 1323 + }, + { + "epoch": 0.1, + "learning_rate": 1.970743084971481e-05, + "loss": 0.5559, + "step": 1324 + }, + { + "epoch": 0.1, + "learning_rate": 1.970681437325925e-05, + "loss": 0.4523, + "step": 1325 + }, + { + "epoch": 0.11, + "learning_rate": 1.9706197257656675e-05, + "loss": 0.4899, + "step": 1326 + }, + { + "epoch": 0.11, + "learning_rate": 1.9705579502947712e-05, + "loss": 0.397, + "step": 1327 + }, + { + "epoch": 0.11, + "learning_rate": 1.9704961109173042e-05, + "loss": 0.5988, + "step": 1328 + }, + { + "epoch": 0.11, + "learning_rate": 1.9704342076373378e-05, + "loss": 0.5063, + "step": 1329 + }, + { + "epoch": 0.11, + "learning_rate": 1.9703722404589484e-05, + "loss": 0.3583, + "step": 1330 + }, + { + "epoch": 0.11, + "learning_rate": 1.970310209386216e-05, + "loss": 0.4242, + "step": 1331 + }, + { + "epoch": 0.11, + "learning_rate": 1.9702481144232253e-05, + "loss": 0.4139, + "step": 1332 + }, + { + "epoch": 0.11, + "learning_rate": 1.9701859555740647e-05, + "loss": 0.3979, + "step": 1333 + }, + { + "epoch": 0.11, + "learning_rate": 1.9701237328428272e-05, + "loss": 0.4168, + "step": 1334 + }, + { + "epoch": 0.11, + "learning_rate": 1.9700614462336096e-05, + "loss": 0.4663, + "step": 1335 + }, + { + "epoch": 0.11, + "learning_rate": 1.9699990957505136e-05, + "loss": 0.4349, + "step": 1336 + }, + { + "epoch": 0.11, + "learning_rate": 1.9699366813976443e-05, + "loss": 0.3355, + "step": 1337 + }, + { + "epoch": 0.11, + "learning_rate": 1.9698742031791118e-05, + "loss": 0.4293, + "step": 1338 + }, + { + "epoch": 0.11, + "learning_rate": 1.96981166109903e-05, + "loss": 0.3956, + "step": 1339 + }, + { + "epoch": 0.11, + "learning_rate": 1.9697490551615162e-05, + "loss": 0.5424, + "step": 1340 + }, + { + "epoch": 0.11, + "learning_rate": 1.9696863853706937e-05, + "loss": 0.3549, + "step": 1341 + }, + { + "epoch": 0.11, + "learning_rate": 1.969623651730688e-05, + "loss": 0.3475, + "step": 1342 + }, + { + "epoch": 0.11, + "learning_rate": 1.969560854245631e-05, + "loss": 0.4433, + "step": 1343 + }, + { + "epoch": 0.11, + "learning_rate": 1.9694979929196566e-05, + "loss": 0.4569, + "step": 1344 + }, + { + "epoch": 0.11, + "learning_rate": 1.9694350677569043e-05, + "loss": 0.4035, + "step": 1345 + }, + { + "epoch": 0.11, + "learning_rate": 1.9693720787615174e-05, + "loss": 0.4386, + "step": 1346 + }, + { + "epoch": 0.11, + "learning_rate": 1.9693090259376436e-05, + "loss": 0.3998, + "step": 1347 + }, + { + "epoch": 0.11, + "learning_rate": 1.9692459092894343e-05, + "loss": 0.4668, + "step": 1348 + }, + { + "epoch": 0.11, + "learning_rate": 1.969182728821046e-05, + "loss": 0.4699, + "step": 1349 + }, + { + "epoch": 0.11, + "learning_rate": 1.969119484536638e-05, + "loss": 0.4695, + "step": 1350 + }, + { + "epoch": 0.11, + "learning_rate": 1.969056176440375e-05, + "loss": 0.3789, + "step": 1351 + }, + { + "epoch": 0.11, + "learning_rate": 1.9689928045364258e-05, + "loss": 0.3404, + "step": 1352 + }, + { + "epoch": 0.11, + "learning_rate": 1.9689293688289627e-05, + "loss": 0.5195, + "step": 1353 + }, + { + "epoch": 0.11, + "learning_rate": 1.968865869322163e-05, + "loss": 0.4015, + "step": 1354 + }, + { + "epoch": 0.11, + "learning_rate": 1.968802306020208e-05, + "loss": 0.5871, + "step": 1355 + }, + { + "epoch": 0.11, + "learning_rate": 1.968738678927282e-05, + "loss": 0.5685, + "step": 1356 + }, + { + "epoch": 0.11, + "learning_rate": 1.9686749880475756e-05, + "loss": 0.4103, + "step": 1357 + }, + { + "epoch": 0.11, + "learning_rate": 1.9686112333852826e-05, + "loss": 0.4195, + "step": 1358 + }, + { + "epoch": 0.11, + "learning_rate": 1.9685474149446e-05, + "loss": 0.5201, + "step": 1359 + }, + { + "epoch": 0.11, + "learning_rate": 1.9684835327297306e-05, + "loss": 0.4402, + "step": 1360 + }, + { + "epoch": 0.11, + "learning_rate": 1.9684195867448806e-05, + "loss": 0.3823, + "step": 1361 + }, + { + "epoch": 0.11, + "learning_rate": 1.9683555769942608e-05, + "loss": 0.5281, + "step": 1362 + }, + { + "epoch": 0.11, + "learning_rate": 1.968291503482086e-05, + "loss": 0.4295, + "step": 1363 + }, + { + "epoch": 0.11, + "learning_rate": 1.968227366212574e-05, + "loss": 0.4718, + "step": 1364 + }, + { + "epoch": 0.11, + "learning_rate": 1.968163165189949e-05, + "loss": 0.4864, + "step": 1365 + }, + { + "epoch": 0.11, + "learning_rate": 1.9680989004184383e-05, + "loss": 0.3038, + "step": 1366 + }, + { + "epoch": 0.11, + "learning_rate": 1.968034571902273e-05, + "loss": 0.4419, + "step": 1367 + }, + { + "epoch": 0.11, + "learning_rate": 1.967970179645689e-05, + "loss": 0.4248, + "step": 1368 + }, + { + "epoch": 0.11, + "learning_rate": 1.9679057236529266e-05, + "loss": 0.4758, + "step": 1369 + }, + { + "epoch": 0.11, + "learning_rate": 1.9678412039282292e-05, + "loss": 0.5392, + "step": 1370 + }, + { + "epoch": 0.11, + "learning_rate": 1.967776620475846e-05, + "loss": 0.391, + "step": 1371 + }, + { + "epoch": 0.11, + "learning_rate": 1.9677119733000283e-05, + "loss": 0.5069, + "step": 1372 + }, + { + "epoch": 0.11, + "learning_rate": 1.967647262405034e-05, + "loss": 0.5139, + "step": 1373 + }, + { + "epoch": 0.11, + "learning_rate": 1.967582487795123e-05, + "loss": 0.3163, + "step": 1374 + }, + { + "epoch": 0.11, + "learning_rate": 1.967517649474561e-05, + "loss": 0.3057, + "step": 1375 + }, + { + "epoch": 0.11, + "learning_rate": 1.9674527474476175e-05, + "loss": 0.4374, + "step": 1376 + }, + { + "epoch": 0.11, + "learning_rate": 1.9673877817185656e-05, + "loss": 0.3708, + "step": 1377 + }, + { + "epoch": 0.11, + "learning_rate": 1.9673227522916827e-05, + "loss": 0.4855, + "step": 1378 + }, + { + "epoch": 0.11, + "learning_rate": 1.9672576591712517e-05, + "loss": 0.3572, + "step": 1379 + }, + { + "epoch": 0.11, + "learning_rate": 1.9671925023615572e-05, + "loss": 0.4179, + "step": 1380 + }, + { + "epoch": 0.11, + "learning_rate": 1.9671272818668906e-05, + "loss": 0.3952, + "step": 1381 + }, + { + "epoch": 0.11, + "learning_rate": 1.967061997691546e-05, + "loss": 0.3259, + "step": 1382 + }, + { + "epoch": 0.11, + "learning_rate": 1.966996649839822e-05, + "loss": 0.4694, + "step": 1383 + }, + { + "epoch": 0.11, + "learning_rate": 1.9669312383160217e-05, + "loss": 0.4401, + "step": 1384 + }, + { + "epoch": 0.11, + "learning_rate": 1.966865763124452e-05, + "loss": 0.3648, + "step": 1385 + }, + { + "epoch": 0.11, + "learning_rate": 1.966800224269424e-05, + "loss": 0.3914, + "step": 1386 + }, + { + "epoch": 0.11, + "learning_rate": 1.9667346217552528e-05, + "loss": 0.4736, + "step": 1387 + }, + { + "epoch": 0.11, + "learning_rate": 1.9666689555862586e-05, + "loss": 0.3737, + "step": 1388 + }, + { + "epoch": 0.11, + "learning_rate": 1.966603225766765e-05, + "loss": 0.3338, + "step": 1389 + }, + { + "epoch": 0.11, + "learning_rate": 1.9665374323011002e-05, + "loss": 0.344, + "step": 1390 + }, + { + "epoch": 0.11, + "learning_rate": 1.9664715751935958e-05, + "loss": 0.3035, + "step": 1391 + }, + { + "epoch": 0.11, + "learning_rate": 1.9664056544485887e-05, + "loss": 0.505, + "step": 1392 + }, + { + "epoch": 0.11, + "learning_rate": 1.9663396700704195e-05, + "loss": 0.3742, + "step": 1393 + }, + { + "epoch": 0.11, + "learning_rate": 1.9662736220634325e-05, + "loss": 0.3997, + "step": 1394 + }, + { + "epoch": 0.11, + "learning_rate": 1.966207510431977e-05, + "loss": 0.5213, + "step": 1395 + }, + { + "epoch": 0.11, + "learning_rate": 1.966141335180406e-05, + "loss": 0.4413, + "step": 1396 + }, + { + "epoch": 0.11, + "learning_rate": 1.966075096313077e-05, + "loss": 0.3747, + "step": 1397 + }, + { + "epoch": 0.11, + "learning_rate": 1.966008793834351e-05, + "loss": 0.4642, + "step": 1398 + }, + { + "epoch": 0.11, + "learning_rate": 1.9659424277485943e-05, + "loss": 0.4506, + "step": 1399 + }, + { + "epoch": 0.11, + "learning_rate": 1.9658759980601766e-05, + "loss": 0.4326, + "step": 1400 + }, + { + "epoch": 0.11, + "learning_rate": 1.9658095047734718e-05, + "loss": 0.4413, + "step": 1401 + }, + { + "epoch": 0.11, + "learning_rate": 1.965742947892858e-05, + "loss": 0.424, + "step": 1402 + }, + { + "epoch": 0.11, + "learning_rate": 1.9656763274227188e-05, + "loss": 0.2823, + "step": 1403 + }, + { + "epoch": 0.11, + "learning_rate": 1.9656096433674393e-05, + "loss": 0.3504, + "step": 1404 + }, + { + "epoch": 0.11, + "learning_rate": 1.965542895731411e-05, + "loss": 0.4783, + "step": 1405 + }, + { + "epoch": 0.11, + "learning_rate": 1.965476084519029e-05, + "loss": 0.4495, + "step": 1406 + }, + { + "epoch": 0.11, + "learning_rate": 1.9654092097346925e-05, + "loss": 0.4662, + "step": 1407 + }, + { + "epoch": 0.11, + "learning_rate": 1.965342271382805e-05, + "loss": 0.4943, + "step": 1408 + }, + { + "epoch": 0.11, + "learning_rate": 1.9652752694677735e-05, + "loss": 0.4273, + "step": 1409 + }, + { + "epoch": 0.11, + "learning_rate": 1.9652082039940102e-05, + "loss": 0.4313, + "step": 1410 + }, + { + "epoch": 0.11, + "learning_rate": 1.965141074965931e-05, + "loss": 0.4806, + "step": 1411 + }, + { + "epoch": 0.11, + "learning_rate": 1.965073882387956e-05, + "loss": 0.4224, + "step": 1412 + }, + { + "epoch": 0.11, + "learning_rate": 1.9650066262645097e-05, + "loss": 0.3804, + "step": 1413 + }, + { + "epoch": 0.11, + "learning_rate": 1.96493930660002e-05, + "loss": 0.4907, + "step": 1414 + }, + { + "epoch": 0.11, + "learning_rate": 1.9648719233989202e-05, + "loss": 0.3922, + "step": 1415 + }, + { + "epoch": 0.11, + "learning_rate": 1.9648044766656466e-05, + "loss": 0.3935, + "step": 1416 + }, + { + "epoch": 0.11, + "learning_rate": 1.9647369664046407e-05, + "loss": 0.4149, + "step": 1417 + }, + { + "epoch": 0.11, + "learning_rate": 1.9646693926203477e-05, + "loss": 0.5757, + "step": 1418 + }, + { + "epoch": 0.11, + "learning_rate": 1.964601755317217e-05, + "loss": 0.3758, + "step": 1419 + }, + { + "epoch": 0.11, + "learning_rate": 1.9645340544997017e-05, + "loss": 0.3541, + "step": 1420 + }, + { + "epoch": 0.11, + "learning_rate": 1.9644662901722603e-05, + "loss": 0.4254, + "step": 1421 + }, + { + "epoch": 0.11, + "learning_rate": 1.9643984623393542e-05, + "loss": 0.3137, + "step": 1422 + }, + { + "epoch": 0.11, + "learning_rate": 1.96433057100545e-05, + "loss": 0.4151, + "step": 1423 + }, + { + "epoch": 0.11, + "learning_rate": 1.9642626161750176e-05, + "loss": 0.5281, + "step": 1424 + }, + { + "epoch": 0.11, + "learning_rate": 1.9641945978525318e-05, + "loss": 0.4291, + "step": 1425 + }, + { + "epoch": 0.11, + "learning_rate": 1.9641265160424705e-05, + "loss": 0.4627, + "step": 1426 + }, + { + "epoch": 0.11, + "learning_rate": 1.9640583707493176e-05, + "loss": 0.3875, + "step": 1427 + }, + { + "epoch": 0.11, + "learning_rate": 1.96399016197756e-05, + "loss": 0.5014, + "step": 1428 + }, + { + "epoch": 0.11, + "learning_rate": 1.9639218897316885e-05, + "loss": 0.4956, + "step": 1429 + }, + { + "epoch": 0.11, + "learning_rate": 1.9638535540161988e-05, + "loss": 0.4108, + "step": 1430 + }, + { + "epoch": 0.11, + "learning_rate": 1.96378515483559e-05, + "loss": 0.3751, + "step": 1431 + }, + { + "epoch": 0.11, + "learning_rate": 1.9637166921943663e-05, + "loss": 0.4936, + "step": 1432 + }, + { + "epoch": 0.11, + "learning_rate": 1.963648166097036e-05, + "loss": 0.4658, + "step": 1433 + }, + { + "epoch": 0.11, + "learning_rate": 1.9635795765481102e-05, + "loss": 0.392, + "step": 1434 + }, + { + "epoch": 0.11, + "learning_rate": 1.9635109235521057e-05, + "loss": 0.6297, + "step": 1435 + }, + { + "epoch": 0.11, + "learning_rate": 1.963442207113543e-05, + "loss": 0.5046, + "step": 1436 + }, + { + "epoch": 0.11, + "learning_rate": 1.9633734272369473e-05, + "loss": 0.4885, + "step": 1437 + }, + { + "epoch": 0.11, + "learning_rate": 1.9633045839268464e-05, + "loss": 0.4048, + "step": 1438 + }, + { + "epoch": 0.11, + "learning_rate": 1.9632356771877735e-05, + "loss": 0.3591, + "step": 1439 + }, + { + "epoch": 0.11, + "learning_rate": 1.9631667070242667e-05, + "loss": 0.3854, + "step": 1440 + }, + { + "epoch": 0.11, + "learning_rate": 1.963097673440866e-05, + "loss": 0.5236, + "step": 1441 + }, + { + "epoch": 0.11, + "learning_rate": 1.9630285764421183e-05, + "loss": 0.3711, + "step": 1442 + }, + { + "epoch": 0.11, + "learning_rate": 1.9629594160325725e-05, + "loss": 0.3854, + "step": 1443 + }, + { + "epoch": 0.11, + "learning_rate": 1.9628901922167823e-05, + "loss": 0.4786, + "step": 1444 + }, + { + "epoch": 0.11, + "learning_rate": 1.9628209049993064e-05, + "loss": 0.478, + "step": 1445 + }, + { + "epoch": 0.11, + "learning_rate": 1.9627515543847068e-05, + "loss": 0.4568, + "step": 1446 + }, + { + "epoch": 0.11, + "learning_rate": 1.9626821403775494e-05, + "loss": 0.382, + "step": 1447 + }, + { + "epoch": 0.11, + "learning_rate": 1.9626126629824056e-05, + "loss": 0.4949, + "step": 1448 + }, + { + "epoch": 0.11, + "learning_rate": 1.9625431222038494e-05, + "loss": 0.543, + "step": 1449 + }, + { + "epoch": 0.11, + "learning_rate": 1.9624735180464602e-05, + "loss": 0.5771, + "step": 1450 + }, + { + "epoch": 0.11, + "learning_rate": 1.962403850514821e-05, + "loss": 0.5122, + "step": 1451 + }, + { + "epoch": 0.12, + "learning_rate": 1.962334119613519e-05, + "loss": 0.3963, + "step": 1452 + }, + { + "epoch": 0.12, + "learning_rate": 1.9622643253471457e-05, + "loss": 0.3596, + "step": 1453 + }, + { + "epoch": 0.12, + "learning_rate": 1.9621944677202966e-05, + "loss": 0.401, + "step": 1454 + }, + { + "epoch": 0.12, + "learning_rate": 1.9621245467375715e-05, + "loss": 0.3187, + "step": 1455 + }, + { + "epoch": 0.12, + "learning_rate": 1.9620545624035748e-05, + "loss": 0.5443, + "step": 1456 + }, + { + "epoch": 0.12, + "learning_rate": 1.961984514722914e-05, + "loss": 0.3011, + "step": 1457 + }, + { + "epoch": 0.12, + "learning_rate": 1.9619144037002015e-05, + "loss": 0.4236, + "step": 1458 + }, + { + "epoch": 0.12, + "learning_rate": 1.9618442293400544e-05, + "loss": 0.5173, + "step": 1459 + }, + { + "epoch": 0.12, + "learning_rate": 1.9617739916470926e-05, + "loss": 0.4976, + "step": 1460 + }, + { + "epoch": 0.12, + "learning_rate": 1.9617036906259416e-05, + "loss": 0.5864, + "step": 1461 + }, + { + "epoch": 0.12, + "learning_rate": 1.9616333262812298e-05, + "loss": 0.3987, + "step": 1462 + }, + { + "epoch": 0.12, + "learning_rate": 1.9615628986175902e-05, + "loss": 0.4237, + "step": 1463 + }, + { + "epoch": 0.12, + "learning_rate": 1.9614924076396605e-05, + "loss": 0.4267, + "step": 1464 + }, + { + "epoch": 0.12, + "learning_rate": 1.9614218533520827e-05, + "loss": 0.3616, + "step": 1465 + }, + { + "epoch": 0.12, + "learning_rate": 1.9613512357595014e-05, + "loss": 0.3443, + "step": 1466 + }, + { + "epoch": 0.12, + "learning_rate": 1.9612805548665673e-05, + "loss": 0.4273, + "step": 1467 + }, + { + "epoch": 0.12, + "learning_rate": 1.961209810677934e-05, + "loss": 0.4128, + "step": 1468 + }, + { + "epoch": 0.12, + "learning_rate": 1.9611390031982595e-05, + "loss": 0.4887, + "step": 1469 + }, + { + "epoch": 0.12, + "learning_rate": 1.9610681324322068e-05, + "loss": 0.3552, + "step": 1470 + }, + { + "epoch": 0.12, + "learning_rate": 1.9609971983844412e-05, + "loss": 0.3638, + "step": 1471 + }, + { + "epoch": 0.12, + "learning_rate": 1.9609262010596346e-05, + "loss": 0.3602, + "step": 1472 + }, + { + "epoch": 0.12, + "learning_rate": 1.9608551404624613e-05, + "loss": 0.4291, + "step": 1473 + }, + { + "epoch": 0.12, + "learning_rate": 1.9607840165976003e-05, + "loss": 0.4069, + "step": 1474 + }, + { + "epoch": 0.12, + "learning_rate": 1.960712829469735e-05, + "loss": 0.4717, + "step": 1475 + }, + { + "epoch": 0.12, + "learning_rate": 1.9606415790835523e-05, + "loss": 0.4473, + "step": 1476 + }, + { + "epoch": 0.12, + "learning_rate": 1.9605702654437438e-05, + "loss": 0.3054, + "step": 1477 + }, + { + "epoch": 0.12, + "learning_rate": 1.9604988885550056e-05, + "loss": 0.384, + "step": 1478 + }, + { + "epoch": 0.12, + "learning_rate": 1.960427448422037e-05, + "loss": 0.498, + "step": 1479 + }, + { + "epoch": 0.12, + "learning_rate": 1.9603559450495423e-05, + "loss": 0.4271, + "step": 1480 + }, + { + "epoch": 0.12, + "learning_rate": 1.9602843784422297e-05, + "loss": 0.3251, + "step": 1481 + }, + { + "epoch": 0.12, + "learning_rate": 1.9602127486048112e-05, + "loss": 0.3824, + "step": 1482 + }, + { + "epoch": 0.12, + "learning_rate": 1.9601410555420035e-05, + "loss": 0.4166, + "step": 1483 + }, + { + "epoch": 0.12, + "learning_rate": 1.9600692992585275e-05, + "loss": 0.4798, + "step": 1484 + }, + { + "epoch": 0.12, + "learning_rate": 1.959997479759107e-05, + "loss": 0.429, + "step": 1485 + }, + { + "epoch": 0.12, + "learning_rate": 1.959925597048472e-05, + "loss": 0.4681, + "step": 1486 + }, + { + "epoch": 0.12, + "learning_rate": 1.9598536511313553e-05, + "loss": 0.453, + "step": 1487 + }, + { + "epoch": 0.12, + "learning_rate": 1.9597816420124945e-05, + "loss": 0.5064, + "step": 1488 + }, + { + "epoch": 0.12, + "learning_rate": 1.95970956969663e-05, + "loss": 0.465, + "step": 1489 + }, + { + "epoch": 0.12, + "learning_rate": 1.9596374341885093e-05, + "loss": 0.509, + "step": 1490 + }, + { + "epoch": 0.12, + "learning_rate": 1.95956523549288e-05, + "loss": 0.3047, + "step": 1491 + }, + { + "epoch": 0.12, + "learning_rate": 1.9594929736144978e-05, + "loss": 0.4956, + "step": 1492 + }, + { + "epoch": 0.12, + "learning_rate": 1.9594206485581196e-05, + "loss": 0.4416, + "step": 1493 + }, + { + "epoch": 0.12, + "learning_rate": 1.959348260328508e-05, + "loss": 0.3631, + "step": 1494 + }, + { + "epoch": 0.12, + "learning_rate": 1.95927580893043e-05, + "loss": 0.6089, + "step": 1495 + }, + { + "epoch": 0.12, + "learning_rate": 1.9592032943686554e-05, + "loss": 0.5047, + "step": 1496 + }, + { + "epoch": 0.12, + "learning_rate": 1.9591307166479595e-05, + "loss": 0.3962, + "step": 1497 + }, + { + "epoch": 0.12, + "learning_rate": 1.959058075773121e-05, + "loss": 0.4687, + "step": 1498 + }, + { + "epoch": 0.12, + "learning_rate": 1.9589853717489228e-05, + "loss": 0.4559, + "step": 1499 + }, + { + "epoch": 0.12, + "learning_rate": 1.958912604580152e-05, + "loss": 0.3896, + "step": 1500 + }, + { + "epoch": 0.12, + "learning_rate": 1.9588397742716004e-05, + "loss": 0.4196, + "step": 1501 + }, + { + "epoch": 0.12, + "learning_rate": 1.9587668808280632e-05, + "loss": 0.5378, + "step": 1502 + }, + { + "epoch": 0.12, + "learning_rate": 1.9586939242543402e-05, + "loss": 0.4519, + "step": 1503 + }, + { + "epoch": 0.12, + "learning_rate": 1.9586209045552355e-05, + "loss": 0.3849, + "step": 1504 + }, + { + "epoch": 0.12, + "learning_rate": 1.9585478217355563e-05, + "loss": 0.4598, + "step": 1505 + }, + { + "epoch": 0.12, + "learning_rate": 1.9584746758001156e-05, + "loss": 0.4632, + "step": 1506 + }, + { + "epoch": 0.12, + "learning_rate": 1.9584014667537293e-05, + "loss": 0.4867, + "step": 1507 + }, + { + "epoch": 0.12, + "learning_rate": 1.9583281946012183e-05, + "loss": 0.53, + "step": 1508 + }, + { + "epoch": 0.12, + "learning_rate": 1.9582548593474064e-05, + "loss": 0.5192, + "step": 1509 + }, + { + "epoch": 0.12, + "learning_rate": 1.9581814609971232e-05, + "loss": 0.3676, + "step": 1510 + }, + { + "epoch": 0.12, + "learning_rate": 1.958107999555201e-05, + "loss": 0.3668, + "step": 1511 + }, + { + "epoch": 0.12, + "learning_rate": 1.958034475026477e-05, + "loss": 0.4364, + "step": 1512 + }, + { + "epoch": 0.12, + "learning_rate": 1.957960887415793e-05, + "loss": 0.348, + "step": 1513 + }, + { + "epoch": 0.12, + "learning_rate": 1.9578872367279937e-05, + "loss": 0.3792, + "step": 1514 + }, + { + "epoch": 0.12, + "learning_rate": 1.957813522967929e-05, + "loss": 0.4592, + "step": 1515 + }, + { + "epoch": 0.12, + "learning_rate": 1.9577397461404527e-05, + "loss": 0.2659, + "step": 1516 + }, + { + "epoch": 0.12, + "learning_rate": 1.957665906250422e-05, + "loss": 0.4926, + "step": 1517 + }, + { + "epoch": 0.12, + "learning_rate": 1.9575920033027002e-05, + "loss": 0.3624, + "step": 1518 + }, + { + "epoch": 0.12, + "learning_rate": 1.9575180373021516e-05, + "loss": 0.3354, + "step": 1519 + }, + { + "epoch": 0.12, + "learning_rate": 1.9574440082536482e-05, + "loss": 0.346, + "step": 1520 + }, + { + "epoch": 0.12, + "learning_rate": 1.9573699161620635e-05, + "loss": 0.564, + "step": 1521 + }, + { + "epoch": 0.12, + "learning_rate": 1.9572957610322766e-05, + "loss": 0.2788, + "step": 1522 + }, + { + "epoch": 0.12, + "learning_rate": 1.95722154286917e-05, + "loss": 0.4411, + "step": 1523 + }, + { + "epoch": 0.12, + "learning_rate": 1.9571472616776304e-05, + "loss": 0.442, + "step": 1524 + }, + { + "epoch": 0.12, + "learning_rate": 1.9570729174625493e-05, + "loss": 0.4237, + "step": 1525 + }, + { + "epoch": 0.12, + "learning_rate": 1.956998510228822e-05, + "loss": 0.375, + "step": 1526 + }, + { + "epoch": 0.12, + "learning_rate": 1.956924039981347e-05, + "loss": 0.499, + "step": 1527 + }, + { + "epoch": 0.12, + "learning_rate": 1.956849506725029e-05, + "loss": 0.4879, + "step": 1528 + }, + { + "epoch": 0.12, + "learning_rate": 1.9567749104647746e-05, + "loss": 0.4401, + "step": 1529 + }, + { + "epoch": 0.12, + "learning_rate": 1.9567002512054964e-05, + "loss": 0.4317, + "step": 1530 + }, + { + "epoch": 0.12, + "learning_rate": 1.9566255289521096e-05, + "loss": 0.4312, + "step": 1531 + }, + { + "epoch": 0.12, + "learning_rate": 1.956550743709535e-05, + "loss": 0.3477, + "step": 1532 + }, + { + "epoch": 0.12, + "learning_rate": 1.9564758954826964e-05, + "loss": 0.4276, + "step": 1533 + }, + { + "epoch": 0.12, + "learning_rate": 1.9564009842765225e-05, + "loss": 0.3439, + "step": 1534 + }, + { + "epoch": 0.12, + "learning_rate": 1.956326010095946e-05, + "loss": 0.4918, + "step": 1535 + }, + { + "epoch": 0.12, + "learning_rate": 1.9562509729459024e-05, + "loss": 0.3804, + "step": 1536 + }, + { + "epoch": 0.12, + "learning_rate": 1.956175872831334e-05, + "loss": 0.5518, + "step": 1537 + }, + { + "epoch": 0.12, + "learning_rate": 1.9561007097571853e-05, + "loss": 0.4017, + "step": 1538 + }, + { + "epoch": 0.12, + "learning_rate": 1.9560254837284053e-05, + "loss": 0.365, + "step": 1539 + }, + { + "epoch": 0.12, + "learning_rate": 1.955950194749947e-05, + "loss": 0.504, + "step": 1540 + }, + { + "epoch": 0.12, + "learning_rate": 1.9558748428267682e-05, + "loss": 0.4586, + "step": 1541 + }, + { + "epoch": 0.12, + "learning_rate": 1.9557994279638307e-05, + "loss": 0.4415, + "step": 1542 + }, + { + "epoch": 0.12, + "learning_rate": 1.9557239501660995e-05, + "loss": 0.424, + "step": 1543 + }, + { + "epoch": 0.12, + "learning_rate": 1.955648409438545e-05, + "loss": 0.419, + "step": 1544 + }, + { + "epoch": 0.12, + "learning_rate": 1.955572805786141e-05, + "loss": 0.5058, + "step": 1545 + }, + { + "epoch": 0.12, + "learning_rate": 1.9554971392138655e-05, + "loss": 0.4232, + "step": 1546 + }, + { + "epoch": 0.12, + "learning_rate": 1.955421409726701e-05, + "loss": 0.4225, + "step": 1547 + }, + { + "epoch": 0.12, + "learning_rate": 1.9553456173296342e-05, + "loss": 0.5033, + "step": 1548 + }, + { + "epoch": 0.12, + "learning_rate": 1.9552697620276547e-05, + "loss": 0.5373, + "step": 1549 + }, + { + "epoch": 0.12, + "learning_rate": 1.9551938438257583e-05, + "loss": 0.3479, + "step": 1550 + }, + { + "epoch": 0.12, + "learning_rate": 1.9551178627289436e-05, + "loss": 0.4738, + "step": 1551 + }, + { + "epoch": 0.12, + "learning_rate": 1.9550418187422127e-05, + "loss": 0.2137, + "step": 1552 + }, + { + "epoch": 0.12, + "learning_rate": 1.954965711870574e-05, + "loss": 0.3754, + "step": 1553 + }, + { + "epoch": 0.12, + "learning_rate": 1.954889542119038e-05, + "loss": 0.4584, + "step": 1554 + }, + { + "epoch": 0.12, + "learning_rate": 1.9548133094926203e-05, + "loss": 0.3242, + "step": 1555 + }, + { + "epoch": 0.12, + "learning_rate": 1.9547370139963406e-05, + "loss": 0.5547, + "step": 1556 + }, + { + "epoch": 0.12, + "learning_rate": 1.954660655635222e-05, + "loss": 0.4418, + "step": 1557 + }, + { + "epoch": 0.12, + "learning_rate": 1.954584234414293e-05, + "loss": 0.5087, + "step": 1558 + }, + { + "epoch": 0.12, + "learning_rate": 1.954507750338585e-05, + "loss": 0.3852, + "step": 1559 + }, + { + "epoch": 0.12, + "learning_rate": 1.954431203413135e-05, + "loss": 0.4628, + "step": 1560 + }, + { + "epoch": 0.12, + "learning_rate": 1.9543545936429824e-05, + "loss": 0.463, + "step": 1561 + }, + { + "epoch": 0.12, + "learning_rate": 1.954277921033172e-05, + "loss": 0.5194, + "step": 1562 + }, + { + "epoch": 0.12, + "learning_rate": 1.954201185588752e-05, + "loss": 0.531, + "step": 1563 + }, + { + "epoch": 0.12, + "learning_rate": 1.9541243873147752e-05, + "loss": 0.3609, + "step": 1564 + }, + { + "epoch": 0.12, + "learning_rate": 1.9540475262162988e-05, + "loss": 0.5692, + "step": 1565 + }, + { + "epoch": 0.12, + "learning_rate": 1.9539706022983827e-05, + "loss": 0.4161, + "step": 1566 + }, + { + "epoch": 0.12, + "learning_rate": 1.9538936155660934e-05, + "loss": 0.5487, + "step": 1567 + }, + { + "epoch": 0.12, + "learning_rate": 1.953816566024499e-05, + "loss": 0.564, + "step": 1568 + }, + { + "epoch": 0.12, + "learning_rate": 1.9537394536786734e-05, + "loss": 0.4471, + "step": 1569 + }, + { + "epoch": 0.12, + "learning_rate": 1.9536622785336936e-05, + "loss": 0.4243, + "step": 1570 + }, + { + "epoch": 0.12, + "learning_rate": 1.953585040594642e-05, + "loss": 0.3148, + "step": 1571 + }, + { + "epoch": 0.12, + "learning_rate": 1.9535077398666034e-05, + "loss": 0.5224, + "step": 1572 + }, + { + "epoch": 0.12, + "learning_rate": 1.953430376354668e-05, + "loss": 0.3741, + "step": 1573 + }, + { + "epoch": 0.12, + "learning_rate": 1.9533529500639302e-05, + "loss": 0.4927, + "step": 1574 + }, + { + "epoch": 0.12, + "learning_rate": 1.9532754609994878e-05, + "loss": 0.3586, + "step": 1575 + }, + { + "epoch": 0.12, + "learning_rate": 1.953197909166443e-05, + "loss": 0.5249, + "step": 1576 + }, + { + "epoch": 0.12, + "learning_rate": 1.9531202945699027e-05, + "loss": 0.3582, + "step": 1577 + }, + { + "epoch": 0.13, + "learning_rate": 1.953042617214977e-05, + "loss": 0.4187, + "step": 1578 + }, + { + "epoch": 0.13, + "learning_rate": 1.9529648771067805e-05, + "loss": 0.4051, + "step": 1579 + }, + { + "epoch": 0.13, + "learning_rate": 1.9528870742504328e-05, + "loss": 0.3816, + "step": 1580 + }, + { + "epoch": 0.13, + "learning_rate": 1.9528092086510556e-05, + "loss": 0.4854, + "step": 1581 + }, + { + "epoch": 0.13, + "learning_rate": 1.9527312803137767e-05, + "loss": 0.4689, + "step": 1582 + }, + { + "epoch": 0.13, + "learning_rate": 1.9526532892437275e-05, + "loss": 0.5491, + "step": 1583 + }, + { + "epoch": 0.13, + "learning_rate": 1.9525752354460433e-05, + "loss": 0.4851, + "step": 1584 + }, + { + "epoch": 0.13, + "learning_rate": 1.9524971189258627e-05, + "loss": 0.4054, + "step": 1585 + }, + { + "epoch": 0.13, + "learning_rate": 1.9524189396883307e-05, + "loss": 0.3477, + "step": 1586 + }, + { + "epoch": 0.13, + "learning_rate": 1.9523406977385937e-05, + "loss": 0.3977, + "step": 1587 + }, + { + "epoch": 0.13, + "learning_rate": 1.9522623930818043e-05, + "loss": 0.3295, + "step": 1588 + }, + { + "epoch": 0.13, + "learning_rate": 1.9521840257231183e-05, + "loss": 0.4465, + "step": 1589 + }, + { + "epoch": 0.13, + "learning_rate": 1.9521055956676956e-05, + "loss": 0.4816, + "step": 1590 + }, + { + "epoch": 0.13, + "learning_rate": 1.9520271029207008e-05, + "loss": 0.3901, + "step": 1591 + }, + { + "epoch": 0.13, + "learning_rate": 1.9519485474873027e-05, + "loss": 0.4353, + "step": 1592 + }, + { + "epoch": 0.13, + "learning_rate": 1.9518699293726727e-05, + "loss": 0.3701, + "step": 1593 + }, + { + "epoch": 0.13, + "learning_rate": 1.9517912485819878e-05, + "loss": 0.4238, + "step": 1594 + }, + { + "epoch": 0.13, + "learning_rate": 1.9517125051204292e-05, + "loss": 0.4679, + "step": 1595 + }, + { + "epoch": 0.13, + "learning_rate": 1.9516336989931813e-05, + "loss": 0.5188, + "step": 1596 + }, + { + "epoch": 0.13, + "learning_rate": 1.9515548302054335e-05, + "loss": 0.4892, + "step": 1597 + }, + { + "epoch": 0.13, + "learning_rate": 1.9514758987623784e-05, + "loss": 0.2911, + "step": 1598 + }, + { + "epoch": 0.13, + "learning_rate": 1.9513969046692137e-05, + "loss": 0.4767, + "step": 1599 + }, + { + "epoch": 0.13, + "learning_rate": 1.951317847931141e-05, + "loss": 0.3964, + "step": 1600 + }, + { + "epoch": 0.13, + "learning_rate": 1.9512387285533655e-05, + "loss": 0.4541, + "step": 1601 + }, + { + "epoch": 0.13, + "learning_rate": 1.951159546541096e-05, + "loss": 0.522, + "step": 1602 + }, + { + "epoch": 0.13, + "learning_rate": 1.9510803018995477e-05, + "loss": 0.4103, + "step": 1603 + }, + { + "epoch": 0.13, + "learning_rate": 1.9510009946339377e-05, + "loss": 0.4716, + "step": 1604 + }, + { + "epoch": 0.13, + "learning_rate": 1.9509216247494882e-05, + "loss": 0.3742, + "step": 1605 + }, + { + "epoch": 0.13, + "learning_rate": 1.950842192251425e-05, + "loss": 0.3811, + "step": 1606 + }, + { + "epoch": 0.13, + "learning_rate": 1.950762697144979e-05, + "loss": 0.3408, + "step": 1607 + }, + { + "epoch": 0.13, + "learning_rate": 1.950683139435384e-05, + "loss": 0.2408, + "step": 1608 + }, + { + "epoch": 0.13, + "learning_rate": 1.9506035191278784e-05, + "loss": 0.5414, + "step": 1609 + }, + { + "epoch": 0.13, + "learning_rate": 1.9505238362277054e-05, + "loss": 0.4198, + "step": 1610 + }, + { + "epoch": 0.13, + "learning_rate": 1.9504440907401113e-05, + "loss": 0.4553, + "step": 1611 + }, + { + "epoch": 0.13, + "learning_rate": 1.9503642826703468e-05, + "loss": 0.4552, + "step": 1612 + }, + { + "epoch": 0.13, + "learning_rate": 1.950284412023668e-05, + "loss": 0.3429, + "step": 1613 + }, + { + "epoch": 0.13, + "learning_rate": 1.9502044788053322e-05, + "loss": 0.474, + "step": 1614 + }, + { + "epoch": 0.13, + "learning_rate": 1.9501244830206037e-05, + "loss": 0.3958, + "step": 1615 + }, + { + "epoch": 0.13, + "learning_rate": 1.9500444246747502e-05, + "loss": 0.397, + "step": 1616 + }, + { + "epoch": 0.13, + "learning_rate": 1.9499643037730422e-05, + "loss": 0.3723, + "step": 1617 + }, + { + "epoch": 0.13, + "learning_rate": 1.949884120320756e-05, + "loss": 0.3618, + "step": 1618 + }, + { + "epoch": 0.13, + "learning_rate": 1.949803874323171e-05, + "loss": 0.3546, + "step": 1619 + }, + { + "epoch": 0.13, + "learning_rate": 1.949723565785571e-05, + "loss": 0.5023, + "step": 1620 + }, + { + "epoch": 0.13, + "learning_rate": 1.9496431947132438e-05, + "loss": 0.4134, + "step": 1621 + }, + { + "epoch": 0.13, + "learning_rate": 1.9495627611114817e-05, + "loss": 0.3906, + "step": 1622 + }, + { + "epoch": 0.13, + "learning_rate": 1.949482264985581e-05, + "loss": 0.5138, + "step": 1623 + }, + { + "epoch": 0.13, + "learning_rate": 1.9494017063408415e-05, + "loss": 0.5416, + "step": 1624 + }, + { + "epoch": 0.13, + "learning_rate": 1.9493210851825682e-05, + "loss": 0.4509, + "step": 1625 + }, + { + "epoch": 0.13, + "learning_rate": 1.949240401516069e-05, + "loss": 0.3872, + "step": 1626 + }, + { + "epoch": 0.13, + "learning_rate": 1.9491596553466568e-05, + "loss": 0.378, + "step": 1627 + }, + { + "epoch": 0.13, + "learning_rate": 1.9490788466796483e-05, + "loss": 0.4334, + "step": 1628 + }, + { + "epoch": 0.13, + "learning_rate": 1.9489979755203646e-05, + "loss": 0.3707, + "step": 1629 + }, + { + "epoch": 0.13, + "learning_rate": 1.9489170418741306e-05, + "loss": 0.4678, + "step": 1630 + }, + { + "epoch": 0.13, + "learning_rate": 1.948836045746275e-05, + "loss": 0.433, + "step": 1631 + }, + { + "epoch": 0.13, + "learning_rate": 1.9487549871421316e-05, + "loss": 0.4344, + "step": 1632 + }, + { + "epoch": 0.13, + "learning_rate": 1.9486738660670373e-05, + "loss": 0.5315, + "step": 1633 + }, + { + "epoch": 0.13, + "learning_rate": 1.9485926825263334e-05, + "loss": 0.3929, + "step": 1634 + }, + { + "epoch": 0.13, + "learning_rate": 1.948511436525366e-05, + "loss": 0.4857, + "step": 1635 + }, + { + "epoch": 0.13, + "learning_rate": 1.9484301280694845e-05, + "loss": 0.3747, + "step": 1636 + }, + { + "epoch": 0.13, + "learning_rate": 1.9483487571640424e-05, + "loss": 0.4798, + "step": 1637 + }, + { + "epoch": 0.13, + "learning_rate": 1.948267323814398e-05, + "loss": 0.3221, + "step": 1638 + }, + { + "epoch": 0.13, + "learning_rate": 1.948185828025913e-05, + "loss": 0.3148, + "step": 1639 + }, + { + "epoch": 0.13, + "learning_rate": 1.9481042698039534e-05, + "loss": 0.3998, + "step": 1640 + }, + { + "epoch": 0.13, + "learning_rate": 1.94802264915389e-05, + "loss": 0.4241, + "step": 1641 + }, + { + "epoch": 0.13, + "learning_rate": 1.9479409660810965e-05, + "loss": 0.4094, + "step": 1642 + }, + { + "epoch": 0.13, + "learning_rate": 1.9478592205909517e-05, + "loss": 0.4072, + "step": 1643 + }, + { + "epoch": 0.13, + "learning_rate": 1.947777412688838e-05, + "loss": 0.3626, + "step": 1644 + }, + { + "epoch": 0.13, + "learning_rate": 1.947695542380142e-05, + "loss": 0.4721, + "step": 1645 + }, + { + "epoch": 0.13, + "learning_rate": 1.9476136096702546e-05, + "loss": 0.3161, + "step": 1646 + }, + { + "epoch": 0.13, + "learning_rate": 1.9475316145645706e-05, + "loss": 0.4389, + "step": 1647 + }, + { + "epoch": 0.13, + "learning_rate": 1.947449557068489e-05, + "loss": 0.3301, + "step": 1648 + }, + { + "epoch": 0.13, + "learning_rate": 1.947367437187413e-05, + "loss": 0.4499, + "step": 1649 + }, + { + "epoch": 0.13, + "learning_rate": 1.9472852549267496e-05, + "loss": 0.5421, + "step": 1650 + }, + { + "epoch": 0.13, + "learning_rate": 1.9472030102919102e-05, + "loss": 0.4887, + "step": 1651 + }, + { + "epoch": 0.13, + "learning_rate": 1.9471207032883103e-05, + "loss": 0.4918, + "step": 1652 + }, + { + "epoch": 0.13, + "learning_rate": 1.9470383339213693e-05, + "loss": 0.4633, + "step": 1653 + }, + { + "epoch": 0.13, + "learning_rate": 1.946955902196511e-05, + "loss": 0.496, + "step": 1654 + }, + { + "epoch": 0.13, + "learning_rate": 1.9468734081191627e-05, + "loss": 0.3838, + "step": 1655 + }, + { + "epoch": 0.13, + "learning_rate": 1.9467908516947568e-05, + "loss": 0.5231, + "step": 1656 + }, + { + "epoch": 0.13, + "learning_rate": 1.946708232928729e-05, + "loss": 0.569, + "step": 1657 + }, + { + "epoch": 0.13, + "learning_rate": 1.9466255518265193e-05, + "loss": 0.4911, + "step": 1658 + }, + { + "epoch": 0.13, + "learning_rate": 1.946542808393572e-05, + "loss": 0.4887, + "step": 1659 + }, + { + "epoch": 0.13, + "learning_rate": 1.946460002635335e-05, + "loss": 0.4345, + "step": 1660 + }, + { + "epoch": 0.13, + "learning_rate": 1.946377134557261e-05, + "loss": 0.5363, + "step": 1661 + }, + { + "epoch": 0.13, + "learning_rate": 1.9462942041648062e-05, + "loss": 0.3022, + "step": 1662 + }, + { + "epoch": 0.13, + "learning_rate": 1.9462112114634316e-05, + "loss": 0.4302, + "step": 1663 + }, + { + "epoch": 0.13, + "learning_rate": 1.9461281564586014e-05, + "loss": 0.3774, + "step": 1664 + }, + { + "epoch": 0.13, + "learning_rate": 1.9460450391557847e-05, + "loss": 0.4341, + "step": 1665 + }, + { + "epoch": 0.13, + "learning_rate": 1.945961859560454e-05, + "loss": 0.4361, + "step": 1666 + }, + { + "epoch": 0.13, + "learning_rate": 1.9458786176780868e-05, + "loss": 0.3873, + "step": 1667 + }, + { + "epoch": 0.13, + "learning_rate": 1.945795313514164e-05, + "loss": 0.4237, + "step": 1668 + }, + { + "epoch": 0.13, + "learning_rate": 1.9457119470741707e-05, + "loss": 0.5772, + "step": 1669 + }, + { + "epoch": 0.13, + "learning_rate": 1.9456285183635958e-05, + "loss": 0.5132, + "step": 1670 + }, + { + "epoch": 0.13, + "learning_rate": 1.9455450273879332e-05, + "loss": 0.3145, + "step": 1671 + }, + { + "epoch": 0.13, + "learning_rate": 1.94546147415268e-05, + "loss": 0.5553, + "step": 1672 + }, + { + "epoch": 0.13, + "learning_rate": 1.9453778586633386e-05, + "loss": 0.4373, + "step": 1673 + }, + { + "epoch": 0.13, + "learning_rate": 1.9452941809254136e-05, + "loss": 0.6042, + "step": 1674 + }, + { + "epoch": 0.13, + "learning_rate": 1.9452104409444153e-05, + "loss": 0.4425, + "step": 1675 + }, + { + "epoch": 0.13, + "learning_rate": 1.9451266387258576e-05, + "loss": 0.3502, + "step": 1676 + }, + { + "epoch": 0.13, + "learning_rate": 1.9450427742752583e-05, + "loss": 0.4256, + "step": 1677 + }, + { + "epoch": 0.13, + "learning_rate": 1.9449588475981394e-05, + "loss": 0.3961, + "step": 1678 + }, + { + "epoch": 0.13, + "learning_rate": 1.9448748587000277e-05, + "loss": 0.4194, + "step": 1679 + }, + { + "epoch": 0.13, + "learning_rate": 1.944790807586453e-05, + "loss": 0.438, + "step": 1680 + }, + { + "epoch": 0.13, + "learning_rate": 1.9447066942629495e-05, + "loss": 0.2803, + "step": 1681 + }, + { + "epoch": 0.13, + "learning_rate": 1.9446225187350558e-05, + "loss": 0.5232, + "step": 1682 + }, + { + "epoch": 0.13, + "learning_rate": 1.9445382810083143e-05, + "loss": 0.4379, + "step": 1683 + }, + { + "epoch": 0.13, + "learning_rate": 1.944453981088272e-05, + "loss": 0.3789, + "step": 1684 + }, + { + "epoch": 0.13, + "learning_rate": 1.9443696189804793e-05, + "loss": 0.3598, + "step": 1685 + }, + { + "epoch": 0.13, + "learning_rate": 1.9442851946904914e-05, + "loss": 0.4064, + "step": 1686 + }, + { + "epoch": 0.13, + "learning_rate": 1.9442007082238673e-05, + "loss": 0.4124, + "step": 1687 + }, + { + "epoch": 0.13, + "learning_rate": 1.944116159586169e-05, + "loss": 0.3421, + "step": 1688 + }, + { + "epoch": 0.13, + "learning_rate": 1.944031548782965e-05, + "loss": 0.4213, + "step": 1689 + }, + { + "epoch": 0.13, + "learning_rate": 1.9439468758198258e-05, + "loss": 0.3991, + "step": 1690 + }, + { + "epoch": 0.13, + "learning_rate": 1.943862140702327e-05, + "loss": 0.4889, + "step": 1691 + }, + { + "epoch": 0.13, + "learning_rate": 1.9437773434360476e-05, + "loss": 0.4546, + "step": 1692 + }, + { + "epoch": 0.13, + "learning_rate": 1.943692484026571e-05, + "loss": 0.4437, + "step": 1693 + }, + { + "epoch": 0.13, + "learning_rate": 1.9436075624794853e-05, + "loss": 0.4146, + "step": 1694 + }, + { + "epoch": 0.13, + "learning_rate": 1.9435225788003822e-05, + "loss": 0.3858, + "step": 1695 + }, + { + "epoch": 0.13, + "learning_rate": 1.943437532994857e-05, + "loss": 0.4182, + "step": 1696 + }, + { + "epoch": 0.13, + "learning_rate": 1.9433524250685098e-05, + "loss": 0.457, + "step": 1697 + }, + { + "epoch": 0.13, + "learning_rate": 1.9432672550269446e-05, + "loss": 0.3386, + "step": 1698 + }, + { + "epoch": 0.13, + "learning_rate": 1.943182022875769e-05, + "loss": 0.3496, + "step": 1699 + }, + { + "epoch": 0.13, + "learning_rate": 1.9430967286205962e-05, + "loss": 0.3979, + "step": 1700 + }, + { + "epoch": 0.13, + "learning_rate": 1.9430113722670412e-05, + "loss": 0.3793, + "step": 1701 + }, + { + "epoch": 0.13, + "learning_rate": 1.942925953820725e-05, + "loss": 0.4054, + "step": 1702 + }, + { + "epoch": 0.13, + "learning_rate": 1.9428404732872716e-05, + "loss": 0.4238, + "step": 1703 + }, + { + "epoch": 0.13, + "learning_rate": 1.94275493067231e-05, + "loss": 0.4418, + "step": 1704 + }, + { + "epoch": 0.14, + "learning_rate": 1.9426693259814725e-05, + "loss": 0.4404, + "step": 1705 + }, + { + "epoch": 0.14, + "learning_rate": 1.9425836592203954e-05, + "loss": 0.404, + "step": 1706 + }, + { + "epoch": 0.14, + "learning_rate": 1.94249793039472e-05, + "loss": 0.4562, + "step": 1707 + }, + { + "epoch": 0.14, + "learning_rate": 1.9424121395100907e-05, + "loss": 0.4139, + "step": 1708 + }, + { + "epoch": 0.14, + "learning_rate": 1.9423262865721567e-05, + "loss": 0.4472, + "step": 1709 + }, + { + "epoch": 0.14, + "learning_rate": 1.9422403715865708e-05, + "loss": 0.4629, + "step": 1710 + }, + { + "epoch": 0.14, + "learning_rate": 1.9421543945589904e-05, + "loss": 0.3913, + "step": 1711 + }, + { + "epoch": 0.14, + "learning_rate": 1.9420683554950765e-05, + "loss": 0.3157, + "step": 1712 + }, + { + "epoch": 0.14, + "learning_rate": 1.9419822544004942e-05, + "loss": 0.4504, + "step": 1713 + }, + { + "epoch": 0.14, + "learning_rate": 1.941896091280913e-05, + "loss": 0.5915, + "step": 1714 + }, + { + "epoch": 0.14, + "learning_rate": 1.9418098661420064e-05, + "loss": 0.4434, + "step": 1715 + }, + { + "epoch": 0.14, + "learning_rate": 1.9417235789894517e-05, + "loss": 0.6136, + "step": 1716 + }, + { + "epoch": 0.14, + "learning_rate": 1.9416372298289306e-05, + "loss": 0.471, + "step": 1717 + }, + { + "epoch": 0.14, + "learning_rate": 1.941550818666129e-05, + "loss": 0.3851, + "step": 1718 + }, + { + "epoch": 0.14, + "learning_rate": 1.941464345506736e-05, + "loss": 0.475, + "step": 1719 + }, + { + "epoch": 0.14, + "learning_rate": 1.9413778103564462e-05, + "loss": 0.4926, + "step": 1720 + }, + { + "epoch": 0.14, + "learning_rate": 1.9412912132209573e-05, + "loss": 0.4543, + "step": 1721 + }, + { + "epoch": 0.14, + "learning_rate": 1.941204554105971e-05, + "loss": 0.5001, + "step": 1722 + }, + { + "epoch": 0.14, + "learning_rate": 1.941117833017194e-05, + "loss": 0.3733, + "step": 1723 + }, + { + "epoch": 0.14, + "learning_rate": 1.9410310499603356e-05, + "loss": 0.4498, + "step": 1724 + }, + { + "epoch": 0.14, + "learning_rate": 1.9409442049411104e-05, + "loss": 0.3807, + "step": 1725 + }, + { + "epoch": 0.14, + "learning_rate": 1.9408572979652373e-05, + "loss": 0.3875, + "step": 1726 + }, + { + "epoch": 0.14, + "learning_rate": 1.940770329038438e-05, + "loss": 0.379, + "step": 1727 + }, + { + "epoch": 0.14, + "learning_rate": 1.9406832981664392e-05, + "loss": 0.4007, + "step": 1728 + }, + { + "epoch": 0.14, + "learning_rate": 1.9405962053549717e-05, + "loss": 0.479, + "step": 1729 + }, + { + "epoch": 0.14, + "learning_rate": 1.9405090506097698e-05, + "loss": 0.4628, + "step": 1730 + }, + { + "epoch": 0.14, + "learning_rate": 1.9404218339365724e-05, + "loss": 0.3931, + "step": 1731 + }, + { + "epoch": 0.14, + "learning_rate": 1.940334555341122e-05, + "loss": 0.4249, + "step": 1732 + }, + { + "epoch": 0.14, + "learning_rate": 1.940247214829166e-05, + "loss": 0.3213, + "step": 1733 + }, + { + "epoch": 0.14, + "learning_rate": 1.9401598124064552e-05, + "loss": 0.4177, + "step": 1734 + }, + { + "epoch": 0.14, + "learning_rate": 1.9400723480787446e-05, + "loss": 0.4288, + "step": 1735 + }, + { + "epoch": 0.14, + "learning_rate": 1.9399848218517927e-05, + "loss": 0.3353, + "step": 1736 + }, + { + "epoch": 0.14, + "learning_rate": 1.9398972337313634e-05, + "loss": 0.4618, + "step": 1737 + }, + { + "epoch": 0.14, + "learning_rate": 1.939809583723224e-05, + "loss": 0.4126, + "step": 1738 + }, + { + "epoch": 0.14, + "learning_rate": 1.9397218718331455e-05, + "loss": 0.4859, + "step": 1739 + }, + { + "epoch": 0.14, + "learning_rate": 1.939634098066903e-05, + "loss": 0.478, + "step": 1740 + }, + { + "epoch": 0.14, + "learning_rate": 1.9395462624302768e-05, + "loss": 0.4132, + "step": 1741 + }, + { + "epoch": 0.14, + "learning_rate": 1.93945836492905e-05, + "loss": 0.5111, + "step": 1742 + }, + { + "epoch": 0.14, + "learning_rate": 1.93937040556901e-05, + "loss": 0.5754, + "step": 1743 + }, + { + "epoch": 0.14, + "learning_rate": 1.939282384355949e-05, + "loss": 0.4286, + "step": 1744 + }, + { + "epoch": 0.14, + "learning_rate": 1.9391943012956623e-05, + "loss": 0.466, + "step": 1745 + }, + { + "epoch": 0.14, + "learning_rate": 1.93910615639395e-05, + "loss": 0.5479, + "step": 1746 + }, + { + "epoch": 0.14, + "learning_rate": 1.9390179496566162e-05, + "loss": 0.4333, + "step": 1747 + }, + { + "epoch": 0.14, + "learning_rate": 1.938929681089469e-05, + "loss": 0.4633, + "step": 1748 + }, + { + "epoch": 0.14, + "learning_rate": 1.9388413506983196e-05, + "loss": 0.4618, + "step": 1749 + }, + { + "epoch": 0.14, + "learning_rate": 1.938752958488985e-05, + "loss": 0.5192, + "step": 1750 + }, + { + "epoch": 0.14, + "learning_rate": 1.9386645044672848e-05, + "loss": 0.4244, + "step": 1751 + }, + { + "epoch": 0.14, + "learning_rate": 1.9385759886390433e-05, + "loss": 0.4201, + "step": 1752 + }, + { + "epoch": 0.14, + "learning_rate": 1.9384874110100897e-05, + "loss": 0.4567, + "step": 1753 + }, + { + "epoch": 0.14, + "learning_rate": 1.9383987715862554e-05, + "loss": 0.3771, + "step": 1754 + }, + { + "epoch": 0.14, + "learning_rate": 1.9383100703733774e-05, + "loss": 0.5708, + "step": 1755 + }, + { + "epoch": 0.14, + "learning_rate": 1.9382213073772962e-05, + "loss": 0.5063, + "step": 1756 + }, + { + "epoch": 0.14, + "learning_rate": 1.938132482603856e-05, + "loss": 0.5559, + "step": 1757 + }, + { + "epoch": 0.14, + "learning_rate": 1.9380435960589065e-05, + "loss": 0.4657, + "step": 1758 + }, + { + "epoch": 0.14, + "learning_rate": 1.937954647748299e-05, + "loss": 0.3843, + "step": 1759 + }, + { + "epoch": 0.14, + "learning_rate": 1.9378656376778914e-05, + "loss": 0.4684, + "step": 1760 + }, + { + "epoch": 0.14, + "learning_rate": 1.9377765658535445e-05, + "loss": 0.492, + "step": 1761 + }, + { + "epoch": 0.14, + "learning_rate": 1.937687432281123e-05, + "loss": 0.1948, + "step": 1762 + }, + { + "epoch": 0.14, + "learning_rate": 1.9375982369664958e-05, + "loss": 0.3833, + "step": 1763 + }, + { + "epoch": 0.14, + "learning_rate": 1.937508979915536e-05, + "loss": 0.4787, + "step": 1764 + }, + { + "epoch": 0.14, + "learning_rate": 1.9374196611341212e-05, + "loss": 0.5933, + "step": 1765 + }, + { + "epoch": 0.14, + "learning_rate": 1.937330280628132e-05, + "loss": 0.5505, + "step": 1766 + }, + { + "epoch": 0.14, + "learning_rate": 1.937240838403454e-05, + "loss": 0.3933, + "step": 1767 + }, + { + "epoch": 0.14, + "learning_rate": 1.9371513344659764e-05, + "loss": 0.3971, + "step": 1768 + }, + { + "epoch": 0.14, + "learning_rate": 1.937061768821593e-05, + "loss": 0.4182, + "step": 1769 + }, + { + "epoch": 0.14, + "learning_rate": 1.936972141476201e-05, + "loss": 0.3785, + "step": 1770 + }, + { + "epoch": 0.14, + "learning_rate": 1.936882452435702e-05, + "loss": 0.445, + "step": 1771 + }, + { + "epoch": 0.14, + "learning_rate": 1.936792701706001e-05, + "loss": 0.3606, + "step": 1772 + }, + { + "epoch": 0.14, + "learning_rate": 1.9367028892930088e-05, + "loss": 0.3385, + "step": 1773 + }, + { + "epoch": 0.14, + "learning_rate": 1.9366130152026378e-05, + "loss": 0.4432, + "step": 1774 + }, + { + "epoch": 0.14, + "learning_rate": 1.936523079440807e-05, + "loss": 0.3853, + "step": 1775 + }, + { + "epoch": 0.14, + "learning_rate": 1.936433082013437e-05, + "loss": 0.5163, + "step": 1776 + }, + { + "epoch": 0.14, + "learning_rate": 1.936343022926455e-05, + "loss": 0.4225, + "step": 1777 + }, + { + "epoch": 0.14, + "learning_rate": 1.93625290218579e-05, + "loss": 0.5617, + "step": 1778 + }, + { + "epoch": 0.14, + "learning_rate": 1.9361627197973767e-05, + "loss": 0.4154, + "step": 1779 + }, + { + "epoch": 0.14, + "learning_rate": 1.9360724757671525e-05, + "loss": 0.409, + "step": 1780 + }, + { + "epoch": 0.14, + "learning_rate": 1.93598217010106e-05, + "loss": 0.4792, + "step": 1781 + }, + { + "epoch": 0.14, + "learning_rate": 1.9358918028050453e-05, + "loss": 0.5048, + "step": 1782 + }, + { + "epoch": 0.14, + "learning_rate": 1.9358013738850586e-05, + "loss": 0.4065, + "step": 1783 + }, + { + "epoch": 0.14, + "learning_rate": 1.935710883347054e-05, + "loss": 0.4198, + "step": 1784 + }, + { + "epoch": 0.14, + "learning_rate": 1.9356203311969903e-05, + "loss": 0.4731, + "step": 1785 + }, + { + "epoch": 0.14, + "learning_rate": 1.9355297174408298e-05, + "loss": 0.3551, + "step": 1786 + }, + { + "epoch": 0.14, + "learning_rate": 1.9354390420845387e-05, + "loss": 0.4404, + "step": 1787 + }, + { + "epoch": 0.14, + "learning_rate": 1.9353483051340876e-05, + "loss": 0.4316, + "step": 1788 + }, + { + "epoch": 0.14, + "learning_rate": 1.9352575065954515e-05, + "loss": 0.6085, + "step": 1789 + }, + { + "epoch": 0.14, + "learning_rate": 1.9351666464746087e-05, + "loss": 0.4416, + "step": 1790 + }, + { + "epoch": 0.14, + "learning_rate": 1.935075724777542e-05, + "loss": 0.3973, + "step": 1791 + }, + { + "epoch": 0.14, + "learning_rate": 1.9349847415102378e-05, + "loss": 0.4586, + "step": 1792 + }, + { + "epoch": 0.14, + "learning_rate": 1.9348936966786874e-05, + "loss": 0.3528, + "step": 1793 + }, + { + "epoch": 0.14, + "learning_rate": 1.9348025902888858e-05, + "loss": 0.6057, + "step": 1794 + }, + { + "epoch": 0.14, + "learning_rate": 1.9347114223468316e-05, + "loss": 0.4359, + "step": 1795 + }, + { + "epoch": 0.14, + "learning_rate": 1.9346201928585273e-05, + "loss": 0.5888, + "step": 1796 + }, + { + "epoch": 0.14, + "learning_rate": 1.9345289018299807e-05, + "loss": 0.2915, + "step": 1797 + }, + { + "epoch": 0.14, + "learning_rate": 1.9344375492672024e-05, + "loss": 0.3938, + "step": 1798 + }, + { + "epoch": 0.14, + "learning_rate": 1.934346135176208e-05, + "loss": 0.2569, + "step": 1799 + }, + { + "epoch": 0.14, + "learning_rate": 1.9342546595630162e-05, + "loss": 0.4962, + "step": 1800 + }, + { + "epoch": 0.14, + "learning_rate": 1.9341631224336503e-05, + "loss": 0.5044, + "step": 1801 + }, + { + "epoch": 0.14, + "learning_rate": 1.934071523794138e-05, + "loss": 0.4793, + "step": 1802 + }, + { + "epoch": 0.14, + "learning_rate": 1.9339798636505102e-05, + "loss": 0.4413, + "step": 1803 + }, + { + "epoch": 0.14, + "learning_rate": 1.9338881420088023e-05, + "loss": 0.4884, + "step": 1804 + }, + { + "epoch": 0.14, + "learning_rate": 1.933796358875054e-05, + "loss": 0.4623, + "step": 1805 + }, + { + "epoch": 0.14, + "learning_rate": 1.9337045142553085e-05, + "loss": 0.4435, + "step": 1806 + }, + { + "epoch": 0.14, + "learning_rate": 1.9336126081556134e-05, + "loss": 0.4457, + "step": 1807 + }, + { + "epoch": 0.14, + "learning_rate": 1.9335206405820208e-05, + "loss": 0.3622, + "step": 1808 + }, + { + "epoch": 0.14, + "learning_rate": 1.933428611540585e-05, + "loss": 0.3685, + "step": 1809 + }, + { + "epoch": 0.14, + "learning_rate": 1.9333365210373668e-05, + "loss": 0.4509, + "step": 1810 + }, + { + "epoch": 0.14, + "learning_rate": 1.93324436907843e-05, + "loss": 0.3588, + "step": 1811 + }, + { + "epoch": 0.14, + "learning_rate": 1.9331521556698415e-05, + "loss": 0.509, + "step": 1812 + }, + { + "epoch": 0.14, + "learning_rate": 1.9330598808176736e-05, + "loss": 0.4018, + "step": 1813 + }, + { + "epoch": 0.14, + "learning_rate": 1.9329675445280024e-05, + "loss": 0.4695, + "step": 1814 + }, + { + "epoch": 0.14, + "learning_rate": 1.9328751468069075e-05, + "loss": 0.2669, + "step": 1815 + }, + { + "epoch": 0.14, + "learning_rate": 1.932782687660473e-05, + "loss": 0.4428, + "step": 1816 + }, + { + "epoch": 0.14, + "learning_rate": 1.9326901670947868e-05, + "loss": 0.3833, + "step": 1817 + }, + { + "epoch": 0.14, + "learning_rate": 1.9325975851159406e-05, + "loss": 0.438, + "step": 1818 + }, + { + "epoch": 0.14, + "learning_rate": 1.932504941730031e-05, + "loss": 0.348, + "step": 1819 + }, + { + "epoch": 0.14, + "learning_rate": 1.932412236943158e-05, + "loss": 0.4243, + "step": 1820 + }, + { + "epoch": 0.14, + "learning_rate": 1.9323194707614253e-05, + "loss": 0.3604, + "step": 1821 + }, + { + "epoch": 0.14, + "learning_rate": 1.932226643190942e-05, + "loss": 0.456, + "step": 1822 + }, + { + "epoch": 0.14, + "learning_rate": 1.9321337542378193e-05, + "loss": 0.5635, + "step": 1823 + }, + { + "epoch": 0.14, + "learning_rate": 1.9320408039081745e-05, + "loss": 0.3783, + "step": 1824 + }, + { + "epoch": 0.14, + "learning_rate": 1.9319477922081273e-05, + "loss": 0.4569, + "step": 1825 + }, + { + "epoch": 0.14, + "learning_rate": 1.9318547191438018e-05, + "loss": 0.4178, + "step": 1826 + }, + { + "epoch": 0.14, + "learning_rate": 1.9317615847213274e-05, + "loss": 0.4462, + "step": 1827 + }, + { + "epoch": 0.14, + "learning_rate": 1.931668388946836e-05, + "loss": 0.3754, + "step": 1828 + }, + { + "epoch": 0.14, + "learning_rate": 1.9315751318264636e-05, + "loss": 0.4714, + "step": 1829 + }, + { + "epoch": 0.14, + "learning_rate": 1.9314818133663516e-05, + "loss": 0.5505, + "step": 1830 + }, + { + "epoch": 0.15, + "learning_rate": 1.9313884335726443e-05, + "loss": 0.4117, + "step": 1831 + }, + { + "epoch": 0.15, + "learning_rate": 1.93129499245149e-05, + "loss": 0.3923, + "step": 1832 + }, + { + "epoch": 0.15, + "learning_rate": 1.9312014900090416e-05, + "loss": 0.4969, + "step": 1833 + }, + { + "epoch": 0.15, + "learning_rate": 1.931107926251456e-05, + "loss": 0.39, + "step": 1834 + }, + { + "epoch": 0.15, + "learning_rate": 1.931014301184893e-05, + "loss": 0.4561, + "step": 1835 + }, + { + "epoch": 0.15, + "learning_rate": 1.9309206148155188e-05, + "loss": 0.3858, + "step": 1836 + }, + { + "epoch": 0.15, + "learning_rate": 1.930826867149501e-05, + "loss": 0.3945, + "step": 1837 + }, + { + "epoch": 0.15, + "learning_rate": 1.9307330581930127e-05, + "loss": 0.5572, + "step": 1838 + }, + { + "epoch": 0.15, + "learning_rate": 1.930639187952231e-05, + "loss": 0.3421, + "step": 1839 + }, + { + "epoch": 0.15, + "learning_rate": 1.930545256433337e-05, + "loss": 0.3826, + "step": 1840 + }, + { + "epoch": 0.15, + "learning_rate": 1.930451263642515e-05, + "loss": 0.4723, + "step": 1841 + }, + { + "epoch": 0.15, + "learning_rate": 1.9303572095859545e-05, + "loss": 0.411, + "step": 1842 + }, + { + "epoch": 0.15, + "learning_rate": 1.9302630942698487e-05, + "loss": 0.396, + "step": 1843 + }, + { + "epoch": 0.15, + "learning_rate": 1.9301689177003938e-05, + "loss": 0.3788, + "step": 1844 + }, + { + "epoch": 0.15, + "learning_rate": 1.9300746798837913e-05, + "loss": 0.3862, + "step": 1845 + }, + { + "epoch": 0.15, + "learning_rate": 1.9299803808262466e-05, + "loss": 0.4138, + "step": 1846 + }, + { + "epoch": 0.15, + "learning_rate": 1.9298860205339685e-05, + "loss": 0.3503, + "step": 1847 + }, + { + "epoch": 0.15, + "learning_rate": 1.9297915990131704e-05, + "loss": 0.3759, + "step": 1848 + }, + { + "epoch": 0.15, + "learning_rate": 1.9296971162700696e-05, + "loss": 0.4333, + "step": 1849 + }, + { + "epoch": 0.15, + "learning_rate": 1.9296025723108867e-05, + "loss": 0.4081, + "step": 1850 + }, + { + "epoch": 0.15, + "learning_rate": 1.9295079671418474e-05, + "loss": 0.4196, + "step": 1851 + }, + { + "epoch": 0.15, + "learning_rate": 1.929413300769181e-05, + "loss": 0.4196, + "step": 1852 + }, + { + "epoch": 0.15, + "learning_rate": 1.9293185731991212e-05, + "loss": 0.5225, + "step": 1853 + }, + { + "epoch": 0.15, + "learning_rate": 1.9292237844379043e-05, + "loss": 0.4639, + "step": 1854 + }, + { + "epoch": 0.15, + "learning_rate": 1.929128934491773e-05, + "loss": 0.4157, + "step": 1855 + }, + { + "epoch": 0.15, + "learning_rate": 1.929034023366972e-05, + "loss": 0.3912, + "step": 1856 + }, + { + "epoch": 0.15, + "learning_rate": 1.92893905106975e-05, + "loss": 0.3233, + "step": 1857 + }, + { + "epoch": 0.15, + "learning_rate": 1.9288440176063617e-05, + "loss": 0.4448, + "step": 1858 + }, + { + "epoch": 0.15, + "learning_rate": 1.9287489229830645e-05, + "loss": 0.5383, + "step": 1859 + }, + { + "epoch": 0.15, + "learning_rate": 1.9286537672061192e-05, + "loss": 0.4107, + "step": 1860 + }, + { + "epoch": 0.15, + "learning_rate": 1.9285585502817917e-05, + "loss": 0.3807, + "step": 1861 + }, + { + "epoch": 0.15, + "learning_rate": 1.9284632722163515e-05, + "loss": 0.3451, + "step": 1862 + }, + { + "epoch": 0.15, + "learning_rate": 1.9283679330160726e-05, + "loss": 0.4629, + "step": 1863 + }, + { + "epoch": 0.15, + "learning_rate": 1.9282725326872324e-05, + "loss": 0.2654, + "step": 1864 + }, + { + "epoch": 0.15, + "learning_rate": 1.9281770712361123e-05, + "loss": 0.4127, + "step": 1865 + }, + { + "epoch": 0.15, + "learning_rate": 1.928081548668998e-05, + "loss": 0.4733, + "step": 1866 + }, + { + "epoch": 0.15, + "learning_rate": 1.9279859649921797e-05, + "loss": 0.4492, + "step": 1867 + }, + { + "epoch": 0.15, + "learning_rate": 1.9278903202119508e-05, + "loss": 0.4335, + "step": 1868 + }, + { + "epoch": 0.15, + "learning_rate": 1.9277946143346086e-05, + "loss": 0.341, + "step": 1869 + }, + { + "epoch": 0.15, + "learning_rate": 1.9276988473664557e-05, + "loss": 0.4477, + "step": 1870 + }, + { + "epoch": 0.15, + "learning_rate": 1.9276030193137974e-05, + "loss": 0.4975, + "step": 1871 + }, + { + "epoch": 0.15, + "learning_rate": 1.927507130182944e-05, + "loss": 0.3626, + "step": 1872 + }, + { + "epoch": 0.15, + "learning_rate": 1.9274111799802084e-05, + "loss": 0.4011, + "step": 1873 + }, + { + "epoch": 0.15, + "learning_rate": 1.9273151687119093e-05, + "loss": 0.378, + "step": 1874 + }, + { + "epoch": 0.15, + "learning_rate": 1.927219096384368e-05, + "loss": 0.4333, + "step": 1875 + }, + { + "epoch": 0.15, + "learning_rate": 1.9271229630039107e-05, + "loss": 0.3804, + "step": 1876 + }, + { + "epoch": 0.15, + "learning_rate": 1.9270267685768676e-05, + "loss": 0.374, + "step": 1877 + }, + { + "epoch": 0.15, + "learning_rate": 1.9269305131095722e-05, + "loss": 0.4174, + "step": 1878 + }, + { + "epoch": 0.15, + "learning_rate": 1.9268341966083627e-05, + "loss": 0.4428, + "step": 1879 + }, + { + "epoch": 0.15, + "learning_rate": 1.9267378190795812e-05, + "loss": 0.4298, + "step": 1880 + }, + { + "epoch": 0.15, + "learning_rate": 1.9266413805295732e-05, + "loss": 0.3599, + "step": 1881 + }, + { + "epoch": 0.15, + "learning_rate": 1.9265448809646893e-05, + "loss": 0.3243, + "step": 1882 + }, + { + "epoch": 0.15, + "learning_rate": 1.9264483203912826e-05, + "loss": 0.4499, + "step": 1883 + }, + { + "epoch": 0.15, + "learning_rate": 1.9263516988157123e-05, + "loss": 0.4067, + "step": 1884 + }, + { + "epoch": 0.15, + "learning_rate": 1.92625501624434e-05, + "loss": 0.4943, + "step": 1885 + }, + { + "epoch": 0.15, + "learning_rate": 1.9261582726835316e-05, + "loss": 0.3354, + "step": 1886 + }, + { + "epoch": 0.15, + "learning_rate": 1.926061468139657e-05, + "loss": 0.4274, + "step": 1887 + }, + { + "epoch": 0.15, + "learning_rate": 1.9259646026190913e-05, + "loss": 0.3415, + "step": 1888 + }, + { + "epoch": 0.15, + "learning_rate": 1.9258676761282117e-05, + "loss": 0.3774, + "step": 1889 + }, + { + "epoch": 0.15, + "learning_rate": 1.9257706886734e-05, + "loss": 0.3696, + "step": 1890 + }, + { + "epoch": 0.15, + "learning_rate": 1.9256736402610437e-05, + "loss": 0.309, + "step": 1891 + }, + { + "epoch": 0.15, + "learning_rate": 1.9255765308975322e-05, + "loss": 0.4254, + "step": 1892 + }, + { + "epoch": 0.15, + "learning_rate": 1.9254793605892596e-05, + "loss": 0.4801, + "step": 1893 + }, + { + "epoch": 0.15, + "learning_rate": 1.9253821293426242e-05, + "loss": 0.4051, + "step": 1894 + }, + { + "epoch": 0.15, + "learning_rate": 1.9252848371640284e-05, + "loss": 0.3944, + "step": 1895 + }, + { + "epoch": 0.15, + "learning_rate": 1.925187484059878e-05, + "loss": 0.4012, + "step": 1896 + }, + { + "epoch": 0.15, + "learning_rate": 1.9250900700365837e-05, + "loss": 0.4762, + "step": 1897 + }, + { + "epoch": 0.15, + "learning_rate": 1.9249925951005593e-05, + "loss": 0.3592, + "step": 1898 + }, + { + "epoch": 0.15, + "learning_rate": 1.9248950592582235e-05, + "loss": 0.4472, + "step": 1899 + }, + { + "epoch": 0.15, + "learning_rate": 1.9247974625159983e-05, + "loss": 0.3321, + "step": 1900 + }, + { + "epoch": 0.15, + "learning_rate": 1.92469980488031e-05, + "loss": 0.4554, + "step": 1901 + }, + { + "epoch": 0.15, + "learning_rate": 1.924602086357589e-05, + "loss": 0.4518, + "step": 1902 + }, + { + "epoch": 0.15, + "learning_rate": 1.9245043069542696e-05, + "loss": 0.4336, + "step": 1903 + }, + { + "epoch": 0.15, + "learning_rate": 1.92440646667679e-05, + "loss": 0.304, + "step": 1904 + }, + { + "epoch": 0.15, + "learning_rate": 1.9243085655315924e-05, + "loss": 0.5521, + "step": 1905 + }, + { + "epoch": 0.15, + "learning_rate": 1.924210603525123e-05, + "loss": 0.475, + "step": 1906 + }, + { + "epoch": 0.15, + "learning_rate": 1.924112580663833e-05, + "loss": 0.405, + "step": 1907 + }, + { + "epoch": 0.15, + "learning_rate": 1.9240144969541754e-05, + "loss": 0.3572, + "step": 1908 + }, + { + "epoch": 0.15, + "learning_rate": 1.9239163524026097e-05, + "loss": 0.3812, + "step": 1909 + }, + { + "epoch": 0.15, + "learning_rate": 1.9238181470155978e-05, + "loss": 0.3443, + "step": 1910 + }, + { + "epoch": 0.15, + "learning_rate": 1.923719880799606e-05, + "loss": 0.4417, + "step": 1911 + }, + { + "epoch": 0.15, + "learning_rate": 1.9236215537611044e-05, + "loss": 0.472, + "step": 1912 + }, + { + "epoch": 0.15, + "learning_rate": 1.923523165906568e-05, + "loss": 0.4625, + "step": 1913 + }, + { + "epoch": 0.15, + "learning_rate": 1.923424717242475e-05, + "loss": 0.3636, + "step": 1914 + }, + { + "epoch": 0.15, + "learning_rate": 1.923326207775307e-05, + "loss": 0.4426, + "step": 1915 + }, + { + "epoch": 0.15, + "learning_rate": 1.9232276375115517e-05, + "loss": 0.4584, + "step": 1916 + }, + { + "epoch": 0.15, + "learning_rate": 1.9231290064576985e-05, + "loss": 0.4029, + "step": 1917 + }, + { + "epoch": 0.15, + "learning_rate": 1.923030314620242e-05, + "loss": 0.3649, + "step": 1918 + }, + { + "epoch": 0.15, + "learning_rate": 1.9229315620056805e-05, + "loss": 0.478, + "step": 1919 + }, + { + "epoch": 0.15, + "learning_rate": 1.9228327486205166e-05, + "loss": 0.5456, + "step": 1920 + }, + { + "epoch": 0.15, + "learning_rate": 1.9227338744712565e-05, + "loss": 0.4662, + "step": 1921 + }, + { + "epoch": 0.15, + "learning_rate": 1.9226349395644106e-05, + "loss": 0.5285, + "step": 1922 + }, + { + "epoch": 0.15, + "learning_rate": 1.9225359439064934e-05, + "loss": 0.3996, + "step": 1923 + }, + { + "epoch": 0.15, + "learning_rate": 1.9224368875040235e-05, + "loss": 0.3544, + "step": 1924 + }, + { + "epoch": 0.15, + "learning_rate": 1.922337770363523e-05, + "loss": 0.3348, + "step": 1925 + }, + { + "epoch": 0.15, + "learning_rate": 1.922238592491518e-05, + "loss": 0.4048, + "step": 1926 + }, + { + "epoch": 0.15, + "learning_rate": 1.9221393538945397e-05, + "loss": 0.4107, + "step": 1927 + }, + { + "epoch": 0.15, + "learning_rate": 1.9220400545791216e-05, + "loss": 0.3685, + "step": 1928 + }, + { + "epoch": 0.15, + "learning_rate": 1.9219406945518028e-05, + "loss": 0.4725, + "step": 1929 + }, + { + "epoch": 0.15, + "learning_rate": 1.921841273819125e-05, + "loss": 0.314, + "step": 1930 + }, + { + "epoch": 0.15, + "learning_rate": 1.9217417923876352e-05, + "loss": 0.4944, + "step": 1931 + }, + { + "epoch": 0.15, + "learning_rate": 1.9216422502638836e-05, + "loss": 0.4222, + "step": 1932 + }, + { + "epoch": 0.15, + "learning_rate": 1.9215426474544242e-05, + "loss": 0.3127, + "step": 1933 + }, + { + "epoch": 0.15, + "learning_rate": 1.9214429839658156e-05, + "loss": 0.3211, + "step": 1934 + }, + { + "epoch": 0.15, + "learning_rate": 1.9213432598046205e-05, + "loss": 0.4563, + "step": 1935 + }, + { + "epoch": 0.15, + "learning_rate": 1.9212434749774048e-05, + "loss": 0.3218, + "step": 1936 + }, + { + "epoch": 0.15, + "learning_rate": 1.921143629490739e-05, + "loss": 0.4026, + "step": 1937 + }, + { + "epoch": 0.15, + "learning_rate": 1.9210437233511974e-05, + "loss": 0.3038, + "step": 1938 + }, + { + "epoch": 0.15, + "learning_rate": 1.9209437565653587e-05, + "loss": 0.3211, + "step": 1939 + }, + { + "epoch": 0.15, + "learning_rate": 1.9208437291398045e-05, + "loss": 0.4985, + "step": 1940 + }, + { + "epoch": 0.15, + "learning_rate": 1.920743641081122e-05, + "loss": 0.3858, + "step": 1941 + }, + { + "epoch": 0.15, + "learning_rate": 1.920643492395901e-05, + "loss": 0.335, + "step": 1942 + }, + { + "epoch": 0.15, + "learning_rate": 1.9205432830907353e-05, + "loss": 0.3782, + "step": 1943 + }, + { + "epoch": 0.15, + "learning_rate": 1.9204430131722243e-05, + "loss": 0.3744, + "step": 1944 + }, + { + "epoch": 0.15, + "learning_rate": 1.9203426826469695e-05, + "loss": 0.4417, + "step": 1945 + }, + { + "epoch": 0.15, + "learning_rate": 1.9202422915215777e-05, + "loss": 0.4469, + "step": 1946 + }, + { + "epoch": 0.15, + "learning_rate": 1.920141839802659e-05, + "loss": 0.424, + "step": 1947 + }, + { + "epoch": 0.15, + "learning_rate": 1.9200413274968276e-05, + "loss": 0.3893, + "step": 1948 + }, + { + "epoch": 0.15, + "learning_rate": 1.9199407546107014e-05, + "loss": 0.497, + "step": 1949 + }, + { + "epoch": 0.15, + "learning_rate": 1.919840121150903e-05, + "loss": 0.4611, + "step": 1950 + }, + { + "epoch": 0.15, + "learning_rate": 1.9197394271240587e-05, + "loss": 0.5484, + "step": 1951 + }, + { + "epoch": 0.15, + "learning_rate": 1.919638672536799e-05, + "loss": 0.3939, + "step": 1952 + }, + { + "epoch": 0.15, + "learning_rate": 1.9195378573957574e-05, + "loss": 0.42, + "step": 1953 + }, + { + "epoch": 0.15, + "learning_rate": 1.9194369817075725e-05, + "loss": 0.4391, + "step": 1954 + }, + { + "epoch": 0.15, + "learning_rate": 1.9193360454788864e-05, + "loss": 0.4865, + "step": 1955 + }, + { + "epoch": 0.15, + "learning_rate": 1.919235048716345e-05, + "loss": 0.3365, + "step": 1956 + }, + { + "epoch": 0.16, + "learning_rate": 1.919133991426599e-05, + "loss": 0.3689, + "step": 1957 + }, + { + "epoch": 0.16, + "learning_rate": 1.919032873616302e-05, + "loss": 0.4785, + "step": 1958 + }, + { + "epoch": 0.16, + "learning_rate": 1.918931695292113e-05, + "loss": 0.3824, + "step": 1959 + }, + { + "epoch": 0.16, + "learning_rate": 1.918830456460693e-05, + "loss": 0.4335, + "step": 1960 + }, + { + "epoch": 0.16, + "learning_rate": 1.9187291571287088e-05, + "loss": 0.4293, + "step": 1961 + }, + { + "epoch": 0.16, + "learning_rate": 1.91862779730283e-05, + "loss": 0.3834, + "step": 1962 + }, + { + "epoch": 0.16, + "learning_rate": 1.918526376989731e-05, + "loss": 0.4822, + "step": 1963 + }, + { + "epoch": 0.16, + "learning_rate": 1.9184248961960895e-05, + "loss": 0.4192, + "step": 1964 + }, + { + "epoch": 0.16, + "learning_rate": 1.918323354928588e-05, + "loss": 0.5143, + "step": 1965 + }, + { + "epoch": 0.16, + "learning_rate": 1.918221753193912e-05, + "loss": 0.4138, + "step": 1966 + }, + { + "epoch": 0.16, + "learning_rate": 1.9181200909987524e-05, + "loss": 0.4173, + "step": 1967 + }, + { + "epoch": 0.16, + "learning_rate": 1.918018368349802e-05, + "loss": 0.4887, + "step": 1968 + }, + { + "epoch": 0.16, + "learning_rate": 1.9179165852537596e-05, + "loss": 0.3532, + "step": 1969 + }, + { + "epoch": 0.16, + "learning_rate": 1.9178147417173265e-05, + "loss": 0.5422, + "step": 1970 + }, + { + "epoch": 0.16, + "learning_rate": 1.917712837747209e-05, + "loss": 0.4204, + "step": 1971 + }, + { + "epoch": 0.16, + "learning_rate": 1.917610873350117e-05, + "loss": 0.4472, + "step": 1972 + }, + { + "epoch": 0.16, + "learning_rate": 1.917508848532764e-05, + "loss": 0.3995, + "step": 1973 + }, + { + "epoch": 0.16, + "learning_rate": 1.9174067633018682e-05, + "loss": 0.3006, + "step": 1974 + }, + { + "epoch": 0.16, + "learning_rate": 1.9173046176641515e-05, + "loss": 0.3251, + "step": 1975 + }, + { + "epoch": 0.16, + "learning_rate": 1.917202411626339e-05, + "loss": 0.3793, + "step": 1976 + }, + { + "epoch": 0.16, + "learning_rate": 1.9171001451951616e-05, + "loss": 0.5175, + "step": 1977 + }, + { + "epoch": 0.16, + "learning_rate": 1.916997818377352e-05, + "loss": 0.3925, + "step": 1978 + }, + { + "epoch": 0.16, + "learning_rate": 1.9168954311796487e-05, + "loss": 0.4335, + "step": 1979 + }, + { + "epoch": 0.16, + "learning_rate": 1.9167929836087932e-05, + "loss": 0.4239, + "step": 1980 + }, + { + "epoch": 0.16, + "learning_rate": 1.9166904756715307e-05, + "loss": 0.3991, + "step": 1981 + }, + { + "epoch": 0.16, + "learning_rate": 1.9165879073746112e-05, + "loss": 0.5109, + "step": 1982 + }, + { + "epoch": 0.16, + "learning_rate": 1.9164852787247887e-05, + "loss": 0.4758, + "step": 1983 + }, + { + "epoch": 0.16, + "learning_rate": 1.91638258972882e-05, + "loss": 0.318, + "step": 1984 + }, + { + "epoch": 0.16, + "learning_rate": 1.916279840393467e-05, + "loss": 0.5013, + "step": 1985 + }, + { + "epoch": 0.16, + "learning_rate": 1.916177030725496e-05, + "loss": 0.4973, + "step": 1986 + }, + { + "epoch": 0.16, + "learning_rate": 1.9160741607316755e-05, + "loss": 0.3693, + "step": 1987 + }, + { + "epoch": 0.16, + "learning_rate": 1.9159712304187795e-05, + "loss": 0.4409, + "step": 1988 + }, + { + "epoch": 0.16, + "learning_rate": 1.9158682397935852e-05, + "loss": 0.3491, + "step": 1989 + }, + { + "epoch": 0.16, + "learning_rate": 1.9157651888628744e-05, + "loss": 0.4969, + "step": 1990 + }, + { + "epoch": 0.16, + "learning_rate": 1.915662077633432e-05, + "loss": 0.5218, + "step": 1991 + }, + { + "epoch": 0.16, + "learning_rate": 1.915558906112048e-05, + "loss": 0.351, + "step": 1992 + }, + { + "epoch": 0.16, + "learning_rate": 1.915455674305515e-05, + "loss": 0.2734, + "step": 1993 + }, + { + "epoch": 0.16, + "learning_rate": 1.9153523822206312e-05, + "loss": 0.331, + "step": 1994 + }, + { + "epoch": 0.16, + "learning_rate": 1.9152490298641973e-05, + "loss": 0.4061, + "step": 1995 + }, + { + "epoch": 0.16, + "learning_rate": 1.9151456172430186e-05, + "loss": 0.4486, + "step": 1996 + }, + { + "epoch": 0.16, + "learning_rate": 1.9150421443639045e-05, + "loss": 0.4481, + "step": 1997 + }, + { + "epoch": 0.16, + "learning_rate": 1.9149386112336682e-05, + "loss": 0.4553, + "step": 1998 + }, + { + "epoch": 0.16, + "learning_rate": 1.9148350178591264e-05, + "loss": 0.4442, + "step": 1999 + }, + { + "epoch": 0.16, + "learning_rate": 1.914731364247101e-05, + "loss": 0.4421, + "step": 2000 + }, + { + "epoch": 0.16, + "learning_rate": 1.914627650404416e-05, + "loss": 0.3599, + "step": 2001 + }, + { + "epoch": 0.16, + "learning_rate": 1.9145238763379016e-05, + "loss": 0.3488, + "step": 2002 + }, + { + "epoch": 0.16, + "learning_rate": 1.9144200420543905e-05, + "loss": 0.4133, + "step": 2003 + }, + { + "epoch": 0.16, + "learning_rate": 1.9143161475607194e-05, + "loss": 0.4363, + "step": 2004 + }, + { + "epoch": 0.16, + "learning_rate": 1.9142121928637292e-05, + "loss": 0.501, + "step": 2005 + }, + { + "epoch": 0.16, + "learning_rate": 1.914108177970265e-05, + "loss": 0.3616, + "step": 2006 + }, + { + "epoch": 0.16, + "learning_rate": 1.914004102887176e-05, + "loss": 0.3728, + "step": 2007 + }, + { + "epoch": 0.16, + "learning_rate": 1.9138999676213146e-05, + "loss": 0.5084, + "step": 2008 + }, + { + "epoch": 0.16, + "learning_rate": 1.9137957721795376e-05, + "loss": 0.386, + "step": 2009 + }, + { + "epoch": 0.16, + "learning_rate": 1.913691516568706e-05, + "loss": 0.5451, + "step": 2010 + }, + { + "epoch": 0.16, + "learning_rate": 1.9135872007956846e-05, + "loss": 0.464, + "step": 2011 + }, + { + "epoch": 0.16, + "learning_rate": 1.9134828248673415e-05, + "loss": 0.4131, + "step": 2012 + }, + { + "epoch": 0.16, + "learning_rate": 1.9133783887905502e-05, + "loss": 0.4768, + "step": 2013 + }, + { + "epoch": 0.16, + "learning_rate": 1.913273892572187e-05, + "loss": 0.369, + "step": 2014 + }, + { + "epoch": 0.16, + "learning_rate": 1.9131693362191318e-05, + "loss": 0.3954, + "step": 2015 + }, + { + "epoch": 0.16, + "learning_rate": 1.91306471973827e-05, + "loss": 0.5101, + "step": 2016 + }, + { + "epoch": 0.16, + "learning_rate": 1.91296004313649e-05, + "loss": 0.4883, + "step": 2017 + }, + { + "epoch": 0.16, + "learning_rate": 1.9128553064206835e-05, + "loss": 0.4044, + "step": 2018 + }, + { + "epoch": 0.16, + "learning_rate": 1.9127505095977483e-05, + "loss": 0.5231, + "step": 2019 + }, + { + "epoch": 0.16, + "learning_rate": 1.9126456526745833e-05, + "loss": 0.4319, + "step": 2020 + }, + { + "epoch": 0.16, + "learning_rate": 1.9125407356580932e-05, + "loss": 0.3175, + "step": 2021 + }, + { + "epoch": 0.16, + "learning_rate": 1.9124357585551872e-05, + "loss": 0.5436, + "step": 2022 + }, + { + "epoch": 0.16, + "learning_rate": 1.9123307213727764e-05, + "loss": 0.448, + "step": 2023 + }, + { + "epoch": 0.16, + "learning_rate": 1.9122256241177776e-05, + "loss": 0.3601, + "step": 2024 + }, + { + "epoch": 0.16, + "learning_rate": 1.9121204667971107e-05, + "loss": 0.461, + "step": 2025 + }, + { + "epoch": 0.16, + "learning_rate": 1.9120152494177e-05, + "loss": 0.4224, + "step": 2026 + }, + { + "epoch": 0.16, + "learning_rate": 1.9119099719864735e-05, + "loss": 0.4894, + "step": 2027 + }, + { + "epoch": 0.16, + "learning_rate": 1.911804634510363e-05, + "loss": 0.4368, + "step": 2028 + }, + { + "epoch": 0.16, + "learning_rate": 1.911699236996305e-05, + "loss": 0.4115, + "step": 2029 + }, + { + "epoch": 0.16, + "learning_rate": 1.911593779451239e-05, + "loss": 0.3909, + "step": 2030 + }, + { + "epoch": 0.16, + "learning_rate": 1.911488261882109e-05, + "loss": 0.4357, + "step": 2031 + }, + { + "epoch": 0.16, + "learning_rate": 1.911382684295862e-05, + "loss": 0.398, + "step": 2032 + }, + { + "epoch": 0.16, + "learning_rate": 1.911277046699451e-05, + "loss": 0.4382, + "step": 2033 + }, + { + "epoch": 0.16, + "learning_rate": 1.9111713490998316e-05, + "loss": 0.3595, + "step": 2034 + }, + { + "epoch": 0.16, + "learning_rate": 1.911065591503963e-05, + "loss": 0.4332, + "step": 2035 + }, + { + "epoch": 0.16, + "learning_rate": 1.9109597739188088e-05, + "loss": 0.423, + "step": 2036 + }, + { + "epoch": 0.16, + "learning_rate": 1.9108538963513366e-05, + "loss": 0.4057, + "step": 2037 + }, + { + "epoch": 0.16, + "learning_rate": 1.9107479588085182e-05, + "loss": 0.4391, + "step": 2038 + }, + { + "epoch": 0.16, + "learning_rate": 1.910641961297329e-05, + "loss": 0.4179, + "step": 2039 + }, + { + "epoch": 0.16, + "learning_rate": 1.9105359038247484e-05, + "loss": 0.3756, + "step": 2040 + }, + { + "epoch": 0.16, + "learning_rate": 1.9104297863977595e-05, + "loss": 0.4555, + "step": 2041 + }, + { + "epoch": 0.16, + "learning_rate": 1.9103236090233507e-05, + "loss": 0.5421, + "step": 2042 + }, + { + "epoch": 0.16, + "learning_rate": 1.9102173717085114e-05, + "loss": 0.3793, + "step": 2043 + }, + { + "epoch": 0.16, + "learning_rate": 1.9101110744602384e-05, + "loss": 0.5003, + "step": 2044 + }, + { + "epoch": 0.16, + "learning_rate": 1.9100047172855306e-05, + "loss": 0.5598, + "step": 2045 + }, + { + "epoch": 0.16, + "learning_rate": 1.9098983001913903e-05, + "loss": 0.4327, + "step": 2046 + }, + { + "epoch": 0.16, + "learning_rate": 1.909791823184825e-05, + "loss": 0.4034, + "step": 2047 + }, + { + "epoch": 0.16, + "learning_rate": 1.909685286272846e-05, + "loss": 0.4512, + "step": 2048 + }, + { + "epoch": 0.16, + "learning_rate": 1.9095786894624685e-05, + "loss": 0.4214, + "step": 2049 + }, + { + "epoch": 0.16, + "learning_rate": 1.9094720327607102e-05, + "loss": 0.4919, + "step": 2050 + }, + { + "epoch": 0.16, + "learning_rate": 1.909365316174595e-05, + "loss": 0.4066, + "step": 2051 + }, + { + "epoch": 0.16, + "learning_rate": 1.9092585397111492e-05, + "loss": 0.3218, + "step": 2052 + }, + { + "epoch": 0.16, + "learning_rate": 1.9091517033774038e-05, + "loss": 0.4456, + "step": 2053 + }, + { + "epoch": 0.16, + "learning_rate": 1.9090448071803932e-05, + "loss": 0.4223, + "step": 2054 + }, + { + "epoch": 0.16, + "learning_rate": 1.908937851127156e-05, + "loss": 0.3923, + "step": 2055 + }, + { + "epoch": 0.16, + "learning_rate": 1.908830835224735e-05, + "loss": 0.426, + "step": 2056 + }, + { + "epoch": 0.16, + "learning_rate": 1.9087237594801762e-05, + "loss": 0.4025, + "step": 2057 + }, + { + "epoch": 0.16, + "learning_rate": 1.9086166239005305e-05, + "loss": 0.5424, + "step": 2058 + }, + { + "epoch": 0.16, + "learning_rate": 1.908509428492852e-05, + "loss": 0.4084, + "step": 2059 + }, + { + "epoch": 0.16, + "learning_rate": 1.9084021732641994e-05, + "loss": 0.3695, + "step": 2060 + }, + { + "epoch": 0.16, + "learning_rate": 1.9082948582216344e-05, + "loss": 0.4597, + "step": 2061 + }, + { + "epoch": 0.16, + "learning_rate": 1.9081874833722234e-05, + "loss": 0.3876, + "step": 2062 + }, + { + "epoch": 0.16, + "learning_rate": 1.908080048723037e-05, + "loss": 0.5321, + "step": 2063 + }, + { + "epoch": 0.16, + "learning_rate": 1.9079725542811484e-05, + "loss": 0.4228, + "step": 2064 + }, + { + "epoch": 0.16, + "learning_rate": 1.907865000053636e-05, + "loss": 0.4125, + "step": 2065 + }, + { + "epoch": 0.16, + "learning_rate": 1.9077573860475815e-05, + "loss": 0.4418, + "step": 2066 + }, + { + "epoch": 0.16, + "learning_rate": 1.9076497122700713e-05, + "loss": 0.3674, + "step": 2067 + }, + { + "epoch": 0.16, + "learning_rate": 1.9075419787281948e-05, + "loss": 0.4789, + "step": 2068 + }, + { + "epoch": 0.16, + "learning_rate": 1.9074341854290458e-05, + "loss": 0.2975, + "step": 2069 + }, + { + "epoch": 0.16, + "learning_rate": 1.907326332379722e-05, + "loss": 0.3549, + "step": 2070 + }, + { + "epoch": 0.16, + "learning_rate": 1.9072184195873248e-05, + "loss": 0.286, + "step": 2071 + }, + { + "epoch": 0.16, + "learning_rate": 1.9071104470589603e-05, + "loss": 0.3619, + "step": 2072 + }, + { + "epoch": 0.16, + "learning_rate": 1.9070024148017375e-05, + "loss": 0.4715, + "step": 2073 + }, + { + "epoch": 0.16, + "learning_rate": 1.9068943228227695e-05, + "loss": 0.434, + "step": 2074 + }, + { + "epoch": 0.16, + "learning_rate": 1.9067861711291744e-05, + "loss": 0.3929, + "step": 2075 + }, + { + "epoch": 0.16, + "learning_rate": 1.906677959728073e-05, + "loss": 0.4639, + "step": 2076 + }, + { + "epoch": 0.16, + "learning_rate": 1.9065696886265906e-05, + "loss": 0.5048, + "step": 2077 + }, + { + "epoch": 0.16, + "learning_rate": 1.9064613578318564e-05, + "loss": 0.2761, + "step": 2078 + }, + { + "epoch": 0.16, + "learning_rate": 1.9063529673510036e-05, + "loss": 0.3054, + "step": 2079 + }, + { + "epoch": 0.16, + "learning_rate": 1.9062445171911688e-05, + "loss": 0.4512, + "step": 2080 + }, + { + "epoch": 0.16, + "learning_rate": 1.9061360073594933e-05, + "loss": 0.4013, + "step": 2081 + }, + { + "epoch": 0.16, + "learning_rate": 1.9060274378631215e-05, + "loss": 0.5748, + "step": 2082 + }, + { + "epoch": 0.17, + "learning_rate": 1.9059188087092025e-05, + "loss": 0.4702, + "step": 2083 + }, + { + "epoch": 0.17, + "learning_rate": 1.905810119904889e-05, + "loss": 0.3379, + "step": 2084 + }, + { + "epoch": 0.17, + "learning_rate": 1.9057013714573375e-05, + "loss": 0.5644, + "step": 2085 + }, + { + "epoch": 0.17, + "learning_rate": 1.9055925633737088e-05, + "loss": 0.4501, + "step": 2086 + }, + { + "epoch": 0.17, + "learning_rate": 1.905483695661167e-05, + "loss": 0.4664, + "step": 2087 + }, + { + "epoch": 0.17, + "learning_rate": 1.905374768326881e-05, + "loss": 0.3591, + "step": 2088 + }, + { + "epoch": 0.17, + "learning_rate": 1.9052657813780226e-05, + "loss": 0.4382, + "step": 2089 + }, + { + "epoch": 0.17, + "learning_rate": 1.9051567348217686e-05, + "loss": 0.3202, + "step": 2090 + }, + { + "epoch": 0.17, + "learning_rate": 1.905047628665299e-05, + "loss": 0.3581, + "step": 2091 + }, + { + "epoch": 0.17, + "learning_rate": 1.9049384629157974e-05, + "loss": 0.374, + "step": 2092 + }, + { + "epoch": 0.17, + "learning_rate": 1.9048292375804527e-05, + "loss": 0.538, + "step": 2093 + }, + { + "epoch": 0.17, + "learning_rate": 1.9047199526664565e-05, + "loss": 0.5461, + "step": 2094 + }, + { + "epoch": 0.17, + "learning_rate": 1.9046106081810047e-05, + "loss": 0.499, + "step": 2095 + }, + { + "epoch": 0.17, + "learning_rate": 1.9045012041312966e-05, + "loss": 0.4814, + "step": 2096 + }, + { + "epoch": 0.17, + "learning_rate": 1.904391740524537e-05, + "loss": 0.3032, + "step": 2097 + }, + { + "epoch": 0.17, + "learning_rate": 1.9042822173679325e-05, + "loss": 0.4416, + "step": 2098 + }, + { + "epoch": 0.17, + "learning_rate": 1.9041726346686952e-05, + "loss": 0.3596, + "step": 2099 + }, + { + "epoch": 0.17, + "learning_rate": 1.9040629924340406e-05, + "loss": 0.3995, + "step": 2100 + }, + { + "epoch": 0.17, + "learning_rate": 1.903953290671188e-05, + "loss": 0.4241, + "step": 2101 + }, + { + "epoch": 0.17, + "learning_rate": 1.903843529387361e-05, + "loss": 0.4696, + "step": 2102 + }, + { + "epoch": 0.17, + "learning_rate": 1.903733708589786e-05, + "loss": 0.4785, + "step": 2103 + }, + { + "epoch": 0.17, + "learning_rate": 1.9036238282856952e-05, + "loss": 0.5723, + "step": 2104 + }, + { + "epoch": 0.17, + "learning_rate": 1.903513888482323e-05, + "loss": 0.4247, + "step": 2105 + }, + { + "epoch": 0.17, + "learning_rate": 1.903403889186909e-05, + "loss": 0.2982, + "step": 2106 + }, + { + "epoch": 0.17, + "learning_rate": 1.903293830406696e-05, + "loss": 0.483, + "step": 2107 + }, + { + "epoch": 0.17, + "learning_rate": 1.9031837121489303e-05, + "loss": 0.5181, + "step": 2108 + }, + { + "epoch": 0.17, + "learning_rate": 1.903073534420863e-05, + "loss": 0.3799, + "step": 2109 + }, + { + "epoch": 0.17, + "learning_rate": 1.9029632972297488e-05, + "loss": 0.4, + "step": 2110 + }, + { + "epoch": 0.17, + "learning_rate": 1.9028530005828462e-05, + "loss": 0.367, + "step": 2111 + }, + { + "epoch": 0.17, + "learning_rate": 1.9027426444874177e-05, + "loss": 0.4978, + "step": 2112 + }, + { + "epoch": 0.17, + "learning_rate": 1.90263222895073e-05, + "loss": 0.3986, + "step": 2113 + }, + { + "epoch": 0.17, + "learning_rate": 1.902521753980053e-05, + "loss": 0.4262, + "step": 2114 + }, + { + "epoch": 0.17, + "learning_rate": 1.9024112195826614e-05, + "loss": 0.4582, + "step": 2115 + }, + { + "epoch": 0.17, + "learning_rate": 1.902300625765833e-05, + "loss": 0.3908, + "step": 2116 + }, + { + "epoch": 0.17, + "learning_rate": 1.9021899725368498e-05, + "loss": 0.4041, + "step": 2117 + }, + { + "epoch": 0.17, + "learning_rate": 1.902079259902998e-05, + "loss": 0.3873, + "step": 2118 + }, + { + "epoch": 0.17, + "learning_rate": 1.901968487871568e-05, + "loss": 0.3163, + "step": 2119 + }, + { + "epoch": 0.17, + "learning_rate": 1.9018576564498527e-05, + "loss": 0.4693, + "step": 2120 + }, + { + "epoch": 0.17, + "learning_rate": 1.9017467656451498e-05, + "loss": 0.5117, + "step": 2121 + }, + { + "epoch": 0.17, + "learning_rate": 1.9016358154647618e-05, + "loss": 0.4398, + "step": 2122 + }, + { + "epoch": 0.17, + "learning_rate": 1.9015248059159937e-05, + "loss": 0.4237, + "step": 2123 + }, + { + "epoch": 0.17, + "learning_rate": 1.901413737006155e-05, + "loss": 0.448, + "step": 2124 + }, + { + "epoch": 0.17, + "learning_rate": 1.901302608742559e-05, + "loss": 0.4468, + "step": 2125 + }, + { + "epoch": 0.17, + "learning_rate": 1.9011914211325225e-05, + "loss": 0.4642, + "step": 2126 + }, + { + "epoch": 0.17, + "learning_rate": 1.9010801741833678e-05, + "loss": 0.3554, + "step": 2127 + }, + { + "epoch": 0.17, + "learning_rate": 1.900968867902419e-05, + "loss": 0.4719, + "step": 2128 + }, + { + "epoch": 0.17, + "learning_rate": 1.900857502297006e-05, + "loss": 0.3376, + "step": 2129 + }, + { + "epoch": 0.17, + "learning_rate": 1.9007460773744605e-05, + "loss": 0.2889, + "step": 2130 + }, + { + "epoch": 0.17, + "learning_rate": 1.90063459314212e-05, + "loss": 0.2846, + "step": 2131 + }, + { + "epoch": 0.17, + "learning_rate": 1.9005230496073256e-05, + "loss": 0.2707, + "step": 2132 + }, + { + "epoch": 0.17, + "learning_rate": 1.900411446777421e-05, + "loss": 0.4066, + "step": 2133 + }, + { + "epoch": 0.17, + "learning_rate": 1.900299784659755e-05, + "loss": 0.4449, + "step": 2134 + }, + { + "epoch": 0.17, + "learning_rate": 1.9001880632616806e-05, + "loss": 0.4353, + "step": 2135 + }, + { + "epoch": 0.17, + "learning_rate": 1.9000762825905535e-05, + "loss": 0.4566, + "step": 2136 + }, + { + "epoch": 0.17, + "learning_rate": 1.899964442653734e-05, + "loss": 0.3644, + "step": 2137 + }, + { + "epoch": 0.17, + "learning_rate": 1.8998525434585862e-05, + "loss": 0.4622, + "step": 2138 + }, + { + "epoch": 0.17, + "learning_rate": 1.8997405850124786e-05, + "loss": 0.3709, + "step": 2139 + }, + { + "epoch": 0.17, + "learning_rate": 1.8996285673227826e-05, + "loss": 0.3846, + "step": 2140 + }, + { + "epoch": 0.17, + "learning_rate": 1.899516490396874e-05, + "loss": 0.4274, + "step": 2141 + }, + { + "epoch": 0.17, + "learning_rate": 1.8994043542421328e-05, + "loss": 0.4285, + "step": 2142 + }, + { + "epoch": 0.17, + "learning_rate": 1.8992921588659424e-05, + "loss": 0.355, + "step": 2143 + }, + { + "epoch": 0.17, + "learning_rate": 1.8991799042756906e-05, + "loss": 0.3769, + "step": 2144 + }, + { + "epoch": 0.17, + "learning_rate": 1.8990675904787688e-05, + "loss": 0.2821, + "step": 2145 + }, + { + "epoch": 0.17, + "learning_rate": 1.898955217482572e-05, + "loss": 0.5438, + "step": 2146 + }, + { + "epoch": 0.17, + "learning_rate": 1.8988427852944997e-05, + "loss": 0.2819, + "step": 2147 + }, + { + "epoch": 0.17, + "learning_rate": 1.898730293921955e-05, + "loss": 0.3948, + "step": 2148 + }, + { + "epoch": 0.17, + "learning_rate": 1.8986177433723446e-05, + "loss": 0.4962, + "step": 2149 + }, + { + "epoch": 0.17, + "learning_rate": 1.89850513365308e-05, + "loss": 0.3876, + "step": 2150 + }, + { + "epoch": 0.17, + "learning_rate": 1.8983924647715756e-05, + "loss": 0.3826, + "step": 2151 + }, + { + "epoch": 0.17, + "learning_rate": 1.89827973673525e-05, + "loss": 0.3794, + "step": 2152 + }, + { + "epoch": 0.17, + "learning_rate": 1.8981669495515264e-05, + "loss": 0.4463, + "step": 2153 + }, + { + "epoch": 0.17, + "learning_rate": 1.8980541032278302e-05, + "loss": 0.5992, + "step": 2154 + }, + { + "epoch": 0.17, + "learning_rate": 1.8979411977715928e-05, + "loss": 0.3926, + "step": 2155 + }, + { + "epoch": 0.17, + "learning_rate": 1.8978282331902483e-05, + "loss": 0.4502, + "step": 2156 + }, + { + "epoch": 0.17, + "learning_rate": 1.8977152094912346e-05, + "loss": 0.4229, + "step": 2157 + }, + { + "epoch": 0.17, + "learning_rate": 1.897602126681994e-05, + "loss": 0.3499, + "step": 2158 + }, + { + "epoch": 0.17, + "learning_rate": 1.897488984769972e-05, + "loss": 0.4686, + "step": 2159 + }, + { + "epoch": 0.17, + "learning_rate": 1.8973757837626193e-05, + "loss": 0.331, + "step": 2160 + }, + { + "epoch": 0.17, + "learning_rate": 1.8972625236673887e-05, + "loss": 0.2937, + "step": 2161 + }, + { + "epoch": 0.17, + "learning_rate": 1.8971492044917386e-05, + "loss": 0.352, + "step": 2162 + }, + { + "epoch": 0.17, + "learning_rate": 1.8970358262431297e-05, + "loss": 0.5212, + "step": 2163 + }, + { + "epoch": 0.17, + "learning_rate": 1.8969223889290283e-05, + "loss": 0.4715, + "step": 2164 + }, + { + "epoch": 0.17, + "learning_rate": 1.8968088925569032e-05, + "loss": 0.5249, + "step": 2165 + }, + { + "epoch": 0.17, + "learning_rate": 1.896695337134228e-05, + "loss": 0.3933, + "step": 2166 + }, + { + "epoch": 0.17, + "learning_rate": 1.8965817226684794e-05, + "loss": 0.3574, + "step": 2167 + }, + { + "epoch": 0.17, + "learning_rate": 1.896468049167138e-05, + "loss": 0.4052, + "step": 2168 + }, + { + "epoch": 0.17, + "learning_rate": 1.896354316637689e-05, + "loss": 0.2252, + "step": 2169 + }, + { + "epoch": 0.17, + "learning_rate": 1.8962405250876218e-05, + "loss": 0.3668, + "step": 2170 + }, + { + "epoch": 0.17, + "learning_rate": 1.896126674524428e-05, + "loss": 0.3252, + "step": 2171 + }, + { + "epoch": 0.17, + "learning_rate": 1.896012764955605e-05, + "loss": 0.3122, + "step": 2172 + }, + { + "epoch": 0.17, + "learning_rate": 1.8958987963886526e-05, + "loss": 0.39, + "step": 2173 + }, + { + "epoch": 0.17, + "learning_rate": 1.8957847688310752e-05, + "loss": 0.3936, + "step": 2174 + }, + { + "epoch": 0.17, + "learning_rate": 1.8956706822903812e-05, + "loss": 0.3337, + "step": 2175 + }, + { + "epoch": 0.17, + "learning_rate": 1.8955565367740824e-05, + "loss": 0.3478, + "step": 2176 + }, + { + "epoch": 0.17, + "learning_rate": 1.8954423322896944e-05, + "loss": 0.3991, + "step": 2177 + }, + { + "epoch": 0.17, + "learning_rate": 1.895328068844738e-05, + "loss": 0.4501, + "step": 2178 + }, + { + "epoch": 0.17, + "learning_rate": 1.8952137464467358e-05, + "loss": 0.4349, + "step": 2179 + }, + { + "epoch": 0.17, + "learning_rate": 1.895099365103216e-05, + "loss": 0.344, + "step": 2180 + }, + { + "epoch": 0.17, + "learning_rate": 1.89498492482171e-05, + "loss": 0.413, + "step": 2181 + }, + { + "epoch": 0.17, + "learning_rate": 1.8948704256097533e-05, + "loss": 0.4534, + "step": 2182 + }, + { + "epoch": 0.17, + "learning_rate": 1.8947558674748844e-05, + "loss": 0.4423, + "step": 2183 + }, + { + "epoch": 0.17, + "learning_rate": 1.8946412504246474e-05, + "loss": 0.4468, + "step": 2184 + }, + { + "epoch": 0.17, + "learning_rate": 1.8945265744665886e-05, + "loss": 0.3955, + "step": 2185 + }, + { + "epoch": 0.17, + "learning_rate": 1.8944118396082594e-05, + "loss": 0.4999, + "step": 2186 + }, + { + "epoch": 0.17, + "learning_rate": 1.8942970458572138e-05, + "loss": 0.3697, + "step": 2187 + }, + { + "epoch": 0.17, + "learning_rate": 1.894182193221011e-05, + "loss": 0.3789, + "step": 2188 + }, + { + "epoch": 0.17, + "learning_rate": 1.894067281707213e-05, + "loss": 0.3916, + "step": 2189 + }, + { + "epoch": 0.17, + "learning_rate": 1.893952311323387e-05, + "loss": 0.3824, + "step": 2190 + }, + { + "epoch": 0.17, + "learning_rate": 1.8938372820771024e-05, + "loss": 0.4641, + "step": 2191 + }, + { + "epoch": 0.17, + "learning_rate": 1.8937221939759334e-05, + "loss": 0.4176, + "step": 2192 + }, + { + "epoch": 0.17, + "learning_rate": 1.8936070470274587e-05, + "loss": 0.4081, + "step": 2193 + }, + { + "epoch": 0.17, + "learning_rate": 1.8934918412392596e-05, + "loss": 0.3824, + "step": 2194 + }, + { + "epoch": 0.17, + "learning_rate": 1.893376576618922e-05, + "loss": 0.5199, + "step": 2195 + }, + { + "epoch": 0.17, + "learning_rate": 1.8932612531740354e-05, + "loss": 0.5104, + "step": 2196 + }, + { + "epoch": 0.17, + "learning_rate": 1.893145870912193e-05, + "loss": 0.4715, + "step": 2197 + }, + { + "epoch": 0.17, + "learning_rate": 1.8930304298409933e-05, + "loss": 0.3677, + "step": 2198 + }, + { + "epoch": 0.17, + "learning_rate": 1.8929149299680364e-05, + "loss": 0.4254, + "step": 2199 + }, + { + "epoch": 0.17, + "learning_rate": 1.8927993713009275e-05, + "loss": 0.3231, + "step": 2200 + }, + { + "epoch": 0.17, + "learning_rate": 1.892683753847276e-05, + "loss": 0.3727, + "step": 2201 + }, + { + "epoch": 0.17, + "learning_rate": 1.892568077614695e-05, + "loss": 0.439, + "step": 2202 + }, + { + "epoch": 0.17, + "learning_rate": 1.892452342610801e-05, + "loss": 0.537, + "step": 2203 + }, + { + "epoch": 0.17, + "learning_rate": 1.892336548843214e-05, + "loss": 0.4307, + "step": 2204 + }, + { + "epoch": 0.17, + "learning_rate": 1.892220696319559e-05, + "loss": 0.3031, + "step": 2205 + }, + { + "epoch": 0.17, + "learning_rate": 1.8921047850474645e-05, + "loss": 0.4848, + "step": 2206 + }, + { + "epoch": 0.17, + "learning_rate": 1.891988815034562e-05, + "loss": 0.345, + "step": 2207 + }, + { + "epoch": 0.17, + "learning_rate": 1.891872786288488e-05, + "loss": 0.5914, + "step": 2208 + }, + { + "epoch": 0.18, + "learning_rate": 1.8917566988168826e-05, + "loss": 0.4679, + "step": 2209 + }, + { + "epoch": 0.18, + "learning_rate": 1.8916405526273894e-05, + "loss": 0.4811, + "step": 2210 + }, + { + "epoch": 0.18, + "learning_rate": 1.8915243477276563e-05, + "loss": 0.4288, + "step": 2211 + }, + { + "epoch": 0.18, + "learning_rate": 1.8914080841253348e-05, + "loss": 0.3029, + "step": 2212 + }, + { + "epoch": 0.18, + "learning_rate": 1.8912917618280796e-05, + "loss": 0.4719, + "step": 2213 + }, + { + "epoch": 0.18, + "learning_rate": 1.8911753808435508e-05, + "loss": 0.4917, + "step": 2214 + }, + { + "epoch": 0.18, + "learning_rate": 1.891058941179411e-05, + "loss": 0.3915, + "step": 2215 + }, + { + "epoch": 0.18, + "learning_rate": 1.8909424428433278e-05, + "loss": 0.3953, + "step": 2216 + }, + { + "epoch": 0.18, + "learning_rate": 1.8908258858429716e-05, + "loss": 0.4228, + "step": 2217 + }, + { + "epoch": 0.18, + "learning_rate": 1.890709270186017e-05, + "loss": 0.4075, + "step": 2218 + }, + { + "epoch": 0.18, + "learning_rate": 1.890592595880143e-05, + "loss": 0.3597, + "step": 2219 + }, + { + "epoch": 0.18, + "learning_rate": 1.890475862933032e-05, + "loss": 0.5669, + "step": 2220 + }, + { + "epoch": 0.18, + "learning_rate": 1.8903590713523698e-05, + "loss": 0.3936, + "step": 2221 + }, + { + "epoch": 0.18, + "learning_rate": 1.8902422211458466e-05, + "loss": 0.2788, + "step": 2222 + }, + { + "epoch": 0.18, + "learning_rate": 1.890125312321157e-05, + "loss": 0.4251, + "step": 2223 + }, + { + "epoch": 0.18, + "learning_rate": 1.8900083448859986e-05, + "loss": 0.4534, + "step": 2224 + }, + { + "epoch": 0.18, + "learning_rate": 1.8898913188480733e-05, + "loss": 0.3466, + "step": 2225 + }, + { + "epoch": 0.18, + "learning_rate": 1.8897742342150863e-05, + "loss": 0.4368, + "step": 2226 + }, + { + "epoch": 0.18, + "learning_rate": 1.8896570909947477e-05, + "loss": 0.5173, + "step": 2227 + }, + { + "epoch": 0.18, + "learning_rate": 1.88953988919477e-05, + "loss": 0.3789, + "step": 2228 + }, + { + "epoch": 0.18, + "learning_rate": 1.8894226288228707e-05, + "loss": 0.4369, + "step": 2229 + }, + { + "epoch": 0.18, + "learning_rate": 1.8893053098867714e-05, + "loss": 0.4272, + "step": 2230 + }, + { + "epoch": 0.18, + "learning_rate": 1.889187932394196e-05, + "loss": 0.4872, + "step": 2231 + }, + { + "epoch": 0.18, + "learning_rate": 1.889070496352874e-05, + "loss": 0.4169, + "step": 2232 + }, + { + "epoch": 0.18, + "learning_rate": 1.888953001770538e-05, + "loss": 0.5049, + "step": 2233 + }, + { + "epoch": 0.18, + "learning_rate": 1.8888354486549238e-05, + "loss": 0.478, + "step": 2234 + }, + { + "epoch": 0.18, + "learning_rate": 1.888717837013772e-05, + "loss": 0.4091, + "step": 2235 + }, + { + "epoch": 0.18, + "learning_rate": 1.8886001668548273e-05, + "loss": 0.4921, + "step": 2236 + }, + { + "epoch": 0.18, + "learning_rate": 1.8884824381858368e-05, + "loss": 0.3643, + "step": 2237 + }, + { + "epoch": 0.18, + "learning_rate": 1.888364651014553e-05, + "loss": 0.3344, + "step": 2238 + }, + { + "epoch": 0.18, + "learning_rate": 1.888246805348732e-05, + "loss": 0.3386, + "step": 2239 + }, + { + "epoch": 0.18, + "learning_rate": 1.8881289011961323e-05, + "loss": 0.4314, + "step": 2240 + }, + { + "epoch": 0.18, + "learning_rate": 1.8880109385645184e-05, + "loss": 0.4037, + "step": 2241 + }, + { + "epoch": 0.18, + "learning_rate": 1.8878929174616566e-05, + "loss": 0.4162, + "step": 2242 + }, + { + "epoch": 0.18, + "learning_rate": 1.887774837895318e-05, + "loss": 0.4261, + "step": 2243 + }, + { + "epoch": 0.18, + "learning_rate": 1.887656699873279e-05, + "loss": 0.5008, + "step": 2244 + }, + { + "epoch": 0.18, + "learning_rate": 1.887538503403317e-05, + "loss": 0.4585, + "step": 2245 + }, + { + "epoch": 0.18, + "learning_rate": 1.8874202484932148e-05, + "loss": 0.5234, + "step": 2246 + }, + { + "epoch": 0.18, + "learning_rate": 1.8873019351507596e-05, + "loss": 0.4939, + "step": 2247 + }, + { + "epoch": 0.18, + "learning_rate": 1.887183563383741e-05, + "loss": 0.4145, + "step": 2248 + }, + { + "epoch": 0.18, + "learning_rate": 1.8870651331999542e-05, + "loss": 0.3583, + "step": 2249 + }, + { + "epoch": 0.18, + "learning_rate": 1.886946644607196e-05, + "loss": 0.3421, + "step": 2250 + }, + { + "epoch": 0.18, + "learning_rate": 1.8868280976132697e-05, + "loss": 0.3496, + "step": 2251 + }, + { + "epoch": 0.18, + "learning_rate": 1.8867094922259798e-05, + "loss": 0.4057, + "step": 2252 + }, + { + "epoch": 0.18, + "learning_rate": 1.8865908284531368e-05, + "loss": 0.3347, + "step": 2253 + }, + { + "epoch": 0.18, + "learning_rate": 1.8864721063025536e-05, + "loss": 0.3303, + "step": 2254 + }, + { + "epoch": 0.18, + "learning_rate": 1.8863533257820475e-05, + "loss": 0.2824, + "step": 2255 + }, + { + "epoch": 0.18, + "learning_rate": 1.8862344868994395e-05, + "loss": 0.455, + "step": 2256 + }, + { + "epoch": 0.18, + "learning_rate": 1.8861155896625553e-05, + "loss": 0.3619, + "step": 2257 + }, + { + "epoch": 0.18, + "learning_rate": 1.885996634079223e-05, + "loss": 0.3623, + "step": 2258 + }, + { + "epoch": 0.18, + "learning_rate": 1.8858776201572758e-05, + "loss": 0.3877, + "step": 2259 + }, + { + "epoch": 0.18, + "learning_rate": 1.8857585479045493e-05, + "loss": 0.2871, + "step": 2260 + }, + { + "epoch": 0.18, + "learning_rate": 1.8856394173288848e-05, + "loss": 0.5299, + "step": 2261 + }, + { + "epoch": 0.18, + "learning_rate": 1.8855202284381264e-05, + "loss": 0.4715, + "step": 2262 + }, + { + "epoch": 0.18, + "learning_rate": 1.8854009812401213e-05, + "loss": 0.3674, + "step": 2263 + }, + { + "epoch": 0.18, + "learning_rate": 1.885281675742722e-05, + "loss": 0.4199, + "step": 2264 + }, + { + "epoch": 0.18, + "learning_rate": 1.885162311953784e-05, + "loss": 0.3883, + "step": 2265 + }, + { + "epoch": 0.18, + "learning_rate": 1.885042889881167e-05, + "loss": 0.3299, + "step": 2266 + }, + { + "epoch": 0.18, + "learning_rate": 1.8849234095327343e-05, + "loss": 0.5086, + "step": 2267 + }, + { + "epoch": 0.18, + "learning_rate": 1.884803870916353e-05, + "loss": 0.4302, + "step": 2268 + }, + { + "epoch": 0.18, + "learning_rate": 1.884684274039894e-05, + "loss": 0.4863, + "step": 2269 + }, + { + "epoch": 0.18, + "learning_rate": 1.8845646189112327e-05, + "loss": 0.4748, + "step": 2270 + }, + { + "epoch": 0.18, + "learning_rate": 1.8844449055382473e-05, + "loss": 0.3609, + "step": 2271 + }, + { + "epoch": 0.18, + "learning_rate": 1.8843251339288207e-05, + "loss": 0.3633, + "step": 2272 + }, + { + "epoch": 0.18, + "learning_rate": 1.884205304090839e-05, + "loss": 0.3506, + "step": 2273 + }, + { + "epoch": 0.18, + "learning_rate": 1.8840854160321926e-05, + "loss": 0.3274, + "step": 2274 + }, + { + "epoch": 0.18, + "learning_rate": 1.8839654697607756e-05, + "loss": 0.3027, + "step": 2275 + }, + { + "epoch": 0.18, + "learning_rate": 1.8838454652844857e-05, + "loss": 0.3433, + "step": 2276 + }, + { + "epoch": 0.18, + "learning_rate": 1.8837254026112245e-05, + "loss": 0.2583, + "step": 2277 + }, + { + "epoch": 0.18, + "learning_rate": 1.883605281748898e-05, + "loss": 0.4209, + "step": 2278 + }, + { + "epoch": 0.18, + "learning_rate": 1.8834851027054152e-05, + "loss": 0.2946, + "step": 2279 + }, + { + "epoch": 0.18, + "learning_rate": 1.8833648654886898e-05, + "loss": 0.4426, + "step": 2280 + }, + { + "epoch": 0.18, + "learning_rate": 1.883244570106638e-05, + "loss": 0.2782, + "step": 2281 + }, + { + "epoch": 0.18, + "learning_rate": 1.8831242165671816e-05, + "loss": 0.3936, + "step": 2282 + }, + { + "epoch": 0.18, + "learning_rate": 1.8830038048782445e-05, + "loss": 0.4937, + "step": 2283 + }, + { + "epoch": 0.18, + "learning_rate": 1.8828833350477556e-05, + "loss": 0.3631, + "step": 2284 + }, + { + "epoch": 0.18, + "learning_rate": 1.8827628070836477e-05, + "loss": 0.5489, + "step": 2285 + }, + { + "epoch": 0.18, + "learning_rate": 1.8826422209938563e-05, + "loss": 0.2803, + "step": 2286 + }, + { + "epoch": 0.18, + "learning_rate": 1.8825215767863215e-05, + "loss": 0.47, + "step": 2287 + }, + { + "epoch": 0.18, + "learning_rate": 1.8824008744689873e-05, + "loss": 0.3655, + "step": 2288 + }, + { + "epoch": 0.18, + "learning_rate": 1.8822801140498014e-05, + "loss": 0.4499, + "step": 2289 + }, + { + "epoch": 0.18, + "learning_rate": 1.8821592955367154e-05, + "loss": 0.5626, + "step": 2290 + }, + { + "epoch": 0.18, + "learning_rate": 1.8820384189376845e-05, + "loss": 0.4171, + "step": 2291 + }, + { + "epoch": 0.18, + "learning_rate": 1.8819174842606675e-05, + "loss": 0.4184, + "step": 2292 + }, + { + "epoch": 0.18, + "learning_rate": 1.8817964915136277e-05, + "loss": 0.3277, + "step": 2293 + }, + { + "epoch": 0.18, + "learning_rate": 1.881675440704532e-05, + "loss": 0.4268, + "step": 2294 + }, + { + "epoch": 0.18, + "learning_rate": 1.881554331841351e-05, + "loss": 0.4049, + "step": 2295 + }, + { + "epoch": 0.18, + "learning_rate": 1.881433164932059e-05, + "loss": 0.4139, + "step": 2296 + }, + { + "epoch": 0.18, + "learning_rate": 1.881311939984634e-05, + "loss": 0.3823, + "step": 2297 + }, + { + "epoch": 0.18, + "learning_rate": 1.8811906570070583e-05, + "loss": 0.3131, + "step": 2298 + }, + { + "epoch": 0.18, + "learning_rate": 1.8810693160073184e-05, + "loss": 0.4299, + "step": 2299 + }, + { + "epoch": 0.18, + "learning_rate": 1.880947916993403e-05, + "loss": 0.4149, + "step": 2300 + }, + { + "epoch": 0.18, + "learning_rate": 1.8808264599733065e-05, + "loss": 0.2752, + "step": 2301 + }, + { + "epoch": 0.18, + "learning_rate": 1.8807049449550254e-05, + "loss": 0.2812, + "step": 2302 + }, + { + "epoch": 0.18, + "learning_rate": 1.8805833719465617e-05, + "loss": 0.5224, + "step": 2303 + }, + { + "epoch": 0.18, + "learning_rate": 1.88046174095592e-05, + "loss": 0.5012, + "step": 2304 + }, + { + "epoch": 0.18, + "learning_rate": 1.880340051991109e-05, + "loss": 0.3741, + "step": 2305 + }, + { + "epoch": 0.18, + "learning_rate": 1.8802183050601417e-05, + "loss": 0.3365, + "step": 2306 + }, + { + "epoch": 0.18, + "learning_rate": 1.8800965001710342e-05, + "loss": 0.4669, + "step": 2307 + }, + { + "epoch": 0.18, + "learning_rate": 1.879974637331807e-05, + "loss": 0.4839, + "step": 2308 + }, + { + "epoch": 0.18, + "learning_rate": 1.879852716550484e-05, + "loss": 0.4675, + "step": 2309 + }, + { + "epoch": 0.18, + "learning_rate": 1.8797307378350935e-05, + "loss": 0.449, + "step": 2310 + }, + { + "epoch": 0.18, + "learning_rate": 1.8796087011936665e-05, + "loss": 0.3752, + "step": 2311 + }, + { + "epoch": 0.18, + "learning_rate": 1.8794866066342394e-05, + "loss": 0.4026, + "step": 2312 + }, + { + "epoch": 0.18, + "learning_rate": 1.879364454164851e-05, + "loss": 0.3563, + "step": 2313 + }, + { + "epoch": 0.18, + "learning_rate": 1.879242243793544e-05, + "loss": 0.4135, + "step": 2314 + }, + { + "epoch": 0.18, + "learning_rate": 1.8791199755283664e-05, + "loss": 0.4275, + "step": 2315 + }, + { + "epoch": 0.18, + "learning_rate": 1.878997649377368e-05, + "loss": 0.3698, + "step": 2316 + }, + { + "epoch": 0.18, + "learning_rate": 1.8788752653486045e-05, + "loss": 0.5306, + "step": 2317 + }, + { + "epoch": 0.18, + "learning_rate": 1.878752823450133e-05, + "loss": 0.4045, + "step": 2318 + }, + { + "epoch": 0.18, + "learning_rate": 1.878630323690017e-05, + "loss": 0.3431, + "step": 2319 + }, + { + "epoch": 0.18, + "learning_rate": 1.8785077660763217e-05, + "loss": 0.3946, + "step": 2320 + }, + { + "epoch": 0.18, + "learning_rate": 1.8783851506171166e-05, + "loss": 0.4285, + "step": 2321 + }, + { + "epoch": 0.18, + "learning_rate": 1.8782624773204764e-05, + "loss": 0.384, + "step": 2322 + }, + { + "epoch": 0.18, + "learning_rate": 1.8781397461944777e-05, + "loss": 0.3722, + "step": 2323 + }, + { + "epoch": 0.18, + "learning_rate": 1.8780169572472024e-05, + "loss": 0.3734, + "step": 2324 + }, + { + "epoch": 0.18, + "learning_rate": 1.8778941104867347e-05, + "loss": 0.2507, + "step": 2325 + }, + { + "epoch": 0.18, + "learning_rate": 1.8777712059211643e-05, + "loss": 0.4406, + "step": 2326 + }, + { + "epoch": 0.18, + "learning_rate": 1.8776482435585836e-05, + "loss": 0.4249, + "step": 2327 + }, + { + "epoch": 0.18, + "learning_rate": 1.877525223407089e-05, + "loss": 0.4268, + "step": 2328 + }, + { + "epoch": 0.18, + "learning_rate": 1.877402145474781e-05, + "loss": 0.4474, + "step": 2329 + }, + { + "epoch": 0.18, + "learning_rate": 1.877279009769763e-05, + "loss": 0.5109, + "step": 2330 + }, + { + "epoch": 0.18, + "learning_rate": 1.8771558163001438e-05, + "loss": 0.4401, + "step": 2331 + }, + { + "epoch": 0.18, + "learning_rate": 1.8770325650740347e-05, + "loss": 0.3762, + "step": 2332 + }, + { + "epoch": 0.18, + "learning_rate": 1.876909256099551e-05, + "loss": 0.4048, + "step": 2333 + }, + { + "epoch": 0.18, + "learning_rate": 1.876785889384812e-05, + "loss": 0.445, + "step": 2334 + }, + { + "epoch": 0.18, + "learning_rate": 1.8766624649379415e-05, + "loss": 0.3985, + "step": 2335 + }, + { + "epoch": 0.19, + "learning_rate": 1.8765389827670657e-05, + "loss": 0.4192, + "step": 2336 + }, + { + "epoch": 0.19, + "learning_rate": 1.8764154428803155e-05, + "loss": 0.3202, + "step": 2337 + }, + { + "epoch": 0.19, + "learning_rate": 1.8762918452858256e-05, + "loss": 0.3233, + "step": 2338 + }, + { + "epoch": 0.19, + "learning_rate": 1.876168189991734e-05, + "loss": 0.4365, + "step": 2339 + }, + { + "epoch": 0.19, + "learning_rate": 1.876044477006183e-05, + "loss": 0.3746, + "step": 2340 + }, + { + "epoch": 0.19, + "learning_rate": 1.8759207063373183e-05, + "loss": 0.4385, + "step": 2341 + }, + { + "epoch": 0.19, + "learning_rate": 1.87579687799329e-05, + "loss": 0.4393, + "step": 2342 + }, + { + "epoch": 0.19, + "learning_rate": 1.875672991982251e-05, + "loss": 0.3652, + "step": 2343 + }, + { + "epoch": 0.19, + "learning_rate": 1.875549048312359e-05, + "loss": 0.3479, + "step": 2344 + }, + { + "epoch": 0.19, + "learning_rate": 1.8754250469917753e-05, + "loss": 0.5375, + "step": 2345 + }, + { + "epoch": 0.19, + "learning_rate": 1.8753009880286647e-05, + "loss": 0.4589, + "step": 2346 + }, + { + "epoch": 0.19, + "learning_rate": 1.8751768714311952e-05, + "loss": 0.4252, + "step": 2347 + }, + { + "epoch": 0.19, + "learning_rate": 1.87505269720754e-05, + "loss": 0.3849, + "step": 2348 + }, + { + "epoch": 0.19, + "learning_rate": 1.8749284653658754e-05, + "loss": 0.5014, + "step": 2349 + }, + { + "epoch": 0.19, + "learning_rate": 1.874804175914381e-05, + "loss": 0.3846, + "step": 2350 + }, + { + "epoch": 0.19, + "learning_rate": 1.8746798288612405e-05, + "loss": 0.3994, + "step": 2351 + }, + { + "epoch": 0.19, + "learning_rate": 1.8745554242146428e-05, + "loss": 0.4889, + "step": 2352 + }, + { + "epoch": 0.19, + "learning_rate": 1.874430961982778e-05, + "loss": 0.4205, + "step": 2353 + }, + { + "epoch": 0.19, + "learning_rate": 1.874306442173842e-05, + "loss": 0.3073, + "step": 2354 + }, + { + "epoch": 0.19, + "learning_rate": 1.8741818647960337e-05, + "loss": 0.373, + "step": 2355 + }, + { + "epoch": 0.19, + "learning_rate": 1.8740572298575558e-05, + "loss": 0.4651, + "step": 2356 + }, + { + "epoch": 0.19, + "learning_rate": 1.8739325373666152e-05, + "loss": 0.4527, + "step": 2357 + }, + { + "epoch": 0.19, + "learning_rate": 1.8738077873314218e-05, + "loss": 0.3904, + "step": 2358 + }, + { + "epoch": 0.19, + "learning_rate": 1.8736829797601903e-05, + "loss": 0.4976, + "step": 2359 + }, + { + "epoch": 0.19, + "learning_rate": 1.8735581146611387e-05, + "loss": 0.4467, + "step": 2360 + }, + { + "epoch": 0.19, + "learning_rate": 1.873433192042488e-05, + "loss": 0.3979, + "step": 2361 + }, + { + "epoch": 0.19, + "learning_rate": 1.8733082119124646e-05, + "loss": 0.3808, + "step": 2362 + }, + { + "epoch": 0.19, + "learning_rate": 1.8731831742792974e-05, + "loss": 0.4301, + "step": 2363 + }, + { + "epoch": 0.19, + "learning_rate": 1.87305807915122e-05, + "loss": 0.4781, + "step": 2364 + }, + { + "epoch": 0.19, + "learning_rate": 1.8729329265364685e-05, + "loss": 0.4562, + "step": 2365 + }, + { + "epoch": 0.19, + "learning_rate": 1.8728077164432844e-05, + "loss": 0.4567, + "step": 2366 + }, + { + "epoch": 0.19, + "learning_rate": 1.872682448879912e-05, + "loss": 0.3465, + "step": 2367 + }, + { + "epoch": 0.19, + "learning_rate": 1.8725571238545992e-05, + "loss": 0.3666, + "step": 2368 + }, + { + "epoch": 0.19, + "learning_rate": 1.872431741375598e-05, + "loss": 0.4242, + "step": 2369 + }, + { + "epoch": 0.19, + "learning_rate": 1.872306301451165e-05, + "loss": 0.3791, + "step": 2370 + }, + { + "epoch": 0.19, + "learning_rate": 1.872180804089559e-05, + "loss": 0.3532, + "step": 2371 + }, + { + "epoch": 0.19, + "learning_rate": 1.8720552492990438e-05, + "loss": 0.3618, + "step": 2372 + }, + { + "epoch": 0.19, + "learning_rate": 1.8719296370878866e-05, + "loss": 0.4912, + "step": 2373 + }, + { + "epoch": 0.19, + "learning_rate": 1.871803967464358e-05, + "loss": 0.373, + "step": 2374 + }, + { + "epoch": 0.19, + "learning_rate": 1.8716782404367333e-05, + "loss": 0.4097, + "step": 2375 + }, + { + "epoch": 0.19, + "learning_rate": 1.8715524560132906e-05, + "loss": 0.3661, + "step": 2376 + }, + { + "epoch": 0.19, + "learning_rate": 1.8714266142023124e-05, + "loss": 0.4028, + "step": 2377 + }, + { + "epoch": 0.19, + "learning_rate": 1.8713007150120846e-05, + "loss": 0.3584, + "step": 2378 + }, + { + "epoch": 0.19, + "learning_rate": 1.871174758450897e-05, + "loss": 0.4421, + "step": 2379 + }, + { + "epoch": 0.19, + "learning_rate": 1.8710487445270436e-05, + "loss": 0.437, + "step": 2380 + }, + { + "epoch": 0.19, + "learning_rate": 1.8709226732488216e-05, + "loss": 0.3627, + "step": 2381 + }, + { + "epoch": 0.19, + "learning_rate": 1.8707965446245317e-05, + "loss": 0.3066, + "step": 2382 + }, + { + "epoch": 0.19, + "learning_rate": 1.87067035866248e-05, + "loss": 0.3378, + "step": 2383 + }, + { + "epoch": 0.19, + "learning_rate": 1.8705441153709742e-05, + "loss": 0.3855, + "step": 2384 + }, + { + "epoch": 0.19, + "learning_rate": 1.8704178147583273e-05, + "loss": 0.3875, + "step": 2385 + }, + { + "epoch": 0.19, + "learning_rate": 1.8702914568328555e-05, + "loss": 0.3622, + "step": 2386 + }, + { + "epoch": 0.19, + "learning_rate": 1.8701650416028788e-05, + "loss": 0.327, + "step": 2387 + }, + { + "epoch": 0.19, + "learning_rate": 1.870038569076721e-05, + "loss": 0.3772, + "step": 2388 + }, + { + "epoch": 0.19, + "learning_rate": 1.86991203926271e-05, + "loss": 0.3047, + "step": 2389 + }, + { + "epoch": 0.19, + "learning_rate": 1.8697854521691767e-05, + "loss": 0.3646, + "step": 2390 + }, + { + "epoch": 0.19, + "learning_rate": 1.8696588078044566e-05, + "loss": 0.4898, + "step": 2391 + }, + { + "epoch": 0.19, + "learning_rate": 1.8695321061768886e-05, + "loss": 0.3465, + "step": 2392 + }, + { + "epoch": 0.19, + "learning_rate": 1.8694053472948154e-05, + "loss": 0.3109, + "step": 2393 + }, + { + "epoch": 0.19, + "learning_rate": 1.8692785311665835e-05, + "loss": 0.3955, + "step": 2394 + }, + { + "epoch": 0.19, + "learning_rate": 1.8691516578005426e-05, + "loss": 0.4042, + "step": 2395 + }, + { + "epoch": 0.19, + "learning_rate": 1.8690247272050474e-05, + "loss": 0.3681, + "step": 2396 + }, + { + "epoch": 0.19, + "learning_rate": 1.8688977393884555e-05, + "loss": 0.3663, + "step": 2397 + }, + { + "epoch": 0.19, + "learning_rate": 1.868770694359128e-05, + "loss": 0.417, + "step": 2398 + }, + { + "epoch": 0.19, + "learning_rate": 1.868643592125431e-05, + "loss": 0.3878, + "step": 2399 + }, + { + "epoch": 0.19, + "learning_rate": 1.8685164326957327e-05, + "loss": 0.5457, + "step": 2400 + }, + { + "epoch": 0.19, + "learning_rate": 1.8683892160784066e-05, + "loss": 0.3804, + "step": 2401 + }, + { + "epoch": 0.19, + "learning_rate": 1.868261942281829e-05, + "loss": 0.4675, + "step": 2402 + }, + { + "epoch": 0.19, + "learning_rate": 1.86813461131438e-05, + "loss": 0.4056, + "step": 2403 + }, + { + "epoch": 0.19, + "learning_rate": 1.8680072231844445e-05, + "loss": 0.3926, + "step": 2404 + }, + { + "epoch": 0.19, + "learning_rate": 1.8678797779004096e-05, + "loss": 0.2684, + "step": 2405 + }, + { + "epoch": 0.19, + "learning_rate": 1.8677522754706677e-05, + "loss": 0.4331, + "step": 2406 + }, + { + "epoch": 0.19, + "learning_rate": 1.8676247159036132e-05, + "loss": 0.4639, + "step": 2407 + }, + { + "epoch": 0.19, + "learning_rate": 1.8674970992076465e-05, + "loss": 0.382, + "step": 2408 + }, + { + "epoch": 0.19, + "learning_rate": 1.8673694253911696e-05, + "loss": 0.5268, + "step": 2409 + }, + { + "epoch": 0.19, + "learning_rate": 1.8672416944625896e-05, + "loss": 0.4804, + "step": 2410 + }, + { + "epoch": 0.19, + "learning_rate": 1.867113906430317e-05, + "loss": 0.4275, + "step": 2411 + }, + { + "epoch": 0.19, + "learning_rate": 1.8669860613027657e-05, + "loss": 0.3808, + "step": 2412 + }, + { + "epoch": 0.19, + "learning_rate": 1.8668581590883544e-05, + "loss": 0.5052, + "step": 2413 + }, + { + "epoch": 0.19, + "learning_rate": 1.8667301997955038e-05, + "loss": 0.4576, + "step": 2414 + }, + { + "epoch": 0.19, + "learning_rate": 1.8666021834326404e-05, + "loss": 0.4326, + "step": 2415 + }, + { + "epoch": 0.19, + "learning_rate": 1.866474110008193e-05, + "loss": 0.4057, + "step": 2416 + }, + { + "epoch": 0.19, + "learning_rate": 1.8663459795305946e-05, + "loss": 0.3775, + "step": 2417 + }, + { + "epoch": 0.19, + "learning_rate": 1.866217792008282e-05, + "loss": 0.4766, + "step": 2418 + }, + { + "epoch": 0.19, + "learning_rate": 1.866089547449696e-05, + "loss": 0.3622, + "step": 2419 + }, + { + "epoch": 0.19, + "learning_rate": 1.8659612458632802e-05, + "loss": 0.3943, + "step": 2420 + }, + { + "epoch": 0.19, + "learning_rate": 1.8658328872574833e-05, + "loss": 0.3362, + "step": 2421 + }, + { + "epoch": 0.19, + "learning_rate": 1.8657044716407573e-05, + "loss": 0.3819, + "step": 2422 + }, + { + "epoch": 0.19, + "learning_rate": 1.865575999021557e-05, + "loss": 0.5336, + "step": 2423 + }, + { + "epoch": 0.19, + "learning_rate": 1.8654474694083416e-05, + "loss": 0.5121, + "step": 2424 + }, + { + "epoch": 0.19, + "learning_rate": 1.8653188828095754e-05, + "loss": 0.4331, + "step": 2425 + }, + { + "epoch": 0.19, + "learning_rate": 1.865190239233724e-05, + "loss": 0.4301, + "step": 2426 + }, + { + "epoch": 0.19, + "learning_rate": 1.8650615386892587e-05, + "loss": 0.4443, + "step": 2427 + }, + { + "epoch": 0.19, + "learning_rate": 1.8649327811846533e-05, + "loss": 0.558, + "step": 2428 + }, + { + "epoch": 0.19, + "learning_rate": 1.8648039667283857e-05, + "loss": 0.4069, + "step": 2429 + }, + { + "epoch": 0.19, + "learning_rate": 1.8646750953289384e-05, + "loss": 0.351, + "step": 2430 + }, + { + "epoch": 0.19, + "learning_rate": 1.8645461669947966e-05, + "loss": 0.376, + "step": 2431 + }, + { + "epoch": 0.19, + "learning_rate": 1.8644171817344497e-05, + "loss": 0.4366, + "step": 2432 + }, + { + "epoch": 0.19, + "learning_rate": 1.8642881395563904e-05, + "loss": 0.3572, + "step": 2433 + }, + { + "epoch": 0.19, + "learning_rate": 1.864159040469116e-05, + "loss": 0.4239, + "step": 2434 + }, + { + "epoch": 0.19, + "learning_rate": 1.864029884481127e-05, + "loss": 0.4271, + "step": 2435 + }, + { + "epoch": 0.19, + "learning_rate": 1.8639006716009275e-05, + "loss": 0.4268, + "step": 2436 + }, + { + "epoch": 0.19, + "learning_rate": 1.8637714018370255e-05, + "loss": 0.4089, + "step": 2437 + }, + { + "epoch": 0.19, + "learning_rate": 1.8636420751979328e-05, + "loss": 0.4266, + "step": 2438 + }, + { + "epoch": 0.19, + "learning_rate": 1.863512691692165e-05, + "loss": 0.4105, + "step": 2439 + }, + { + "epoch": 0.19, + "learning_rate": 1.863383251328242e-05, + "loss": 0.3561, + "step": 2440 + }, + { + "epoch": 0.19, + "learning_rate": 1.8632537541146856e-05, + "loss": 0.3142, + "step": 2441 + }, + { + "epoch": 0.19, + "learning_rate": 1.8631242000600235e-05, + "loss": 0.4712, + "step": 2442 + }, + { + "epoch": 0.19, + "learning_rate": 1.8629945891727856e-05, + "loss": 0.4438, + "step": 2443 + }, + { + "epoch": 0.19, + "learning_rate": 1.8628649214615066e-05, + "loss": 0.3738, + "step": 2444 + }, + { + "epoch": 0.19, + "learning_rate": 1.8627351969347246e-05, + "loss": 0.3863, + "step": 2445 + }, + { + "epoch": 0.19, + "learning_rate": 1.8626054156009807e-05, + "loss": 0.4617, + "step": 2446 + }, + { + "epoch": 0.19, + "learning_rate": 1.862475577468821e-05, + "loss": 0.4225, + "step": 2447 + }, + { + "epoch": 0.19, + "learning_rate": 1.8623456825467948e-05, + "loss": 0.4789, + "step": 2448 + }, + { + "epoch": 0.19, + "learning_rate": 1.8622157308434544e-05, + "loss": 0.4229, + "step": 2449 + }, + { + "epoch": 0.19, + "learning_rate": 1.8620857223673567e-05, + "loss": 0.5003, + "step": 2450 + }, + { + "epoch": 0.19, + "learning_rate": 1.8619556571270624e-05, + "loss": 0.332, + "step": 2451 + }, + { + "epoch": 0.19, + "learning_rate": 1.8618255351311355e-05, + "loss": 0.4138, + "step": 2452 + }, + { + "epoch": 0.19, + "learning_rate": 1.8616953563881444e-05, + "loss": 0.3629, + "step": 2453 + }, + { + "epoch": 0.19, + "learning_rate": 1.8615651209066598e-05, + "loss": 0.3723, + "step": 2454 + }, + { + "epoch": 0.19, + "learning_rate": 1.8614348286952577e-05, + "loss": 0.396, + "step": 2455 + }, + { + "epoch": 0.19, + "learning_rate": 1.8613044797625173e-05, + "loss": 0.3353, + "step": 2456 + }, + { + "epoch": 0.19, + "learning_rate": 1.861174074117021e-05, + "loss": 0.3989, + "step": 2457 + }, + { + "epoch": 0.19, + "learning_rate": 1.8610436117673557e-05, + "loss": 0.381, + "step": 2458 + }, + { + "epoch": 0.19, + "learning_rate": 1.8609130927221116e-05, + "loss": 0.3954, + "step": 2459 + }, + { + "epoch": 0.19, + "learning_rate": 1.8607825169898827e-05, + "loss": 0.4202, + "step": 2460 + }, + { + "epoch": 0.19, + "learning_rate": 1.8606518845792672e-05, + "loss": 0.5616, + "step": 2461 + }, + { + "epoch": 0.2, + "learning_rate": 1.860521195498866e-05, + "loss": 0.4234, + "step": 2462 + }, + { + "epoch": 0.2, + "learning_rate": 1.8603904497572846e-05, + "loss": 0.2844, + "step": 2463 + }, + { + "epoch": 0.2, + "learning_rate": 1.8602596473631323e-05, + "loss": 0.466, + "step": 2464 + }, + { + "epoch": 0.2, + "learning_rate": 1.8601287883250215e-05, + "loss": 0.3733, + "step": 2465 + }, + { + "epoch": 0.2, + "learning_rate": 1.8599978726515685e-05, + "loss": 0.2443, + "step": 2466 + }, + { + "epoch": 0.2, + "learning_rate": 1.8598669003513934e-05, + "loss": 0.4375, + "step": 2467 + }, + { + "epoch": 0.2, + "learning_rate": 1.8597358714331207e-05, + "loss": 0.3611, + "step": 2468 + }, + { + "epoch": 0.2, + "learning_rate": 1.8596047859053776e-05, + "loss": 0.4305, + "step": 2469 + }, + { + "epoch": 0.2, + "learning_rate": 1.8594736437767954e-05, + "loss": 0.5194, + "step": 2470 + }, + { + "epoch": 0.2, + "learning_rate": 1.8593424450560094e-05, + "loss": 0.5188, + "step": 2471 + }, + { + "epoch": 0.2, + "learning_rate": 1.8592111897516583e-05, + "loss": 0.3487, + "step": 2472 + }, + { + "epoch": 0.2, + "learning_rate": 1.8590798778723843e-05, + "loss": 0.4964, + "step": 2473 + }, + { + "epoch": 0.2, + "learning_rate": 1.8589485094268344e-05, + "loss": 0.3977, + "step": 2474 + }, + { + "epoch": 0.2, + "learning_rate": 1.858817084423658e-05, + "loss": 0.404, + "step": 2475 + }, + { + "epoch": 0.2, + "learning_rate": 1.8586856028715087e-05, + "loss": 0.5014, + "step": 2476 + }, + { + "epoch": 0.2, + "learning_rate": 1.8585540647790445e-05, + "loss": 0.4108, + "step": 2477 + }, + { + "epoch": 0.2, + "learning_rate": 1.858422470154926e-05, + "loss": 0.4102, + "step": 2478 + }, + { + "epoch": 0.2, + "learning_rate": 1.8582908190078184e-05, + "loss": 0.6096, + "step": 2479 + }, + { + "epoch": 0.2, + "learning_rate": 1.8581591113463903e-05, + "loss": 0.5449, + "step": 2480 + }, + { + "epoch": 0.2, + "learning_rate": 1.858027347179314e-05, + "loss": 0.4717, + "step": 2481 + }, + { + "epoch": 0.2, + "learning_rate": 1.8578955265152652e-05, + "loss": 0.4211, + "step": 2482 + }, + { + "epoch": 0.2, + "learning_rate": 1.857763649362924e-05, + "loss": 0.5112, + "step": 2483 + }, + { + "epoch": 0.2, + "learning_rate": 1.857631715730974e-05, + "loss": 0.4761, + "step": 2484 + }, + { + "epoch": 0.2, + "learning_rate": 1.857499725628102e-05, + "loss": 0.3738, + "step": 2485 + }, + { + "epoch": 0.2, + "learning_rate": 1.8573676790629988e-05, + "loss": 0.3031, + "step": 2486 + }, + { + "epoch": 0.2, + "learning_rate": 1.8572355760443597e-05, + "loss": 0.3071, + "step": 2487 + }, + { + "epoch": 0.2, + "learning_rate": 1.8571034165808826e-05, + "loss": 0.3395, + "step": 2488 + }, + { + "epoch": 0.2, + "learning_rate": 1.85697120068127e-05, + "loss": 0.2864, + "step": 2489 + }, + { + "epoch": 0.2, + "learning_rate": 1.8568389283542263e-05, + "loss": 0.5133, + "step": 2490 + }, + { + "epoch": 0.2, + "learning_rate": 1.8567065996084628e-05, + "loss": 0.4333, + "step": 2491 + }, + { + "epoch": 0.2, + "learning_rate": 1.8565742144526917e-05, + "loss": 0.491, + "step": 2492 + }, + { + "epoch": 0.2, + "learning_rate": 1.85644177289563e-05, + "loss": 0.3917, + "step": 2493 + }, + { + "epoch": 0.2, + "learning_rate": 1.856309274945999e-05, + "loss": 0.3078, + "step": 2494 + }, + { + "epoch": 0.2, + "learning_rate": 1.8561767206125223e-05, + "loss": 0.375, + "step": 2495 + }, + { + "epoch": 0.2, + "learning_rate": 1.856044109903928e-05, + "loss": 0.474, + "step": 2496 + }, + { + "epoch": 0.2, + "learning_rate": 1.8559114428289482e-05, + "loss": 0.505, + "step": 2497 + }, + { + "epoch": 0.2, + "learning_rate": 1.8557787193963184e-05, + "loss": 0.4237, + "step": 2498 + }, + { + "epoch": 0.2, + "learning_rate": 1.8556459396147777e-05, + "loss": 0.4633, + "step": 2499 + }, + { + "epoch": 0.2, + "learning_rate": 1.8555131034930686e-05, + "loss": 0.4603, + "step": 2500 + }, + { + "epoch": 0.2, + "learning_rate": 1.8553802110399385e-05, + "loss": 0.3922, + "step": 2501 + }, + { + "epoch": 0.2, + "learning_rate": 1.8552472622641372e-05, + "loss": 0.3466, + "step": 2502 + }, + { + "epoch": 0.2, + "learning_rate": 1.8551142571744188e-05, + "loss": 0.5659, + "step": 2503 + }, + { + "epoch": 0.2, + "learning_rate": 1.854981195779541e-05, + "loss": 0.3675, + "step": 2504 + }, + { + "epoch": 0.2, + "learning_rate": 1.8548480780882658e-05, + "loss": 0.4471, + "step": 2505 + }, + { + "epoch": 0.2, + "learning_rate": 1.8547149041093574e-05, + "loss": 0.4304, + "step": 2506 + }, + { + "epoch": 0.2, + "learning_rate": 1.8545816738515855e-05, + "loss": 0.3701, + "step": 2507 + }, + { + "epoch": 0.2, + "learning_rate": 1.854448387323722e-05, + "loss": 0.3494, + "step": 2508 + }, + { + "epoch": 0.2, + "learning_rate": 1.8543150445345443e-05, + "loss": 0.383, + "step": 2509 + }, + { + "epoch": 0.2, + "learning_rate": 1.854181645492831e-05, + "loss": 0.3666, + "step": 2510 + }, + { + "epoch": 0.2, + "learning_rate": 1.8540481902073664e-05, + "loss": 0.4269, + "step": 2511 + }, + { + "epoch": 0.2, + "learning_rate": 1.8539146786869385e-05, + "loss": 0.485, + "step": 2512 + }, + { + "epoch": 0.2, + "learning_rate": 1.8537811109403372e-05, + "loss": 0.3052, + "step": 2513 + }, + { + "epoch": 0.2, + "learning_rate": 1.853647486976358e-05, + "loss": 0.5222, + "step": 2514 + }, + { + "epoch": 0.2, + "learning_rate": 1.8535138068037995e-05, + "loss": 0.378, + "step": 2515 + }, + { + "epoch": 0.2, + "learning_rate": 1.8533800704314633e-05, + "loss": 0.5193, + "step": 2516 + }, + { + "epoch": 0.2, + "learning_rate": 1.8532462778681558e-05, + "loss": 0.3425, + "step": 2517 + }, + { + "epoch": 0.2, + "learning_rate": 1.8531124291226866e-05, + "loss": 0.3583, + "step": 2518 + }, + { + "epoch": 0.2, + "learning_rate": 1.8529785242038688e-05, + "loss": 0.4077, + "step": 2519 + }, + { + "epoch": 0.2, + "learning_rate": 1.8528445631205195e-05, + "loss": 0.3931, + "step": 2520 + }, + { + "epoch": 0.2, + "learning_rate": 1.852710545881459e-05, + "loss": 0.4159, + "step": 2521 + }, + { + "epoch": 0.2, + "learning_rate": 1.8525764724955123e-05, + "loss": 0.4381, + "step": 2522 + }, + { + "epoch": 0.2, + "learning_rate": 1.8524423429715072e-05, + "loss": 0.3187, + "step": 2523 + }, + { + "epoch": 0.2, + "learning_rate": 1.8523081573182754e-05, + "loss": 0.4014, + "step": 2524 + }, + { + "epoch": 0.2, + "learning_rate": 1.8521739155446527e-05, + "loss": 0.4562, + "step": 2525 + }, + { + "epoch": 0.2, + "learning_rate": 1.852039617659478e-05, + "loss": 0.3336, + "step": 2526 + }, + { + "epoch": 0.2, + "learning_rate": 1.851905263671594e-05, + "loss": 0.396, + "step": 2527 + }, + { + "epoch": 0.2, + "learning_rate": 1.8517708535898477e-05, + "loss": 0.3941, + "step": 2528 + }, + { + "epoch": 0.2, + "learning_rate": 1.851636387423089e-05, + "loss": 0.323, + "step": 2529 + }, + { + "epoch": 0.2, + "learning_rate": 1.8515018651801723e-05, + "loss": 0.4142, + "step": 2530 + }, + { + "epoch": 0.2, + "learning_rate": 1.8513672868699547e-05, + "loss": 0.4074, + "step": 2531 + }, + { + "epoch": 0.2, + "learning_rate": 1.851232652501298e-05, + "loss": 0.2521, + "step": 2532 + }, + { + "epoch": 0.2, + "learning_rate": 1.851097962083067e-05, + "loss": 0.4501, + "step": 2533 + }, + { + "epoch": 0.2, + "learning_rate": 1.85096321562413e-05, + "loss": 0.3417, + "step": 2534 + }, + { + "epoch": 0.2, + "learning_rate": 1.8508284131333604e-05, + "loss": 0.4009, + "step": 2535 + }, + { + "epoch": 0.2, + "learning_rate": 1.850693554619633e-05, + "loss": 0.4421, + "step": 2536 + }, + { + "epoch": 0.2, + "learning_rate": 1.8505586400918288e-05, + "loss": 0.4176, + "step": 2537 + }, + { + "epoch": 0.2, + "learning_rate": 1.8504236695588308e-05, + "loss": 0.3623, + "step": 2538 + }, + { + "epoch": 0.2, + "learning_rate": 1.8502886430295262e-05, + "loss": 0.4448, + "step": 2539 + }, + { + "epoch": 0.2, + "learning_rate": 1.8501535605128054e-05, + "loss": 0.2763, + "step": 2540 + }, + { + "epoch": 0.2, + "learning_rate": 1.8500184220175636e-05, + "loss": 0.4208, + "step": 2541 + }, + { + "epoch": 0.2, + "learning_rate": 1.8498832275526988e-05, + "loss": 0.4382, + "step": 2542 + }, + { + "epoch": 0.2, + "learning_rate": 1.8497479771271125e-05, + "loss": 0.3727, + "step": 2543 + }, + { + "epoch": 0.2, + "learning_rate": 1.8496126707497112e-05, + "loss": 0.4216, + "step": 2544 + }, + { + "epoch": 0.2, + "learning_rate": 1.849477308429403e-05, + "loss": 0.3728, + "step": 2545 + }, + { + "epoch": 0.2, + "learning_rate": 1.8493418901751016e-05, + "loss": 0.4859, + "step": 2546 + }, + { + "epoch": 0.2, + "learning_rate": 1.849206415995724e-05, + "loss": 0.4352, + "step": 2547 + }, + { + "epoch": 0.2, + "learning_rate": 1.8490708859001896e-05, + "loss": 0.4603, + "step": 2548 + }, + { + "epoch": 0.2, + "learning_rate": 1.8489352998974227e-05, + "loss": 0.4223, + "step": 2549 + }, + { + "epoch": 0.2, + "learning_rate": 1.8487996579963515e-05, + "loss": 0.4468, + "step": 2550 + }, + { + "epoch": 0.2, + "learning_rate": 1.8486639602059066e-05, + "loss": 0.4122, + "step": 2551 + }, + { + "epoch": 0.2, + "learning_rate": 1.8485282065350237e-05, + "loss": 0.3851, + "step": 2552 + }, + { + "epoch": 0.2, + "learning_rate": 1.848392396992641e-05, + "loss": 0.3064, + "step": 2553 + }, + { + "epoch": 0.2, + "learning_rate": 1.8482565315877013e-05, + "loss": 0.4224, + "step": 2554 + }, + { + "epoch": 0.2, + "learning_rate": 1.8481206103291506e-05, + "loss": 0.4188, + "step": 2555 + }, + { + "epoch": 0.2, + "learning_rate": 1.8479846332259388e-05, + "loss": 0.4198, + "step": 2556 + }, + { + "epoch": 0.2, + "learning_rate": 1.847848600287019e-05, + "loss": 0.5132, + "step": 2557 + }, + { + "epoch": 0.2, + "learning_rate": 1.8477125115213484e-05, + "loss": 0.4505, + "step": 2558 + }, + { + "epoch": 0.2, + "learning_rate": 1.8475763669378878e-05, + "loss": 0.4718, + "step": 2559 + }, + { + "epoch": 0.2, + "learning_rate": 1.8474401665456016e-05, + "loss": 0.3125, + "step": 2560 + }, + { + "epoch": 0.2, + "learning_rate": 1.8473039103534583e-05, + "loss": 0.3936, + "step": 2561 + }, + { + "epoch": 0.2, + "learning_rate": 1.8471675983704295e-05, + "loss": 0.4666, + "step": 2562 + }, + { + "epoch": 0.2, + "learning_rate": 1.8470312306054903e-05, + "loss": 0.4, + "step": 2563 + }, + { + "epoch": 0.2, + "learning_rate": 1.8468948070676205e-05, + "loss": 0.3648, + "step": 2564 + }, + { + "epoch": 0.2, + "learning_rate": 1.8467583277658026e-05, + "loss": 0.3383, + "step": 2565 + }, + { + "epoch": 0.2, + "learning_rate": 1.8466217927090232e-05, + "loss": 0.33, + "step": 2566 + }, + { + "epoch": 0.2, + "learning_rate": 1.8464852019062726e-05, + "loss": 0.4527, + "step": 2567 + }, + { + "epoch": 0.2, + "learning_rate": 1.846348555366544e-05, + "loss": 0.3415, + "step": 2568 + }, + { + "epoch": 0.2, + "learning_rate": 1.8462118530988356e-05, + "loss": 0.5194, + "step": 2569 + }, + { + "epoch": 0.2, + "learning_rate": 1.8460750951121487e-05, + "loss": 0.4831, + "step": 2570 + }, + { + "epoch": 0.2, + "learning_rate": 1.8459382814154874e-05, + "loss": 0.4049, + "step": 2571 + }, + { + "epoch": 0.2, + "learning_rate": 1.845801412017861e-05, + "loss": 0.3519, + "step": 2572 + }, + { + "epoch": 0.2, + "learning_rate": 1.845664486928281e-05, + "loss": 0.449, + "step": 2573 + }, + { + "epoch": 0.2, + "learning_rate": 1.8455275061557643e-05, + "loss": 0.3235, + "step": 2574 + }, + { + "epoch": 0.2, + "learning_rate": 1.845390469709329e-05, + "loss": 0.3707, + "step": 2575 + }, + { + "epoch": 0.2, + "learning_rate": 1.8452533775979992e-05, + "loss": 0.3542, + "step": 2576 + }, + { + "epoch": 0.2, + "learning_rate": 1.845116229830802e-05, + "loss": 0.3638, + "step": 2577 + }, + { + "epoch": 0.2, + "learning_rate": 1.8449790264167672e-05, + "loss": 0.3391, + "step": 2578 + }, + { + "epoch": 0.2, + "learning_rate": 1.8448417673649292e-05, + "loss": 0.5309, + "step": 2579 + }, + { + "epoch": 0.2, + "learning_rate": 1.844704452684326e-05, + "loss": 0.418, + "step": 2580 + }, + { + "epoch": 0.2, + "learning_rate": 1.844567082383999e-05, + "loss": 0.4223, + "step": 2581 + }, + { + "epoch": 0.2, + "learning_rate": 1.8444296564729935e-05, + "loss": 0.509, + "step": 2582 + }, + { + "epoch": 0.2, + "learning_rate": 1.8442921749603586e-05, + "loss": 0.394, + "step": 2583 + }, + { + "epoch": 0.2, + "learning_rate": 1.8441546378551457e-05, + "loss": 0.4389, + "step": 2584 + }, + { + "epoch": 0.2, + "learning_rate": 1.8440170451664122e-05, + "loss": 0.4306, + "step": 2585 + }, + { + "epoch": 0.2, + "learning_rate": 1.8438793969032175e-05, + "loss": 0.48, + "step": 2586 + }, + { + "epoch": 0.2, + "learning_rate": 1.8437416930746248e-05, + "loss": 0.4074, + "step": 2587 + }, + { + "epoch": 0.21, + "learning_rate": 1.8436039336897015e-05, + "loss": 0.2581, + "step": 2588 + }, + { + "epoch": 0.21, + "learning_rate": 1.8434661187575183e-05, + "loss": 0.4802, + "step": 2589 + }, + { + "epoch": 0.21, + "learning_rate": 1.8433282482871497e-05, + "loss": 0.4264, + "step": 2590 + }, + { + "epoch": 0.21, + "learning_rate": 1.8431903222876737e-05, + "loss": 0.4158, + "step": 2591 + }, + { + "epoch": 0.21, + "learning_rate": 1.8430523407681723e-05, + "loss": 0.4058, + "step": 2592 + }, + { + "epoch": 0.21, + "learning_rate": 1.8429143037377305e-05, + "loss": 0.4315, + "step": 2593 + }, + { + "epoch": 0.21, + "learning_rate": 1.8427762112054378e-05, + "loss": 0.4494, + "step": 2594 + }, + { + "epoch": 0.21, + "learning_rate": 1.842638063180387e-05, + "loss": 0.3714, + "step": 2595 + }, + { + "epoch": 0.21, + "learning_rate": 1.8424998596716743e-05, + "loss": 0.4224, + "step": 2596 + }, + { + "epoch": 0.21, + "learning_rate": 1.8423616006883994e-05, + "loss": 0.3437, + "step": 2597 + }, + { + "epoch": 0.21, + "learning_rate": 1.8422232862396663e-05, + "loss": 0.3527, + "step": 2598 + }, + { + "epoch": 0.21, + "learning_rate": 1.8420849163345824e-05, + "loss": 0.4356, + "step": 2599 + }, + { + "epoch": 0.21, + "learning_rate": 1.8419464909822585e-05, + "loss": 0.4464, + "step": 2600 + }, + { + "epoch": 0.21, + "learning_rate": 1.8418080101918095e-05, + "loss": 0.4478, + "step": 2601 + }, + { + "epoch": 0.21, + "learning_rate": 1.8416694739723535e-05, + "loss": 0.3835, + "step": 2602 + }, + { + "epoch": 0.21, + "learning_rate": 1.841530882333012e-05, + "loss": 0.4936, + "step": 2603 + }, + { + "epoch": 0.21, + "learning_rate": 1.8413922352829118e-05, + "loss": 0.4094, + "step": 2604 + }, + { + "epoch": 0.21, + "learning_rate": 1.8412535328311813e-05, + "loss": 0.355, + "step": 2605 + }, + { + "epoch": 0.21, + "learning_rate": 1.8411147749869536e-05, + "loss": 0.3142, + "step": 2606 + }, + { + "epoch": 0.21, + "learning_rate": 1.840975961759365e-05, + "loss": 0.4102, + "step": 2607 + }, + { + "epoch": 0.21, + "learning_rate": 1.8408370931575556e-05, + "loss": 0.3809, + "step": 2608 + }, + { + "epoch": 0.21, + "learning_rate": 1.84069816919067e-05, + "loss": 0.3693, + "step": 2609 + }, + { + "epoch": 0.21, + "learning_rate": 1.8405591898678546e-05, + "loss": 0.4487, + "step": 2610 + }, + { + "epoch": 0.21, + "learning_rate": 1.8404201551982612e-05, + "loss": 0.5515, + "step": 2611 + }, + { + "epoch": 0.21, + "learning_rate": 1.8402810651910444e-05, + "loss": 0.3384, + "step": 2612 + }, + { + "epoch": 0.21, + "learning_rate": 1.840141919855363e-05, + "loss": 0.5313, + "step": 2613 + }, + { + "epoch": 0.21, + "learning_rate": 1.8400027192003782e-05, + "loss": 0.4097, + "step": 2614 + }, + { + "epoch": 0.21, + "learning_rate": 1.8398634632352562e-05, + "loss": 0.4316, + "step": 2615 + }, + { + "epoch": 0.21, + "learning_rate": 1.8397241519691667e-05, + "loss": 0.3866, + "step": 2616 + }, + { + "epoch": 0.21, + "learning_rate": 1.839584785411282e-05, + "loss": 0.3741, + "step": 2617 + }, + { + "epoch": 0.21, + "learning_rate": 1.839445363570779e-05, + "loss": 0.3391, + "step": 2618 + }, + { + "epoch": 0.21, + "learning_rate": 1.8393058864568383e-05, + "loss": 0.3665, + "step": 2619 + }, + { + "epoch": 0.21, + "learning_rate": 1.839166354078643e-05, + "loss": 0.3865, + "step": 2620 + }, + { + "epoch": 0.21, + "learning_rate": 1.8390267664453815e-05, + "loss": 0.4856, + "step": 2621 + }, + { + "epoch": 0.21, + "learning_rate": 1.8388871235662442e-05, + "loss": 0.3268, + "step": 2622 + }, + { + "epoch": 0.21, + "learning_rate": 1.8387474254504265e-05, + "loss": 0.3783, + "step": 2623 + }, + { + "epoch": 0.21, + "learning_rate": 1.8386076721071265e-05, + "loss": 0.5544, + "step": 2624 + }, + { + "epoch": 0.21, + "learning_rate": 1.8384678635455467e-05, + "loss": 0.3742, + "step": 2625 + }, + { + "epoch": 0.21, + "learning_rate": 1.838327999774892e-05, + "loss": 0.321, + "step": 2626 + }, + { + "epoch": 0.21, + "learning_rate": 1.838188080804373e-05, + "loss": 0.4016, + "step": 2627 + }, + { + "epoch": 0.21, + "learning_rate": 1.8380481066432014e-05, + "loss": 0.4145, + "step": 2628 + }, + { + "epoch": 0.21, + "learning_rate": 1.8379080773005947e-05, + "loss": 0.4047, + "step": 2629 + }, + { + "epoch": 0.21, + "learning_rate": 1.8377679927857727e-05, + "loss": 0.3722, + "step": 2630 + }, + { + "epoch": 0.21, + "learning_rate": 1.8376278531079594e-05, + "loss": 0.3649, + "step": 2631 + }, + { + "epoch": 0.21, + "learning_rate": 1.8374876582763828e-05, + "loss": 0.3615, + "step": 2632 + }, + { + "epoch": 0.21, + "learning_rate": 1.8373474083002732e-05, + "loss": 0.5294, + "step": 2633 + }, + { + "epoch": 0.21, + "learning_rate": 1.837207103188866e-05, + "loss": 0.3572, + "step": 2634 + }, + { + "epoch": 0.21, + "learning_rate": 1.8370667429513992e-05, + "loss": 0.3513, + "step": 2635 + }, + { + "epoch": 0.21, + "learning_rate": 1.8369263275971153e-05, + "loss": 0.4933, + "step": 2636 + }, + { + "epoch": 0.21, + "learning_rate": 1.8367858571352603e-05, + "loss": 0.394, + "step": 2637 + }, + { + "epoch": 0.21, + "learning_rate": 1.8366453315750822e-05, + "loss": 0.4345, + "step": 2638 + }, + { + "epoch": 0.21, + "learning_rate": 1.8365047509258346e-05, + "loss": 0.48, + "step": 2639 + }, + { + "epoch": 0.21, + "learning_rate": 1.8363641151967747e-05, + "loss": 0.4377, + "step": 2640 + }, + { + "epoch": 0.21, + "learning_rate": 1.836223424397162e-05, + "loss": 0.333, + "step": 2641 + }, + { + "epoch": 0.21, + "learning_rate": 1.8360826785362603e-05, + "loss": 0.4331, + "step": 2642 + }, + { + "epoch": 0.21, + "learning_rate": 1.835941877623337e-05, + "loss": 0.3781, + "step": 2643 + }, + { + "epoch": 0.21, + "learning_rate": 1.835801021667664e-05, + "loss": 0.3103, + "step": 2644 + }, + { + "epoch": 0.21, + "learning_rate": 1.8356601106785148e-05, + "loss": 0.5003, + "step": 2645 + }, + { + "epoch": 0.21, + "learning_rate": 1.8355191446651687e-05, + "loss": 0.3469, + "step": 2646 + }, + { + "epoch": 0.21, + "learning_rate": 1.8353781236369065e-05, + "loss": 0.3918, + "step": 2647 + }, + { + "epoch": 0.21, + "learning_rate": 1.8352370476030147e-05, + "loss": 0.3908, + "step": 2648 + }, + { + "epoch": 0.21, + "learning_rate": 1.8350959165727826e-05, + "loss": 0.3591, + "step": 2649 + }, + { + "epoch": 0.21, + "learning_rate": 1.8349547305555023e-05, + "loss": 0.2727, + "step": 2650 + }, + { + "epoch": 0.21, + "learning_rate": 1.8348134895604708e-05, + "loss": 0.3965, + "step": 2651 + }, + { + "epoch": 0.21, + "learning_rate": 1.8346721935969878e-05, + "loss": 0.4042, + "step": 2652 + }, + { + "epoch": 0.21, + "learning_rate": 1.8345308426743568e-05, + "loss": 0.3886, + "step": 2653 + }, + { + "epoch": 0.21, + "learning_rate": 1.8343894368018854e-05, + "loss": 0.4656, + "step": 2654 + }, + { + "epoch": 0.21, + "learning_rate": 1.8342479759888844e-05, + "loss": 0.313, + "step": 2655 + }, + { + "epoch": 0.21, + "learning_rate": 1.8341064602446686e-05, + "loss": 0.4428, + "step": 2656 + }, + { + "epoch": 0.21, + "learning_rate": 1.8339648895785556e-05, + "loss": 0.3032, + "step": 2657 + }, + { + "epoch": 0.21, + "learning_rate": 1.8338232639998672e-05, + "loss": 0.3008, + "step": 2658 + }, + { + "epoch": 0.21, + "learning_rate": 1.8336815835179295e-05, + "loss": 0.3534, + "step": 2659 + }, + { + "epoch": 0.21, + "learning_rate": 1.8335398481420705e-05, + "loss": 0.407, + "step": 2660 + }, + { + "epoch": 0.21, + "learning_rate": 1.8333980578816234e-05, + "loss": 0.543, + "step": 2661 + }, + { + "epoch": 0.21, + "learning_rate": 1.8332562127459242e-05, + "loss": 0.4436, + "step": 2662 + }, + { + "epoch": 0.21, + "learning_rate": 1.833114312744313e-05, + "loss": 0.4423, + "step": 2663 + }, + { + "epoch": 0.21, + "learning_rate": 1.8329723578861328e-05, + "loss": 0.314, + "step": 2664 + }, + { + "epoch": 0.21, + "learning_rate": 1.8328303481807306e-05, + "loss": 0.3519, + "step": 2665 + }, + { + "epoch": 0.21, + "learning_rate": 1.832688283637458e-05, + "loss": 0.3145, + "step": 2666 + }, + { + "epoch": 0.21, + "learning_rate": 1.8325461642656676e-05, + "loss": 0.2871, + "step": 2667 + }, + { + "epoch": 0.21, + "learning_rate": 1.832403990074719e-05, + "loss": 0.2951, + "step": 2668 + }, + { + "epoch": 0.21, + "learning_rate": 1.8322617610739726e-05, + "loss": 0.3693, + "step": 2669 + }, + { + "epoch": 0.21, + "learning_rate": 1.8321194772727938e-05, + "loss": 0.339, + "step": 2670 + }, + { + "epoch": 0.21, + "learning_rate": 1.8319771386805514e-05, + "loss": 0.3601, + "step": 2671 + }, + { + "epoch": 0.21, + "learning_rate": 1.8318347453066176e-05, + "loss": 0.3389, + "step": 2672 + }, + { + "epoch": 0.21, + "learning_rate": 1.8316922971603685e-05, + "loss": 0.394, + "step": 2673 + }, + { + "epoch": 0.21, + "learning_rate": 1.8315497942511836e-05, + "loss": 0.4483, + "step": 2674 + }, + { + "epoch": 0.21, + "learning_rate": 1.8314072365884455e-05, + "loss": 0.3682, + "step": 2675 + }, + { + "epoch": 0.21, + "learning_rate": 1.831264624181542e-05, + "loss": 0.4039, + "step": 2676 + }, + { + "epoch": 0.21, + "learning_rate": 1.8311219570398618e-05, + "loss": 0.4199, + "step": 2677 + }, + { + "epoch": 0.21, + "learning_rate": 1.8309792351728006e-05, + "loss": 0.3453, + "step": 2678 + }, + { + "epoch": 0.21, + "learning_rate": 1.830836458589755e-05, + "loss": 0.5116, + "step": 2679 + }, + { + "epoch": 0.21, + "learning_rate": 1.8306936273001258e-05, + "loss": 0.4464, + "step": 2680 + }, + { + "epoch": 0.21, + "learning_rate": 1.830550741313319e-05, + "loss": 0.3929, + "step": 2681 + }, + { + "epoch": 0.21, + "learning_rate": 1.830407800638742e-05, + "loss": 0.3781, + "step": 2682 + }, + { + "epoch": 0.21, + "learning_rate": 1.830264805285807e-05, + "loss": 0.3904, + "step": 2683 + }, + { + "epoch": 0.21, + "learning_rate": 1.8301217552639294e-05, + "loss": 0.3835, + "step": 2684 + }, + { + "epoch": 0.21, + "learning_rate": 1.8299786505825286e-05, + "loss": 0.4283, + "step": 2685 + }, + { + "epoch": 0.21, + "learning_rate": 1.8298354912510273e-05, + "loss": 0.3648, + "step": 2686 + }, + { + "epoch": 0.21, + "learning_rate": 1.8296922772788522e-05, + "loss": 0.4264, + "step": 2687 + }, + { + "epoch": 0.21, + "learning_rate": 1.8295490086754325e-05, + "loss": 0.4635, + "step": 2688 + }, + { + "epoch": 0.21, + "learning_rate": 1.829405685450202e-05, + "loss": 0.3919, + "step": 2689 + }, + { + "epoch": 0.21, + "learning_rate": 1.8292623076125983e-05, + "loss": 0.4077, + "step": 2690 + }, + { + "epoch": 0.21, + "learning_rate": 1.8291188751720615e-05, + "loss": 0.3375, + "step": 2691 + }, + { + "epoch": 0.21, + "learning_rate": 1.828975388138036e-05, + "loss": 0.4012, + "step": 2692 + }, + { + "epoch": 0.21, + "learning_rate": 1.8288318465199705e-05, + "loss": 0.333, + "step": 2693 + }, + { + "epoch": 0.21, + "learning_rate": 1.8286882503273157e-05, + "loss": 0.4421, + "step": 2694 + }, + { + "epoch": 0.21, + "learning_rate": 1.828544599569527e-05, + "loss": 0.361, + "step": 2695 + }, + { + "epoch": 0.21, + "learning_rate": 1.8284008942560634e-05, + "loss": 0.4517, + "step": 2696 + }, + { + "epoch": 0.21, + "learning_rate": 1.8282571343963865e-05, + "loss": 0.3747, + "step": 2697 + }, + { + "epoch": 0.21, + "learning_rate": 1.8281133199999628e-05, + "loss": 0.3425, + "step": 2698 + }, + { + "epoch": 0.21, + "learning_rate": 1.8279694510762616e-05, + "loss": 0.4278, + "step": 2699 + }, + { + "epoch": 0.21, + "learning_rate": 1.8278255276347563e-05, + "loss": 0.4334, + "step": 2700 + }, + { + "epoch": 0.21, + "learning_rate": 1.8276815496849227e-05, + "loss": 0.4914, + "step": 2701 + }, + { + "epoch": 0.21, + "learning_rate": 1.827537517236242e-05, + "loss": 0.5092, + "step": 2702 + }, + { + "epoch": 0.21, + "learning_rate": 1.8273934302981975e-05, + "loss": 0.3157, + "step": 2703 + }, + { + "epoch": 0.21, + "learning_rate": 1.8272492888802767e-05, + "loss": 0.3275, + "step": 2704 + }, + { + "epoch": 0.21, + "learning_rate": 1.8271050929919707e-05, + "loss": 0.3495, + "step": 2705 + }, + { + "epoch": 0.21, + "learning_rate": 1.8269608426427743e-05, + "loss": 0.5227, + "step": 2706 + }, + { + "epoch": 0.21, + "learning_rate": 1.8268165378421852e-05, + "loss": 0.4709, + "step": 2707 + }, + { + "epoch": 0.21, + "learning_rate": 1.826672178599706e-05, + "loss": 0.4502, + "step": 2708 + }, + { + "epoch": 0.21, + "learning_rate": 1.826527764924841e-05, + "loss": 0.4191, + "step": 2709 + }, + { + "epoch": 0.21, + "learning_rate": 1.8263832968271e-05, + "loss": 0.4247, + "step": 2710 + }, + { + "epoch": 0.21, + "learning_rate": 1.826238774315995e-05, + "loss": 0.3751, + "step": 2711 + }, + { + "epoch": 0.21, + "learning_rate": 1.8260941974010425e-05, + "loss": 0.3106, + "step": 2712 + }, + { + "epoch": 0.21, + "learning_rate": 1.825949566091762e-05, + "loss": 0.35, + "step": 2713 + }, + { + "epoch": 0.22, + "learning_rate": 1.8258048803976763e-05, + "loss": 0.3555, + "step": 2714 + }, + { + "epoch": 0.22, + "learning_rate": 1.8256601403283133e-05, + "loss": 0.3851, + "step": 2715 + }, + { + "epoch": 0.22, + "learning_rate": 1.8255153458932028e-05, + "loss": 0.3666, + "step": 2716 + }, + { + "epoch": 0.22, + "learning_rate": 1.825370497101879e-05, + "loss": 0.3363, + "step": 2717 + }, + { + "epoch": 0.22, + "learning_rate": 1.825225593963879e-05, + "loss": 0.3756, + "step": 2718 + }, + { + "epoch": 0.22, + "learning_rate": 1.8250806364887446e-05, + "loss": 0.3621, + "step": 2719 + }, + { + "epoch": 0.22, + "learning_rate": 1.8249356246860205e-05, + "loss": 0.3026, + "step": 2720 + }, + { + "epoch": 0.22, + "learning_rate": 1.8247905585652545e-05, + "loss": 0.4131, + "step": 2721 + }, + { + "epoch": 0.22, + "learning_rate": 1.824645438135999e-05, + "loss": 0.3393, + "step": 2722 + }, + { + "epoch": 0.22, + "learning_rate": 1.8245002634078095e-05, + "loss": 0.3545, + "step": 2723 + }, + { + "epoch": 0.22, + "learning_rate": 1.8243550343902447e-05, + "loss": 0.3449, + "step": 2724 + }, + { + "epoch": 0.22, + "learning_rate": 1.8242097510928672e-05, + "loss": 0.4115, + "step": 2725 + }, + { + "epoch": 0.22, + "learning_rate": 1.824064413525244e-05, + "loss": 0.3476, + "step": 2726 + }, + { + "epoch": 0.22, + "learning_rate": 1.823919021696944e-05, + "loss": 0.3684, + "step": 2727 + }, + { + "epoch": 0.22, + "learning_rate": 1.8237735756175408e-05, + "loss": 0.515, + "step": 2728 + }, + { + "epoch": 0.22, + "learning_rate": 1.8236280752966115e-05, + "loss": 0.306, + "step": 2729 + }, + { + "epoch": 0.22, + "learning_rate": 1.8234825207437365e-05, + "loss": 0.341, + "step": 2730 + }, + { + "epoch": 0.22, + "learning_rate": 1.8233369119685e-05, + "loss": 0.3561, + "step": 2731 + }, + { + "epoch": 0.22, + "learning_rate": 1.8231912489804893e-05, + "loss": 0.3068, + "step": 2732 + }, + { + "epoch": 0.22, + "learning_rate": 1.8230455317892957e-05, + "loss": 0.3192, + "step": 2733 + }, + { + "epoch": 0.22, + "learning_rate": 1.822899760404514e-05, + "loss": 0.364, + "step": 2734 + }, + { + "epoch": 0.22, + "learning_rate": 1.822753934835743e-05, + "loss": 0.4656, + "step": 2735 + }, + { + "epoch": 0.22, + "learning_rate": 1.822608055092584e-05, + "loss": 0.3655, + "step": 2736 + }, + { + "epoch": 0.22, + "learning_rate": 1.8224621211846426e-05, + "loss": 0.5365, + "step": 2737 + }, + { + "epoch": 0.22, + "learning_rate": 1.8223161331215285e-05, + "loss": 0.3953, + "step": 2738 + }, + { + "epoch": 0.22, + "learning_rate": 1.822170090912853e-05, + "loss": 0.3923, + "step": 2739 + }, + { + "epoch": 0.22, + "learning_rate": 1.8220239945682337e-05, + "loss": 0.3809, + "step": 2740 + }, + { + "epoch": 0.22, + "learning_rate": 1.8218778440972893e-05, + "loss": 0.4338, + "step": 2741 + }, + { + "epoch": 0.22, + "learning_rate": 1.8217316395096438e-05, + "loss": 0.4043, + "step": 2742 + }, + { + "epoch": 0.22, + "learning_rate": 1.8215853808149237e-05, + "loss": 0.374, + "step": 2743 + }, + { + "epoch": 0.22, + "learning_rate": 1.8214390680227588e-05, + "loss": 0.3646, + "step": 2744 + }, + { + "epoch": 0.22, + "learning_rate": 1.8212927011427847e-05, + "loss": 0.4915, + "step": 2745 + }, + { + "epoch": 0.22, + "learning_rate": 1.8211462801846375e-05, + "loss": 0.4083, + "step": 2746 + }, + { + "epoch": 0.22, + "learning_rate": 1.820999805157959e-05, + "loss": 0.3488, + "step": 2747 + }, + { + "epoch": 0.22, + "learning_rate": 1.8208532760723937e-05, + "loss": 0.3371, + "step": 2748 + }, + { + "epoch": 0.22, + "learning_rate": 1.82070669293759e-05, + "loss": 0.4493, + "step": 2749 + }, + { + "epoch": 0.22, + "learning_rate": 1.8205600557631995e-05, + "loss": 0.4655, + "step": 2750 + }, + { + "epoch": 0.22, + "learning_rate": 1.8204133645588774e-05, + "loss": 0.4536, + "step": 2751 + }, + { + "epoch": 0.22, + "learning_rate": 1.8202666193342834e-05, + "loss": 0.4623, + "step": 2752 + }, + { + "epoch": 0.22, + "learning_rate": 1.8201198200990787e-05, + "loss": 0.4227, + "step": 2753 + }, + { + "epoch": 0.22, + "learning_rate": 1.8199729668629303e-05, + "loss": 0.4358, + "step": 2754 + }, + { + "epoch": 0.22, + "learning_rate": 1.8198260596355077e-05, + "loss": 0.367, + "step": 2755 + }, + { + "epoch": 0.22, + "learning_rate": 1.8196790984264835e-05, + "loss": 0.5431, + "step": 2756 + }, + { + "epoch": 0.22, + "learning_rate": 1.8195320832455347e-05, + "loss": 0.4014, + "step": 2757 + }, + { + "epoch": 0.22, + "learning_rate": 1.819385014102342e-05, + "loss": 0.4354, + "step": 2758 + }, + { + "epoch": 0.22, + "learning_rate": 1.8192378910065882e-05, + "loss": 0.4475, + "step": 2759 + }, + { + "epoch": 0.22, + "learning_rate": 1.8190907139679614e-05, + "loss": 0.4369, + "step": 2760 + }, + { + "epoch": 0.22, + "learning_rate": 1.8189434829961525e-05, + "loss": 0.3687, + "step": 2761 + }, + { + "epoch": 0.22, + "learning_rate": 1.8187961981008554e-05, + "loss": 0.3824, + "step": 2762 + }, + { + "epoch": 0.22, + "learning_rate": 1.8186488592917686e-05, + "loss": 0.3423, + "step": 2763 + }, + { + "epoch": 0.22, + "learning_rate": 1.8185014665785936e-05, + "loss": 0.4205, + "step": 2764 + }, + { + "epoch": 0.22, + "learning_rate": 1.8183540199710354e-05, + "loss": 0.3479, + "step": 2765 + }, + { + "epoch": 0.22, + "learning_rate": 1.8182065194788024e-05, + "loss": 0.4239, + "step": 2766 + }, + { + "epoch": 0.22, + "learning_rate": 1.8180589651116073e-05, + "loss": 0.5009, + "step": 2767 + }, + { + "epoch": 0.22, + "learning_rate": 1.8179113568791656e-05, + "loss": 0.4513, + "step": 2768 + }, + { + "epoch": 0.22, + "learning_rate": 1.8177636947911964e-05, + "loss": 0.544, + "step": 2769 + }, + { + "epoch": 0.22, + "learning_rate": 1.817615978857423e-05, + "loss": 0.464, + "step": 2770 + }, + { + "epoch": 0.22, + "learning_rate": 1.8174682090875713e-05, + "loss": 0.4543, + "step": 2771 + }, + { + "epoch": 0.22, + "learning_rate": 1.8173203854913714e-05, + "loss": 0.3657, + "step": 2772 + }, + { + "epoch": 0.22, + "learning_rate": 1.817172508078557e-05, + "loss": 0.3402, + "step": 2773 + }, + { + "epoch": 0.22, + "learning_rate": 1.817024576858865e-05, + "loss": 0.3431, + "step": 2774 + }, + { + "epoch": 0.22, + "learning_rate": 1.8168765918420358e-05, + "loss": 0.4326, + "step": 2775 + }, + { + "epoch": 0.22, + "learning_rate": 1.8167285530378134e-05, + "loss": 0.4707, + "step": 2776 + }, + { + "epoch": 0.22, + "learning_rate": 1.8165804604559455e-05, + "loss": 0.3807, + "step": 2777 + }, + { + "epoch": 0.22, + "learning_rate": 1.816432314106184e-05, + "loss": 0.3342, + "step": 2778 + }, + { + "epoch": 0.22, + "learning_rate": 1.8162841139982827e-05, + "loss": 0.3796, + "step": 2779 + }, + { + "epoch": 0.22, + "learning_rate": 1.816135860142e-05, + "loss": 0.4941, + "step": 2780 + }, + { + "epoch": 0.22, + "learning_rate": 1.8159875525470984e-05, + "loss": 0.3524, + "step": 2781 + }, + { + "epoch": 0.22, + "learning_rate": 1.815839191223342e-05, + "loss": 0.3324, + "step": 2782 + }, + { + "epoch": 0.22, + "learning_rate": 1.815690776180501e-05, + "loss": 0.5058, + "step": 2783 + }, + { + "epoch": 0.22, + "learning_rate": 1.815542307428347e-05, + "loss": 0.3859, + "step": 2784 + }, + { + "epoch": 0.22, + "learning_rate": 1.8153937849766567e-05, + "loss": 0.327, + "step": 2785 + }, + { + "epoch": 0.22, + "learning_rate": 1.8152452088352084e-05, + "loss": 0.3795, + "step": 2786 + }, + { + "epoch": 0.22, + "learning_rate": 1.8150965790137863e-05, + "loss": 0.4089, + "step": 2787 + }, + { + "epoch": 0.22, + "learning_rate": 1.814947895522176e-05, + "loss": 0.3856, + "step": 2788 + }, + { + "epoch": 0.22, + "learning_rate": 1.8147991583701685e-05, + "loss": 0.3958, + "step": 2789 + }, + { + "epoch": 0.22, + "learning_rate": 1.8146503675675568e-05, + "loss": 0.3605, + "step": 2790 + }, + { + "epoch": 0.22, + "learning_rate": 1.814501523124138e-05, + "loss": 0.3737, + "step": 2791 + }, + { + "epoch": 0.22, + "learning_rate": 1.8143526250497134e-05, + "loss": 0.3276, + "step": 2792 + }, + { + "epoch": 0.22, + "learning_rate": 1.8142036733540868e-05, + "loss": 0.4414, + "step": 2793 + }, + { + "epoch": 0.22, + "learning_rate": 1.814054668047066e-05, + "loss": 0.5026, + "step": 2794 + }, + { + "epoch": 0.22, + "learning_rate": 1.8139056091384623e-05, + "loss": 0.3882, + "step": 2795 + }, + { + "epoch": 0.22, + "learning_rate": 1.8137564966380905e-05, + "loss": 0.3861, + "step": 2796 + }, + { + "epoch": 0.22, + "learning_rate": 1.813607330555769e-05, + "loss": 0.5219, + "step": 2797 + }, + { + "epoch": 0.22, + "learning_rate": 1.8134581109013193e-05, + "loss": 0.404, + "step": 2798 + }, + { + "epoch": 0.22, + "learning_rate": 1.8133088376845675e-05, + "loss": 0.4957, + "step": 2799 + }, + { + "epoch": 0.22, + "learning_rate": 1.8131595109153416e-05, + "loss": 0.4187, + "step": 2800 + }, + { + "epoch": 0.22, + "learning_rate": 1.813010130603475e-05, + "loss": 0.5176, + "step": 2801 + }, + { + "epoch": 0.22, + "learning_rate": 1.812860696758803e-05, + "loss": 0.3985, + "step": 2802 + }, + { + "epoch": 0.22, + "learning_rate": 1.8127112093911655e-05, + "loss": 0.3624, + "step": 2803 + }, + { + "epoch": 0.22, + "learning_rate": 1.8125616685104055e-05, + "loss": 0.4203, + "step": 2804 + }, + { + "epoch": 0.22, + "learning_rate": 1.8124120741263692e-05, + "loss": 0.5074, + "step": 2805 + }, + { + "epoch": 0.22, + "learning_rate": 1.812262426248907e-05, + "loss": 0.3691, + "step": 2806 + }, + { + "epoch": 0.22, + "learning_rate": 1.8121127248878726e-05, + "loss": 0.3232, + "step": 2807 + }, + { + "epoch": 0.22, + "learning_rate": 1.8119629700531228e-05, + "loss": 0.4957, + "step": 2808 + }, + { + "epoch": 0.22, + "learning_rate": 1.8118131617545183e-05, + "loss": 0.3373, + "step": 2809 + }, + { + "epoch": 0.22, + "learning_rate": 1.8116633000019233e-05, + "loss": 0.3932, + "step": 2810 + }, + { + "epoch": 0.22, + "learning_rate": 1.8115133848052052e-05, + "loss": 0.3582, + "step": 2811 + }, + { + "epoch": 0.22, + "learning_rate": 1.8113634161742356e-05, + "loss": 0.3867, + "step": 2812 + }, + { + "epoch": 0.22, + "learning_rate": 1.8112133941188892e-05, + "loss": 0.342, + "step": 2813 + }, + { + "epoch": 0.22, + "learning_rate": 1.811063318649044e-05, + "loss": 0.3641, + "step": 2814 + }, + { + "epoch": 0.22, + "learning_rate": 1.8109131897745823e-05, + "loss": 0.5225, + "step": 2815 + }, + { + "epoch": 0.22, + "learning_rate": 1.8107630075053883e-05, + "loss": 0.3322, + "step": 2816 + }, + { + "epoch": 0.22, + "learning_rate": 1.810612771851352e-05, + "loss": 0.3969, + "step": 2817 + }, + { + "epoch": 0.22, + "learning_rate": 1.8104624828223644e-05, + "loss": 0.2965, + "step": 2818 + }, + { + "epoch": 0.22, + "learning_rate": 1.8103121404283222e-05, + "loss": 0.2746, + "step": 2819 + }, + { + "epoch": 0.22, + "learning_rate": 1.8101617446791248e-05, + "loss": 0.4774, + "step": 2820 + }, + { + "epoch": 0.22, + "learning_rate": 1.8100112955846746e-05, + "loss": 0.466, + "step": 2821 + }, + { + "epoch": 0.22, + "learning_rate": 1.8098607931548782e-05, + "loss": 0.3129, + "step": 2822 + }, + { + "epoch": 0.22, + "learning_rate": 1.8097102373996453e-05, + "loss": 0.3385, + "step": 2823 + }, + { + "epoch": 0.22, + "learning_rate": 1.809559628328889e-05, + "loss": 0.4426, + "step": 2824 + }, + { + "epoch": 0.22, + "learning_rate": 1.8094089659525274e-05, + "loss": 0.3191, + "step": 2825 + }, + { + "epoch": 0.22, + "learning_rate": 1.8092582502804793e-05, + "loss": 0.3699, + "step": 2826 + }, + { + "epoch": 0.22, + "learning_rate": 1.8091074813226696e-05, + "loss": 0.3692, + "step": 2827 + }, + { + "epoch": 0.22, + "learning_rate": 1.8089566590890253e-05, + "loss": 0.3376, + "step": 2828 + }, + { + "epoch": 0.22, + "learning_rate": 1.8088057835894775e-05, + "loss": 0.3619, + "step": 2829 + }, + { + "epoch": 0.22, + "learning_rate": 1.8086548548339604e-05, + "loss": 0.4827, + "step": 2830 + }, + { + "epoch": 0.22, + "learning_rate": 1.8085038728324123e-05, + "loss": 0.4796, + "step": 2831 + }, + { + "epoch": 0.22, + "learning_rate": 1.8083528375947744e-05, + "loss": 0.3915, + "step": 2832 + }, + { + "epoch": 0.22, + "learning_rate": 1.808201749130992e-05, + "loss": 0.4582, + "step": 2833 + }, + { + "epoch": 0.22, + "learning_rate": 1.8080506074510128e-05, + "loss": 0.475, + "step": 2834 + }, + { + "epoch": 0.22, + "learning_rate": 1.8078994125647896e-05, + "loss": 0.3059, + "step": 2835 + }, + { + "epoch": 0.22, + "learning_rate": 1.807748164482277e-05, + "loss": 0.3971, + "step": 2836 + }, + { + "epoch": 0.22, + "learning_rate": 1.8075968632134343e-05, + "loss": 0.3734, + "step": 2837 + }, + { + "epoch": 0.22, + "learning_rate": 1.8074455087682247e-05, + "loss": 0.3699, + "step": 2838 + }, + { + "epoch": 0.22, + "learning_rate": 1.8072941011566133e-05, + "loss": 0.3703, + "step": 2839 + }, + { + "epoch": 0.22, + "learning_rate": 1.8071426403885698e-05, + "loss": 0.4075, + "step": 2840 + }, + { + "epoch": 0.23, + "learning_rate": 1.8069911264740667e-05, + "loss": 0.5296, + "step": 2841 + }, + { + "epoch": 0.23, + "learning_rate": 1.8068395594230815e-05, + "loss": 0.2939, + "step": 2842 + }, + { + "epoch": 0.23, + "learning_rate": 1.8066879392455932e-05, + "loss": 0.3356, + "step": 2843 + }, + { + "epoch": 0.23, + "learning_rate": 1.8065362659515856e-05, + "loss": 0.2914, + "step": 2844 + }, + { + "epoch": 0.23, + "learning_rate": 1.806384539551046e-05, + "loss": 0.2352, + "step": 2845 + }, + { + "epoch": 0.23, + "learning_rate": 1.8062327600539643e-05, + "loss": 0.4645, + "step": 2846 + }, + { + "epoch": 0.23, + "learning_rate": 1.8060809274703352e-05, + "loss": 0.3284, + "step": 2847 + }, + { + "epoch": 0.23, + "learning_rate": 1.805929041810155e-05, + "loss": 0.3046, + "step": 2848 + }, + { + "epoch": 0.23, + "learning_rate": 1.8057771030834255e-05, + "loss": 0.418, + "step": 2849 + }, + { + "epoch": 0.23, + "learning_rate": 1.8056251113001508e-05, + "loss": 0.3579, + "step": 2850 + }, + { + "epoch": 0.23, + "learning_rate": 1.8054730664703393e-05, + "loss": 0.338, + "step": 2851 + }, + { + "epoch": 0.23, + "learning_rate": 1.8053209686040017e-05, + "loss": 0.4153, + "step": 2852 + }, + { + "epoch": 0.23, + "learning_rate": 1.8051688177111532e-05, + "loss": 0.2311, + "step": 2853 + }, + { + "epoch": 0.23, + "learning_rate": 1.805016613801813e-05, + "loss": 0.2566, + "step": 2854 + }, + { + "epoch": 0.23, + "learning_rate": 1.8048643568860015e-05, + "loss": 0.4372, + "step": 2855 + }, + { + "epoch": 0.23, + "learning_rate": 1.804712046973745e-05, + "loss": 0.3899, + "step": 2856 + }, + { + "epoch": 0.23, + "learning_rate": 1.8045596840750722e-05, + "loss": 0.4223, + "step": 2857 + }, + { + "epoch": 0.23, + "learning_rate": 1.804407268200016e-05, + "loss": 0.5447, + "step": 2858 + }, + { + "epoch": 0.23, + "learning_rate": 1.8042547993586114e-05, + "loss": 0.3232, + "step": 2859 + }, + { + "epoch": 0.23, + "learning_rate": 1.8041022775608977e-05, + "loss": 0.3692, + "step": 2860 + }, + { + "epoch": 0.23, + "learning_rate": 1.803949702816919e-05, + "loss": 0.4581, + "step": 2861 + }, + { + "epoch": 0.23, + "learning_rate": 1.80379707513672e-05, + "loss": 0.5019, + "step": 2862 + }, + { + "epoch": 0.23, + "learning_rate": 1.8036443945303514e-05, + "loss": 0.5065, + "step": 2863 + }, + { + "epoch": 0.23, + "learning_rate": 1.8034916610078665e-05, + "loss": 0.439, + "step": 2864 + }, + { + "epoch": 0.23, + "learning_rate": 1.8033388745793218e-05, + "loss": 0.4591, + "step": 2865 + }, + { + "epoch": 0.23, + "learning_rate": 1.8031860352547777e-05, + "loss": 0.4943, + "step": 2866 + }, + { + "epoch": 0.23, + "learning_rate": 1.8030331430442974e-05, + "loss": 0.4817, + "step": 2867 + }, + { + "epoch": 0.23, + "learning_rate": 1.8028801979579487e-05, + "loss": 0.4299, + "step": 2868 + }, + { + "epoch": 0.23, + "learning_rate": 1.8027272000058028e-05, + "loss": 0.4195, + "step": 2869 + }, + { + "epoch": 0.23, + "learning_rate": 1.8025741491979326e-05, + "loss": 0.4548, + "step": 2870 + }, + { + "epoch": 0.23, + "learning_rate": 1.8024210455444168e-05, + "loss": 0.4328, + "step": 2871 + }, + { + "epoch": 0.23, + "learning_rate": 1.8022678890553364e-05, + "loss": 0.4196, + "step": 2872 + }, + { + "epoch": 0.23, + "learning_rate": 1.8021146797407752e-05, + "loss": 0.4004, + "step": 2873 + }, + { + "epoch": 0.23, + "learning_rate": 1.801961417610822e-05, + "loss": 0.3306, + "step": 2874 + }, + { + "epoch": 0.23, + "learning_rate": 1.801808102675568e-05, + "loss": 0.4759, + "step": 2875 + }, + { + "epoch": 0.23, + "learning_rate": 1.801654734945109e-05, + "loss": 0.3542, + "step": 2876 + }, + { + "epoch": 0.23, + "learning_rate": 1.801501314429543e-05, + "loss": 0.3855, + "step": 2877 + }, + { + "epoch": 0.23, + "learning_rate": 1.801347841138972e-05, + "loss": 0.4708, + "step": 2878 + }, + { + "epoch": 0.23, + "learning_rate": 1.8011943150835013e-05, + "loss": 0.4384, + "step": 2879 + }, + { + "epoch": 0.23, + "learning_rate": 1.80104073627324e-05, + "loss": 0.3778, + "step": 2880 + }, + { + "epoch": 0.23, + "learning_rate": 1.8008871047183005e-05, + "loss": 0.4631, + "step": 2881 + }, + { + "epoch": 0.23, + "learning_rate": 1.800733420428799e-05, + "loss": 0.3518, + "step": 2882 + }, + { + "epoch": 0.23, + "learning_rate": 1.8005796834148545e-05, + "loss": 0.3291, + "step": 2883 + }, + { + "epoch": 0.23, + "learning_rate": 1.8004258936865902e-05, + "loss": 0.44, + "step": 2884 + }, + { + "epoch": 0.23, + "learning_rate": 1.800272051254132e-05, + "loss": 0.4451, + "step": 2885 + }, + { + "epoch": 0.23, + "learning_rate": 1.80011815612761e-05, + "loss": 0.4873, + "step": 2886 + }, + { + "epoch": 0.23, + "learning_rate": 1.7999642083171576e-05, + "loss": 0.286, + "step": 2887 + }, + { + "epoch": 0.23, + "learning_rate": 1.799810207832911e-05, + "loss": 0.3977, + "step": 2888 + }, + { + "epoch": 0.23, + "learning_rate": 1.7996561546850105e-05, + "loss": 0.4264, + "step": 2889 + }, + { + "epoch": 0.23, + "learning_rate": 1.7995020488836e-05, + "loss": 0.2862, + "step": 2890 + }, + { + "epoch": 0.23, + "learning_rate": 1.799347890438827e-05, + "loss": 0.3817, + "step": 2891 + }, + { + "epoch": 0.23, + "learning_rate": 1.799193679360841e-05, + "loss": 0.3239, + "step": 2892 + }, + { + "epoch": 0.23, + "learning_rate": 1.799039415659797e-05, + "loss": 0.4092, + "step": 2893 + }, + { + "epoch": 0.23, + "learning_rate": 1.798885099345852e-05, + "loss": 0.3285, + "step": 2894 + }, + { + "epoch": 0.23, + "learning_rate": 1.7987307304291676e-05, + "loss": 0.4258, + "step": 2895 + }, + { + "epoch": 0.23, + "learning_rate": 1.7985763089199073e-05, + "loss": 0.4189, + "step": 2896 + }, + { + "epoch": 0.23, + "learning_rate": 1.79842183482824e-05, + "loss": 0.3264, + "step": 2897 + }, + { + "epoch": 0.23, + "learning_rate": 1.7982673081643364e-05, + "loss": 0.3541, + "step": 2898 + }, + { + "epoch": 0.23, + "learning_rate": 1.7981127289383718e-05, + "loss": 0.3946, + "step": 2899 + }, + { + "epoch": 0.23, + "learning_rate": 1.797958097160524e-05, + "loss": 0.4526, + "step": 2900 + }, + { + "epoch": 0.23, + "learning_rate": 1.797803412840975e-05, + "loss": 0.4462, + "step": 2901 + }, + { + "epoch": 0.23, + "learning_rate": 1.7976486759899103e-05, + "loss": 0.428, + "step": 2902 + }, + { + "epoch": 0.23, + "learning_rate": 1.797493886617518e-05, + "loss": 0.3995, + "step": 2903 + }, + { + "epoch": 0.23, + "learning_rate": 1.797339044733991e-05, + "loss": 0.4562, + "step": 2904 + }, + { + "epoch": 0.23, + "learning_rate": 1.797184150349524e-05, + "loss": 0.464, + "step": 2905 + }, + { + "epoch": 0.23, + "learning_rate": 1.7970292034743172e-05, + "loss": 0.3033, + "step": 2906 + }, + { + "epoch": 0.23, + "learning_rate": 1.7968742041185718e-05, + "loss": 0.4658, + "step": 2907 + }, + { + "epoch": 0.23, + "learning_rate": 1.7967191522924946e-05, + "loss": 0.3765, + "step": 2908 + }, + { + "epoch": 0.23, + "learning_rate": 1.7965640480062945e-05, + "loss": 0.4006, + "step": 2909 + }, + { + "epoch": 0.23, + "learning_rate": 1.796408891270185e-05, + "loss": 0.4572, + "step": 2910 + }, + { + "epoch": 0.23, + "learning_rate": 1.7962536820943822e-05, + "loss": 0.3745, + "step": 2911 + }, + { + "epoch": 0.23, + "learning_rate": 1.7960984204891055e-05, + "loss": 0.5658, + "step": 2912 + }, + { + "epoch": 0.23, + "learning_rate": 1.7959431064645786e-05, + "loss": 0.363, + "step": 2913 + }, + { + "epoch": 0.23, + "learning_rate": 1.7957877400310275e-05, + "loss": 0.4308, + "step": 2914 + }, + { + "epoch": 0.23, + "learning_rate": 1.7956323211986833e-05, + "loss": 0.3822, + "step": 2915 + }, + { + "epoch": 0.23, + "learning_rate": 1.795476849977779e-05, + "loss": 0.4091, + "step": 2916 + }, + { + "epoch": 0.23, + "learning_rate": 1.7953213263785513e-05, + "loss": 0.4128, + "step": 2917 + }, + { + "epoch": 0.23, + "learning_rate": 1.7951657504112416e-05, + "loss": 0.4479, + "step": 2918 + }, + { + "epoch": 0.23, + "learning_rate": 1.795010122086093e-05, + "loss": 0.4431, + "step": 2919 + }, + { + "epoch": 0.23, + "learning_rate": 1.7948544414133534e-05, + "loss": 0.333, + "step": 2920 + }, + { + "epoch": 0.23, + "learning_rate": 1.7946987084032733e-05, + "loss": 0.4109, + "step": 2921 + }, + { + "epoch": 0.23, + "learning_rate": 1.794542923066107e-05, + "loss": 0.365, + "step": 2922 + }, + { + "epoch": 0.23, + "learning_rate": 1.7943870854121126e-05, + "loss": 0.363, + "step": 2923 + }, + { + "epoch": 0.23, + "learning_rate": 1.794231195451551e-05, + "loss": 0.307, + "step": 2924 + }, + { + "epoch": 0.23, + "learning_rate": 1.7940752531946867e-05, + "loss": 0.4455, + "step": 2925 + }, + { + "epoch": 0.23, + "learning_rate": 1.793919258651788e-05, + "loss": 0.441, + "step": 2926 + }, + { + "epoch": 0.23, + "learning_rate": 1.7937632118331255e-05, + "loss": 0.3302, + "step": 2927 + }, + { + "epoch": 0.23, + "learning_rate": 1.7936071127489755e-05, + "loss": 0.4819, + "step": 2928 + }, + { + "epoch": 0.23, + "learning_rate": 1.7934509614096156e-05, + "loss": 0.3709, + "step": 2929 + }, + { + "epoch": 0.23, + "learning_rate": 1.7932947578253273e-05, + "loss": 0.3409, + "step": 2930 + }, + { + "epoch": 0.23, + "learning_rate": 1.793138502006397e-05, + "loss": 0.395, + "step": 2931 + }, + { + "epoch": 0.23, + "learning_rate": 1.792982193963112e-05, + "loss": 0.3221, + "step": 2932 + }, + { + "epoch": 0.23, + "learning_rate": 1.7928258337057657e-05, + "loss": 0.367, + "step": 2933 + }, + { + "epoch": 0.23, + "learning_rate": 1.792669421244653e-05, + "loss": 0.4078, + "step": 2934 + }, + { + "epoch": 0.23, + "learning_rate": 1.7925129565900728e-05, + "loss": 0.3909, + "step": 2935 + }, + { + "epoch": 0.23, + "learning_rate": 1.792356439752328e-05, + "loss": 0.4512, + "step": 2936 + }, + { + "epoch": 0.23, + "learning_rate": 1.792199870741724e-05, + "loss": 0.3525, + "step": 2937 + }, + { + "epoch": 0.23, + "learning_rate": 1.79204324956857e-05, + "loss": 0.5426, + "step": 2938 + }, + { + "epoch": 0.23, + "learning_rate": 1.7918865762431794e-05, + "loss": 0.4668, + "step": 2939 + }, + { + "epoch": 0.23, + "learning_rate": 1.7917298507758684e-05, + "loss": 0.3812, + "step": 2940 + }, + { + "epoch": 0.23, + "learning_rate": 1.7915730731769558e-05, + "loss": 0.3028, + "step": 2941 + }, + { + "epoch": 0.23, + "learning_rate": 1.7914162434567653e-05, + "loss": 0.406, + "step": 2942 + }, + { + "epoch": 0.23, + "learning_rate": 1.791259361625623e-05, + "loss": 0.4341, + "step": 2943 + }, + { + "epoch": 0.23, + "learning_rate": 1.7911024276938595e-05, + "loss": 0.419, + "step": 2944 + }, + { + "epoch": 0.23, + "learning_rate": 1.7909454416718075e-05, + "loss": 0.4087, + "step": 2945 + }, + { + "epoch": 0.23, + "learning_rate": 1.790788403569804e-05, + "loss": 0.3682, + "step": 2946 + }, + { + "epoch": 0.23, + "learning_rate": 1.7906313133981887e-05, + "loss": 0.4198, + "step": 2947 + }, + { + "epoch": 0.23, + "learning_rate": 1.7904741711673064e-05, + "loss": 0.3854, + "step": 2948 + }, + { + "epoch": 0.23, + "learning_rate": 1.790316976887503e-05, + "loss": 0.3499, + "step": 2949 + }, + { + "epoch": 0.23, + "learning_rate": 1.7901597305691294e-05, + "loss": 0.3843, + "step": 2950 + }, + { + "epoch": 0.23, + "learning_rate": 1.7900024322225394e-05, + "loss": 0.3305, + "step": 2951 + }, + { + "epoch": 0.23, + "learning_rate": 1.789845081858091e-05, + "loss": 0.453, + "step": 2952 + }, + { + "epoch": 0.23, + "learning_rate": 1.7896876794861443e-05, + "loss": 0.3709, + "step": 2953 + }, + { + "epoch": 0.23, + "learning_rate": 1.7895302251170636e-05, + "loss": 0.3575, + "step": 2954 + }, + { + "epoch": 0.23, + "learning_rate": 1.789372718761216e-05, + "loss": 0.4692, + "step": 2955 + }, + { + "epoch": 0.23, + "learning_rate": 1.7892151604289738e-05, + "loss": 0.4822, + "step": 2956 + }, + { + "epoch": 0.23, + "learning_rate": 1.7890575501307105e-05, + "loss": 0.3849, + "step": 2957 + }, + { + "epoch": 0.23, + "learning_rate": 1.7888998878768045e-05, + "loss": 0.342, + "step": 2958 + }, + { + "epoch": 0.23, + "learning_rate": 1.7887421736776364e-05, + "loss": 0.2647, + "step": 2959 + }, + { + "epoch": 0.23, + "learning_rate": 1.7885844075435915e-05, + "loss": 0.3779, + "step": 2960 + }, + { + "epoch": 0.23, + "learning_rate": 1.788426589485058e-05, + "loss": 0.4399, + "step": 2961 + }, + { + "epoch": 0.23, + "learning_rate": 1.788268719512427e-05, + "loss": 0.3735, + "step": 2962 + }, + { + "epoch": 0.23, + "learning_rate": 1.788110797636094e-05, + "loss": 0.3773, + "step": 2963 + }, + { + "epoch": 0.23, + "learning_rate": 1.7879528238664567e-05, + "loss": 0.4346, + "step": 2964 + }, + { + "epoch": 0.23, + "learning_rate": 1.7877947982139177e-05, + "loss": 0.4581, + "step": 2965 + }, + { + "epoch": 0.23, + "learning_rate": 1.7876367206888817e-05, + "loss": 0.5298, + "step": 2966 + }, + { + "epoch": 0.24, + "learning_rate": 1.7874785913017575e-05, + "loss": 0.3119, + "step": 2967 + }, + { + "epoch": 0.24, + "learning_rate": 1.7873204100629572e-05, + "loss": 0.3867, + "step": 2968 + }, + { + "epoch": 0.24, + "learning_rate": 1.7871621769828965e-05, + "loss": 0.3848, + "step": 2969 + }, + { + "epoch": 0.24, + "learning_rate": 1.7870038920719935e-05, + "loss": 0.2982, + "step": 2970 + }, + { + "epoch": 0.24, + "learning_rate": 1.7868455553406713e-05, + "loss": 0.4204, + "step": 2971 + }, + { + "epoch": 0.24, + "learning_rate": 1.7866871667993554e-05, + "loss": 0.4569, + "step": 2972 + }, + { + "epoch": 0.24, + "learning_rate": 1.786528726458475e-05, + "loss": 0.3447, + "step": 2973 + }, + { + "epoch": 0.24, + "learning_rate": 1.786370234328462e-05, + "loss": 0.3558, + "step": 2974 + }, + { + "epoch": 0.24, + "learning_rate": 1.7862116904197534e-05, + "loss": 0.4253, + "step": 2975 + }, + { + "epoch": 0.24, + "learning_rate": 1.7860530947427878e-05, + "loss": 0.493, + "step": 2976 + }, + { + "epoch": 0.24, + "learning_rate": 1.785894447308008e-05, + "loss": 0.4877, + "step": 2977 + }, + { + "epoch": 0.24, + "learning_rate": 1.7857357481258603e-05, + "loss": 0.3123, + "step": 2978 + }, + { + "epoch": 0.24, + "learning_rate": 1.7855769972067944e-05, + "loss": 0.3563, + "step": 2979 + }, + { + "epoch": 0.24, + "learning_rate": 1.785418194561263e-05, + "loss": 0.3992, + "step": 2980 + }, + { + "epoch": 0.24, + "learning_rate": 1.7852593401997232e-05, + "loss": 0.3453, + "step": 2981 + }, + { + "epoch": 0.24, + "learning_rate": 1.785100434132634e-05, + "loss": 0.3188, + "step": 2982 + }, + { + "epoch": 0.24, + "learning_rate": 1.7849414763704587e-05, + "loss": 0.3723, + "step": 2983 + }, + { + "epoch": 0.24, + "learning_rate": 1.7847824669236643e-05, + "loss": 0.3046, + "step": 2984 + }, + { + "epoch": 0.24, + "learning_rate": 1.7846234058027207e-05, + "loss": 0.4787, + "step": 2985 + }, + { + "epoch": 0.24, + "learning_rate": 1.7844642930181008e-05, + "loss": 0.5216, + "step": 2986 + }, + { + "epoch": 0.24, + "learning_rate": 1.7843051285802823e-05, + "loss": 0.3974, + "step": 2987 + }, + { + "epoch": 0.24, + "learning_rate": 1.7841459124997445e-05, + "loss": 0.5136, + "step": 2988 + }, + { + "epoch": 0.24, + "learning_rate": 1.7839866447869717e-05, + "loss": 0.4093, + "step": 2989 + }, + { + "epoch": 0.24, + "learning_rate": 1.7838273254524505e-05, + "loss": 0.3695, + "step": 2990 + }, + { + "epoch": 0.24, + "learning_rate": 1.7836679545066712e-05, + "loss": 0.373, + "step": 2991 + }, + { + "epoch": 0.24, + "learning_rate": 1.7835085319601283e-05, + "loss": 0.3775, + "step": 2992 + }, + { + "epoch": 0.24, + "learning_rate": 1.783349057823318e-05, + "loss": 0.4879, + "step": 2993 + }, + { + "epoch": 0.24, + "learning_rate": 1.783189532106742e-05, + "loss": 0.3474, + "step": 2994 + }, + { + "epoch": 0.24, + "learning_rate": 1.783029954820904e-05, + "loss": 0.4347, + "step": 2995 + }, + { + "epoch": 0.24, + "learning_rate": 1.7828703259763107e-05, + "loss": 0.3329, + "step": 2996 + }, + { + "epoch": 0.24, + "learning_rate": 1.782710645583473e-05, + "loss": 0.4159, + "step": 2997 + }, + { + "epoch": 0.24, + "learning_rate": 1.7825509136529065e-05, + "loss": 0.532, + "step": 2998 + }, + { + "epoch": 0.24, + "learning_rate": 1.782391130195127e-05, + "loss": 0.3672, + "step": 2999 + }, + { + "epoch": 0.24, + "learning_rate": 1.7822312952206565e-05, + "loss": 0.4616, + "step": 3000 + }, + { + "epoch": 0.24, + "learning_rate": 1.782071408740019e-05, + "loss": 0.3994, + "step": 3001 + }, + { + "epoch": 0.24, + "learning_rate": 1.781911470763742e-05, + "loss": 0.4838, + "step": 3002 + }, + { + "epoch": 0.24, + "learning_rate": 1.7817514813023577e-05, + "loss": 0.4772, + "step": 3003 + }, + { + "epoch": 0.24, + "learning_rate": 1.781591440366399e-05, + "loss": 0.3322, + "step": 3004 + }, + { + "epoch": 0.24, + "learning_rate": 1.7814313479664054e-05, + "loss": 0.3985, + "step": 3005 + }, + { + "epoch": 0.24, + "learning_rate": 1.781271204112917e-05, + "loss": 0.3948, + "step": 3006 + }, + { + "epoch": 0.24, + "learning_rate": 1.7811110088164797e-05, + "loss": 0.3819, + "step": 3007 + }, + { + "epoch": 0.24, + "learning_rate": 1.7809507620876406e-05, + "loss": 0.2907, + "step": 3008 + }, + { + "epoch": 0.24, + "learning_rate": 1.7807904639369512e-05, + "loss": 0.4749, + "step": 3009 + }, + { + "epoch": 0.24, + "learning_rate": 1.7806301143749672e-05, + "loss": 0.3855, + "step": 3010 + }, + { + "epoch": 0.24, + "learning_rate": 1.780469713412246e-05, + "loss": 0.4006, + "step": 3011 + }, + { + "epoch": 0.24, + "learning_rate": 1.78030926105935e-05, + "loss": 0.3709, + "step": 3012 + }, + { + "epoch": 0.24, + "learning_rate": 1.7801487573268433e-05, + "loss": 0.3722, + "step": 3013 + }, + { + "epoch": 0.24, + "learning_rate": 1.7799882022252948e-05, + "loss": 0.368, + "step": 3014 + }, + { + "epoch": 0.24, + "learning_rate": 1.7798275957652764e-05, + "loss": 0.4309, + "step": 3015 + }, + { + "epoch": 0.24, + "learning_rate": 1.779666937957363e-05, + "loss": 0.3555, + "step": 3016 + }, + { + "epoch": 0.24, + "learning_rate": 1.7795062288121335e-05, + "loss": 0.3699, + "step": 3017 + }, + { + "epoch": 0.24, + "learning_rate": 1.7793454683401692e-05, + "loss": 0.348, + "step": 3018 + }, + { + "epoch": 0.24, + "learning_rate": 1.779184656552056e-05, + "loss": 0.3151, + "step": 3019 + }, + { + "epoch": 0.24, + "learning_rate": 1.7790237934583824e-05, + "loss": 0.3503, + "step": 3020 + }, + { + "epoch": 0.24, + "learning_rate": 1.7788628790697404e-05, + "loss": 0.3815, + "step": 3021 + }, + { + "epoch": 0.24, + "learning_rate": 1.7787019133967252e-05, + "loss": 0.2979, + "step": 3022 + }, + { + "epoch": 0.24, + "learning_rate": 1.778540896449936e-05, + "loss": 0.5024, + "step": 3023 + }, + { + "epoch": 0.24, + "learning_rate": 1.778379828239975e-05, + "loss": 0.3902, + "step": 3024 + }, + { + "epoch": 0.24, + "learning_rate": 1.778218708777448e-05, + "loss": 0.3476, + "step": 3025 + }, + { + "epoch": 0.24, + "learning_rate": 1.7780575380729626e-05, + "loss": 0.3676, + "step": 3026 + }, + { + "epoch": 0.24, + "learning_rate": 1.777896316137133e-05, + "loss": 0.4076, + "step": 3027 + }, + { + "epoch": 0.24, + "learning_rate": 1.7777350429805734e-05, + "loss": 0.3099, + "step": 3028 + }, + { + "epoch": 0.24, + "learning_rate": 1.777573718613904e-05, + "loss": 0.4164, + "step": 3029 + }, + { + "epoch": 0.24, + "learning_rate": 1.7774123430477464e-05, + "loss": 0.4115, + "step": 3030 + }, + { + "epoch": 0.24, + "learning_rate": 1.7772509162927266e-05, + "loss": 0.3067, + "step": 3031 + }, + { + "epoch": 0.24, + "learning_rate": 1.7770894383594737e-05, + "loss": 0.4029, + "step": 3032 + }, + { + "epoch": 0.24, + "learning_rate": 1.7769279092586205e-05, + "loss": 0.3797, + "step": 3033 + }, + { + "epoch": 0.24, + "learning_rate": 1.776766329000803e-05, + "loss": 0.3247, + "step": 3034 + }, + { + "epoch": 0.24, + "learning_rate": 1.7766046975966603e-05, + "loss": 0.3948, + "step": 3035 + }, + { + "epoch": 0.24, + "learning_rate": 1.7764430150568347e-05, + "loss": 0.4321, + "step": 3036 + }, + { + "epoch": 0.24, + "learning_rate": 1.776281281391973e-05, + "loss": 0.3691, + "step": 3037 + }, + { + "epoch": 0.24, + "learning_rate": 1.776119496612724e-05, + "loss": 0.4673, + "step": 3038 + }, + { + "epoch": 0.24, + "learning_rate": 1.7759576607297405e-05, + "loss": 0.4106, + "step": 3039 + }, + { + "epoch": 0.24, + "learning_rate": 1.7757957737536785e-05, + "loss": 0.4264, + "step": 3040 + }, + { + "epoch": 0.24, + "learning_rate": 1.775633835695198e-05, + "loss": 0.4524, + "step": 3041 + }, + { + "epoch": 0.24, + "learning_rate": 1.7754718465649618e-05, + "loss": 0.4278, + "step": 3042 + }, + { + "epoch": 0.24, + "learning_rate": 1.7753098063736355e-05, + "loss": 0.4345, + "step": 3043 + }, + { + "epoch": 0.24, + "learning_rate": 1.775147715131889e-05, + "loss": 0.4714, + "step": 3044 + }, + { + "epoch": 0.24, + "learning_rate": 1.7749855728503952e-05, + "loss": 0.3413, + "step": 3045 + }, + { + "epoch": 0.24, + "learning_rate": 1.7748233795398308e-05, + "loss": 0.423, + "step": 3046 + }, + { + "epoch": 0.24, + "learning_rate": 1.7746611352108744e-05, + "loss": 0.3827, + "step": 3047 + }, + { + "epoch": 0.24, + "learning_rate": 1.7744988398742102e-05, + "loss": 0.3788, + "step": 3048 + }, + { + "epoch": 0.24, + "learning_rate": 1.7743364935405238e-05, + "loss": 0.4545, + "step": 3049 + }, + { + "epoch": 0.24, + "learning_rate": 1.7741740962205053e-05, + "loss": 0.2418, + "step": 3050 + }, + { + "epoch": 0.24, + "learning_rate": 1.7740116479248474e-05, + "loss": 0.372, + "step": 3051 + }, + { + "epoch": 0.24, + "learning_rate": 1.773849148664247e-05, + "loss": 0.4185, + "step": 3052 + }, + { + "epoch": 0.24, + "learning_rate": 1.773686598449404e-05, + "loss": 0.3968, + "step": 3053 + }, + { + "epoch": 0.24, + "learning_rate": 1.7735239972910208e-05, + "loss": 0.3759, + "step": 3054 + }, + { + "epoch": 0.24, + "learning_rate": 1.7733613451998043e-05, + "loss": 0.3525, + "step": 3055 + }, + { + "epoch": 0.24, + "learning_rate": 1.7731986421864645e-05, + "loss": 0.4577, + "step": 3056 + }, + { + "epoch": 0.24, + "learning_rate": 1.7730358882617148e-05, + "loss": 0.5591, + "step": 3057 + }, + { + "epoch": 0.24, + "learning_rate": 1.772873083436271e-05, + "loss": 0.3295, + "step": 3058 + }, + { + "epoch": 0.24, + "learning_rate": 1.7727102277208538e-05, + "loss": 0.3361, + "step": 3059 + }, + { + "epoch": 0.24, + "learning_rate": 1.772547321126186e-05, + "loss": 0.3554, + "step": 3060 + }, + { + "epoch": 0.24, + "learning_rate": 1.7723843636629945e-05, + "loss": 0.4803, + "step": 3061 + }, + { + "epoch": 0.24, + "learning_rate": 1.772221355342009e-05, + "loss": 0.4, + "step": 3062 + }, + { + "epoch": 0.24, + "learning_rate": 1.7720582961739628e-05, + "loss": 0.4143, + "step": 3063 + }, + { + "epoch": 0.24, + "learning_rate": 1.771895186169593e-05, + "loss": 0.3406, + "step": 3064 + }, + { + "epoch": 0.24, + "learning_rate": 1.7717320253396393e-05, + "loss": 0.3848, + "step": 3065 + }, + { + "epoch": 0.24, + "learning_rate": 1.771568813694845e-05, + "loss": 0.3823, + "step": 3066 + }, + { + "epoch": 0.24, + "learning_rate": 1.771405551245957e-05, + "loss": 0.3312, + "step": 3067 + }, + { + "epoch": 0.24, + "learning_rate": 1.771242238003725e-05, + "loss": 0.4434, + "step": 3068 + }, + { + "epoch": 0.24, + "learning_rate": 1.7710788739789025e-05, + "loss": 0.3147, + "step": 3069 + }, + { + "epoch": 0.24, + "learning_rate": 1.7709154591822466e-05, + "loss": 0.3793, + "step": 3070 + }, + { + "epoch": 0.24, + "learning_rate": 1.770751993624517e-05, + "loss": 0.374, + "step": 3071 + }, + { + "epoch": 0.24, + "learning_rate": 1.770588477316477e-05, + "loss": 0.3901, + "step": 3072 + }, + { + "epoch": 0.24, + "learning_rate": 1.770424910268894e-05, + "loss": 0.3581, + "step": 3073 + }, + { + "epoch": 0.24, + "learning_rate": 1.7702612924925377e-05, + "loss": 0.417, + "step": 3074 + }, + { + "epoch": 0.24, + "learning_rate": 1.7700976239981815e-05, + "loss": 0.4447, + "step": 3075 + }, + { + "epoch": 0.24, + "learning_rate": 1.769933904796602e-05, + "loss": 0.4164, + "step": 3076 + }, + { + "epoch": 0.24, + "learning_rate": 1.76977013489858e-05, + "loss": 0.3631, + "step": 3077 + }, + { + "epoch": 0.24, + "learning_rate": 1.7696063143148982e-05, + "loss": 0.3354, + "step": 3078 + }, + { + "epoch": 0.24, + "learning_rate": 1.7694424430563436e-05, + "loss": 0.4935, + "step": 3079 + }, + { + "epoch": 0.24, + "learning_rate": 1.769278521133707e-05, + "loss": 0.3232, + "step": 3080 + }, + { + "epoch": 0.24, + "learning_rate": 1.769114548557781e-05, + "loss": 0.3154, + "step": 3081 + }, + { + "epoch": 0.24, + "learning_rate": 1.768950525339362e-05, + "loss": 0.3265, + "step": 3082 + }, + { + "epoch": 0.24, + "learning_rate": 1.7687864514892516e-05, + "loss": 0.3993, + "step": 3083 + }, + { + "epoch": 0.24, + "learning_rate": 1.7686223270182524e-05, + "loss": 0.4531, + "step": 3084 + }, + { + "epoch": 0.24, + "learning_rate": 1.7684581519371714e-05, + "loss": 0.3634, + "step": 3085 + }, + { + "epoch": 0.24, + "learning_rate": 1.768293926256819e-05, + "loss": 0.3712, + "step": 3086 + }, + { + "epoch": 0.24, + "learning_rate": 1.7681296499880077e-05, + "loss": 0.3728, + "step": 3087 + }, + { + "epoch": 0.24, + "learning_rate": 1.767965323141555e-05, + "loss": 0.3342, + "step": 3088 + }, + { + "epoch": 0.24, + "learning_rate": 1.7678009457282816e-05, + "loss": 0.3141, + "step": 3089 + }, + { + "epoch": 0.24, + "learning_rate": 1.7676365177590097e-05, + "loss": 0.3203, + "step": 3090 + }, + { + "epoch": 0.24, + "learning_rate": 1.7674720392445672e-05, + "loss": 0.3452, + "step": 3091 + }, + { + "epoch": 0.24, + "learning_rate": 1.7673075101957837e-05, + "loss": 0.5555, + "step": 3092 + }, + { + "epoch": 0.25, + "learning_rate": 1.7671429306234924e-05, + "loss": 0.4385, + "step": 3093 + }, + { + "epoch": 0.25, + "learning_rate": 1.7669783005385305e-05, + "loss": 0.3241, + "step": 3094 + }, + { + "epoch": 0.25, + "learning_rate": 1.766813619951738e-05, + "loss": 0.4238, + "step": 3095 + }, + { + "epoch": 0.25, + "learning_rate": 1.7666488888739587e-05, + "loss": 0.4025, + "step": 3096 + }, + { + "epoch": 0.25, + "learning_rate": 1.7664841073160383e-05, + "loss": 0.4866, + "step": 3097 + }, + { + "epoch": 0.25, + "learning_rate": 1.766319275288828e-05, + "loss": 0.3943, + "step": 3098 + }, + { + "epoch": 0.25, + "learning_rate": 1.7661543928031802e-05, + "loss": 0.3076, + "step": 3099 + }, + { + "epoch": 0.25, + "learning_rate": 1.7659894598699527e-05, + "loss": 0.4513, + "step": 3100 + }, + { + "epoch": 0.25, + "learning_rate": 1.765824476500005e-05, + "loss": 0.3972, + "step": 3101 + }, + { + "epoch": 0.25, + "learning_rate": 1.7656594427041997e-05, + "loss": 0.4178, + "step": 3102 + }, + { + "epoch": 0.25, + "learning_rate": 1.765494358493405e-05, + "loss": 0.4416, + "step": 3103 + }, + { + "epoch": 0.25, + "learning_rate": 1.7653292238784897e-05, + "loss": 0.3538, + "step": 3104 + }, + { + "epoch": 0.25, + "learning_rate": 1.7651640388703275e-05, + "loss": 0.429, + "step": 3105 + }, + { + "epoch": 0.25, + "learning_rate": 1.7649988034797952e-05, + "loss": 0.3993, + "step": 3106 + }, + { + "epoch": 0.25, + "learning_rate": 1.7648335177177725e-05, + "loss": 0.3443, + "step": 3107 + }, + { + "epoch": 0.25, + "learning_rate": 1.764668181595143e-05, + "loss": 0.3607, + "step": 3108 + }, + { + "epoch": 0.25, + "learning_rate": 1.764502795122793e-05, + "loss": 0.5418, + "step": 3109 + }, + { + "epoch": 0.25, + "learning_rate": 1.7643373583116123e-05, + "loss": 0.4476, + "step": 3110 + }, + { + "epoch": 0.25, + "learning_rate": 1.7641718711724947e-05, + "loss": 0.3995, + "step": 3111 + }, + { + "epoch": 0.25, + "learning_rate": 1.764006333716336e-05, + "loss": 0.3261, + "step": 3112 + }, + { + "epoch": 0.25, + "learning_rate": 1.7638407459540364e-05, + "loss": 0.4312, + "step": 3113 + }, + { + "epoch": 0.25, + "learning_rate": 1.7636751078964995e-05, + "loss": 0.4085, + "step": 3114 + }, + { + "epoch": 0.25, + "learning_rate": 1.763509419554631e-05, + "loss": 0.3446, + "step": 3115 + }, + { + "epoch": 0.25, + "learning_rate": 1.763343680939341e-05, + "loss": 0.3512, + "step": 3116 + }, + { + "epoch": 0.25, + "learning_rate": 1.7631778920615427e-05, + "loss": 0.4798, + "step": 3117 + }, + { + "epoch": 0.25, + "learning_rate": 1.7630120529321518e-05, + "loss": 0.4431, + "step": 3118 + }, + { + "epoch": 0.25, + "learning_rate": 1.7628461635620895e-05, + "loss": 0.3321, + "step": 3119 + }, + { + "epoch": 0.25, + "learning_rate": 1.7626802239622772e-05, + "loss": 0.4237, + "step": 3120 + }, + { + "epoch": 0.25, + "learning_rate": 1.7625142341436423e-05, + "loss": 0.3802, + "step": 3121 + }, + { + "epoch": 0.25, + "learning_rate": 1.762348194117114e-05, + "loss": 0.3823, + "step": 3122 + }, + { + "epoch": 0.25, + "learning_rate": 1.7621821038936257e-05, + "loss": 0.4927, + "step": 3123 + }, + { + "epoch": 0.25, + "learning_rate": 1.7620159634841127e-05, + "loss": 0.48, + "step": 3124 + }, + { + "epoch": 0.25, + "learning_rate": 1.761849772899515e-05, + "loss": 0.3875, + "step": 3125 + }, + { + "epoch": 0.25, + "learning_rate": 1.7616835321507757e-05, + "loss": 0.3448, + "step": 3126 + }, + { + "epoch": 0.25, + "learning_rate": 1.761517241248841e-05, + "loss": 0.2883, + "step": 3127 + }, + { + "epoch": 0.25, + "learning_rate": 1.76135090020466e-05, + "loss": 0.3491, + "step": 3128 + }, + { + "epoch": 0.25, + "learning_rate": 1.7611845090291858e-05, + "loss": 0.4459, + "step": 3129 + }, + { + "epoch": 0.25, + "learning_rate": 1.761018067733374e-05, + "loss": 0.4104, + "step": 3130 + }, + { + "epoch": 0.25, + "learning_rate": 1.7608515763281843e-05, + "loss": 0.3821, + "step": 3131 + }, + { + "epoch": 0.25, + "learning_rate": 1.760685034824579e-05, + "loss": 0.4513, + "step": 3132 + }, + { + "epoch": 0.25, + "learning_rate": 1.760518443233525e-05, + "loss": 0.3931, + "step": 3133 + }, + { + "epoch": 0.25, + "learning_rate": 1.7603518015659905e-05, + "loss": 0.4582, + "step": 3134 + }, + { + "epoch": 0.25, + "learning_rate": 1.7601851098329484e-05, + "loss": 0.3846, + "step": 3135 + }, + { + "epoch": 0.25, + "learning_rate": 1.7600183680453745e-05, + "loss": 0.3781, + "step": 3136 + }, + { + "epoch": 0.25, + "learning_rate": 1.7598515762142484e-05, + "loss": 0.3236, + "step": 3137 + }, + { + "epoch": 0.25, + "learning_rate": 1.759684734350552e-05, + "loss": 0.4432, + "step": 3138 + }, + { + "epoch": 0.25, + "learning_rate": 1.759517842465271e-05, + "loss": 0.3234, + "step": 3139 + }, + { + "epoch": 0.25, + "learning_rate": 1.759350900569395e-05, + "loss": 0.4111, + "step": 3140 + }, + { + "epoch": 0.25, + "learning_rate": 1.759183908673916e-05, + "loss": 0.3638, + "step": 3141 + }, + { + "epoch": 0.25, + "learning_rate": 1.759016866789829e-05, + "loss": 0.3065, + "step": 3142 + }, + { + "epoch": 0.25, + "learning_rate": 1.7588497749281338e-05, + "loss": 0.3657, + "step": 3143 + }, + { + "epoch": 0.25, + "learning_rate": 1.7586826330998324e-05, + "loss": 0.3672, + "step": 3144 + }, + { + "epoch": 0.25, + "learning_rate": 1.7585154413159304e-05, + "loss": 0.3084, + "step": 3145 + }, + { + "epoch": 0.25, + "learning_rate": 1.758348199587436e-05, + "loss": 0.2902, + "step": 3146 + }, + { + "epoch": 0.25, + "learning_rate": 1.7581809079253616e-05, + "loss": 0.465, + "step": 3147 + }, + { + "epoch": 0.25, + "learning_rate": 1.7580135663407226e-05, + "loss": 0.4023, + "step": 3148 + }, + { + "epoch": 0.25, + "learning_rate": 1.7578461748445374e-05, + "loss": 0.3883, + "step": 3149 + }, + { + "epoch": 0.25, + "learning_rate": 1.7576787334478283e-05, + "loss": 0.4104, + "step": 3150 + }, + { + "epoch": 0.25, + "learning_rate": 1.7575112421616203e-05, + "loss": 0.35, + "step": 3151 + }, + { + "epoch": 0.25, + "learning_rate": 1.757343700996942e-05, + "loss": 0.4289, + "step": 3152 + }, + { + "epoch": 0.25, + "learning_rate": 1.757176109964825e-05, + "loss": 0.4423, + "step": 3153 + }, + { + "epoch": 0.25, + "learning_rate": 1.7570084690763042e-05, + "loss": 0.4813, + "step": 3154 + }, + { + "epoch": 0.25, + "learning_rate": 1.7568407783424187e-05, + "loss": 0.3614, + "step": 3155 + }, + { + "epoch": 0.25, + "learning_rate": 1.7566730377742093e-05, + "loss": 0.4607, + "step": 3156 + }, + { + "epoch": 0.25, + "learning_rate": 1.7565052473827213e-05, + "loss": 0.3242, + "step": 3157 + }, + { + "epoch": 0.25, + "learning_rate": 1.7563374071790028e-05, + "loss": 0.3291, + "step": 3158 + }, + { + "epoch": 0.25, + "learning_rate": 1.7561695171741054e-05, + "loss": 0.3982, + "step": 3159 + }, + { + "epoch": 0.25, + "learning_rate": 1.7560015773790837e-05, + "loss": 0.409, + "step": 3160 + }, + { + "epoch": 0.25, + "learning_rate": 1.7558335878049955e-05, + "loss": 0.5179, + "step": 3161 + }, + { + "epoch": 0.25, + "learning_rate": 1.7556655484629028e-05, + "loss": 0.3912, + "step": 3162 + }, + { + "epoch": 0.25, + "learning_rate": 1.7554974593638697e-05, + "loss": 0.3294, + "step": 3163 + }, + { + "epoch": 0.25, + "learning_rate": 1.755329320518964e-05, + "loss": 0.3635, + "step": 3164 + }, + { + "epoch": 0.25, + "learning_rate": 1.7551611319392573e-05, + "loss": 0.4657, + "step": 3165 + }, + { + "epoch": 0.25, + "learning_rate": 1.7549928936358232e-05, + "loss": 0.3742, + "step": 3166 + }, + { + "epoch": 0.25, + "learning_rate": 1.75482460561974e-05, + "loss": 0.4341, + "step": 3167 + }, + { + "epoch": 0.25, + "learning_rate": 1.7546562679020884e-05, + "loss": 0.276, + "step": 3168 + }, + { + "epoch": 0.25, + "learning_rate": 1.7544878804939528e-05, + "loss": 0.3424, + "step": 3169 + }, + { + "epoch": 0.25, + "learning_rate": 1.7543194434064208e-05, + "loss": 0.36, + "step": 3170 + }, + { + "epoch": 0.25, + "learning_rate": 1.754150956650583e-05, + "loss": 0.3574, + "step": 3171 + }, + { + "epoch": 0.25, + "learning_rate": 1.753982420237533e-05, + "loss": 0.4456, + "step": 3172 + }, + { + "epoch": 0.25, + "learning_rate": 1.753813834178369e-05, + "loss": 0.4968, + "step": 3173 + }, + { + "epoch": 0.25, + "learning_rate": 1.753645198484191e-05, + "loss": 0.3409, + "step": 3174 + }, + { + "epoch": 0.25, + "learning_rate": 1.753476513166103e-05, + "loss": 0.3411, + "step": 3175 + }, + { + "epoch": 0.25, + "learning_rate": 1.7533077782352123e-05, + "loss": 0.3484, + "step": 3176 + }, + { + "epoch": 0.25, + "learning_rate": 1.753138993702629e-05, + "loss": 0.3422, + "step": 3177 + }, + { + "epoch": 0.25, + "learning_rate": 1.752970159579467e-05, + "loss": 0.4097, + "step": 3178 + }, + { + "epoch": 0.25, + "learning_rate": 1.7528012758768426e-05, + "loss": 0.4289, + "step": 3179 + }, + { + "epoch": 0.25, + "learning_rate": 1.7526323426058767e-05, + "loss": 0.4604, + "step": 3180 + }, + { + "epoch": 0.25, + "learning_rate": 1.7524633597776923e-05, + "loss": 0.4859, + "step": 3181 + }, + { + "epoch": 0.25, + "learning_rate": 1.7522943274034165e-05, + "loss": 0.4414, + "step": 3182 + }, + { + "epoch": 0.25, + "learning_rate": 1.752125245494179e-05, + "loss": 0.4194, + "step": 3183 + }, + { + "epoch": 0.25, + "learning_rate": 1.751956114061113e-05, + "loss": 0.4934, + "step": 3184 + }, + { + "epoch": 0.25, + "learning_rate": 1.751786933115355e-05, + "loss": 0.4549, + "step": 3185 + }, + { + "epoch": 0.25, + "learning_rate": 1.751617702668045e-05, + "loss": 0.3434, + "step": 3186 + }, + { + "epoch": 0.25, + "learning_rate": 1.751448422730326e-05, + "loss": 0.4322, + "step": 3187 + }, + { + "epoch": 0.25, + "learning_rate": 1.7512790933133435e-05, + "loss": 0.4928, + "step": 3188 + }, + { + "epoch": 0.25, + "learning_rate": 1.7511097144282482e-05, + "loss": 0.4309, + "step": 3189 + }, + { + "epoch": 0.25, + "learning_rate": 1.7509402860861923e-05, + "loss": 0.4595, + "step": 3190 + }, + { + "epoch": 0.25, + "learning_rate": 1.7507708082983313e-05, + "loss": 0.3919, + "step": 3191 + }, + { + "epoch": 0.25, + "learning_rate": 1.7506012810758254e-05, + "loss": 0.5459, + "step": 3192 + }, + { + "epoch": 0.25, + "learning_rate": 1.750431704429837e-05, + "loss": 0.4813, + "step": 3193 + }, + { + "epoch": 0.25, + "learning_rate": 1.7502620783715316e-05, + "loss": 0.3879, + "step": 3194 + }, + { + "epoch": 0.25, + "learning_rate": 1.7500924029120782e-05, + "loss": 0.4372, + "step": 3195 + }, + { + "epoch": 0.25, + "learning_rate": 1.7499226780626494e-05, + "loss": 0.3959, + "step": 3196 + }, + { + "epoch": 0.25, + "learning_rate": 1.7497529038344208e-05, + "loss": 0.3722, + "step": 3197 + }, + { + "epoch": 0.25, + "learning_rate": 1.7495830802385707e-05, + "loss": 0.4584, + "step": 3198 + }, + { + "epoch": 0.25, + "learning_rate": 1.7494132072862818e-05, + "loss": 0.3352, + "step": 3199 + }, + { + "epoch": 0.25, + "learning_rate": 1.7492432849887387e-05, + "loss": 0.335, + "step": 3200 + }, + { + "epoch": 0.25, + "learning_rate": 1.749073313357131e-05, + "loss": 0.4428, + "step": 3201 + }, + { + "epoch": 0.25, + "learning_rate": 1.7489032924026496e-05, + "loss": 0.3078, + "step": 3202 + }, + { + "epoch": 0.25, + "learning_rate": 1.74873322213649e-05, + "loss": 0.3032, + "step": 3203 + }, + { + "epoch": 0.25, + "learning_rate": 1.7485631025698504e-05, + "loss": 0.5853, + "step": 3204 + }, + { + "epoch": 0.25, + "learning_rate": 1.7483929337139326e-05, + "loss": 0.3252, + "step": 3205 + }, + { + "epoch": 0.25, + "learning_rate": 1.748222715579941e-05, + "loss": 0.2807, + "step": 3206 + }, + { + "epoch": 0.25, + "learning_rate": 1.7480524481790835e-05, + "loss": 0.4971, + "step": 3207 + }, + { + "epoch": 0.25, + "learning_rate": 1.7478821315225717e-05, + "loss": 0.3704, + "step": 3208 + }, + { + "epoch": 0.25, + "learning_rate": 1.7477117656216206e-05, + "loss": 0.5769, + "step": 3209 + }, + { + "epoch": 0.25, + "learning_rate": 1.7475413504874474e-05, + "loss": 0.3344, + "step": 3210 + }, + { + "epoch": 0.25, + "learning_rate": 1.7473708861312727e-05, + "loss": 0.3967, + "step": 3211 + }, + { + "epoch": 0.25, + "learning_rate": 1.7472003725643215e-05, + "loss": 0.4552, + "step": 3212 + }, + { + "epoch": 0.25, + "learning_rate": 1.747029809797821e-05, + "loss": 0.3521, + "step": 3213 + }, + { + "epoch": 0.25, + "learning_rate": 1.7468591978430024e-05, + "loss": 0.3377, + "step": 3214 + }, + { + "epoch": 0.25, + "learning_rate": 1.746688536711099e-05, + "loss": 0.4233, + "step": 3215 + }, + { + "epoch": 0.25, + "learning_rate": 1.7465178264133482e-05, + "loss": 0.427, + "step": 3216 + }, + { + "epoch": 0.25, + "learning_rate": 1.7463470669609907e-05, + "loss": 0.3631, + "step": 3217 + }, + { + "epoch": 0.25, + "learning_rate": 1.74617625836527e-05, + "loss": 0.3374, + "step": 3218 + }, + { + "epoch": 0.26, + "learning_rate": 1.746005400637433e-05, + "loss": 0.3726, + "step": 3219 + }, + { + "epoch": 0.26, + "learning_rate": 1.74583449378873e-05, + "loss": 0.4837, + "step": 3220 + }, + { + "epoch": 0.26, + "learning_rate": 1.7456635378304143e-05, + "loss": 0.3562, + "step": 3221 + }, + { + "epoch": 0.26, + "learning_rate": 1.7454925327737426e-05, + "loss": 0.4718, + "step": 3222 + }, + { + "epoch": 0.26, + "learning_rate": 1.7453214786299746e-05, + "loss": 0.4017, + "step": 3223 + }, + { + "epoch": 0.26, + "learning_rate": 1.7451503754103735e-05, + "loss": 0.3534, + "step": 3224 + }, + { + "epoch": 0.26, + "learning_rate": 1.7449792231262056e-05, + "loss": 0.4034, + "step": 3225 + }, + { + "epoch": 0.26, + "learning_rate": 1.7448080217887403e-05, + "loss": 0.4501, + "step": 3226 + }, + { + "epoch": 0.26, + "learning_rate": 1.7446367714092508e-05, + "loss": 0.4466, + "step": 3227 + }, + { + "epoch": 0.26, + "learning_rate": 1.7444654719990128e-05, + "loss": 0.3036, + "step": 3228 + }, + { + "epoch": 0.26, + "learning_rate": 1.7442941235693058e-05, + "loss": 0.4375, + "step": 3229 + }, + { + "epoch": 0.26, + "learning_rate": 1.744122726131412e-05, + "loss": 0.4218, + "step": 3230 + }, + { + "epoch": 0.26, + "learning_rate": 1.7439512796966165e-05, + "loss": 0.4227, + "step": 3231 + }, + { + "epoch": 0.26, + "learning_rate": 1.7437797842762098e-05, + "loss": 0.2846, + "step": 3232 + }, + { + "epoch": 0.26, + "learning_rate": 1.743608239881483e-05, + "loss": 0.3826, + "step": 3233 + }, + { + "epoch": 0.26, + "learning_rate": 1.7434366465237312e-05, + "loss": 0.3177, + "step": 3234 + }, + { + "epoch": 0.26, + "learning_rate": 1.7432650042142535e-05, + "loss": 0.4252, + "step": 3235 + }, + { + "epoch": 0.26, + "learning_rate": 1.743093312964352e-05, + "loss": 0.495, + "step": 3236 + }, + { + "epoch": 0.26, + "learning_rate": 1.742921572785331e-05, + "loss": 0.5606, + "step": 3237 + }, + { + "epoch": 0.26, + "learning_rate": 1.7427497836884995e-05, + "loss": 0.5505, + "step": 3238 + }, + { + "epoch": 0.26, + "learning_rate": 1.7425779456851683e-05, + "loss": 0.39, + "step": 3239 + }, + { + "epoch": 0.26, + "learning_rate": 1.7424060587866526e-05, + "loss": 0.5537, + "step": 3240 + }, + { + "epoch": 0.26, + "learning_rate": 1.74223412300427e-05, + "loss": 0.4516, + "step": 3241 + }, + { + "epoch": 0.26, + "learning_rate": 1.7420621383493423e-05, + "loss": 0.3031, + "step": 3242 + }, + { + "epoch": 0.26, + "learning_rate": 1.7418901048331927e-05, + "loss": 0.4465, + "step": 3243 + }, + { + "epoch": 0.26, + "learning_rate": 1.7417180224671497e-05, + "loss": 0.4056, + "step": 3244 + }, + { + "epoch": 0.26, + "learning_rate": 1.741545891262544e-05, + "loss": 0.4393, + "step": 3245 + }, + { + "epoch": 0.26, + "learning_rate": 1.7413737112307092e-05, + "loss": 0.3928, + "step": 3246 + }, + { + "epoch": 0.26, + "learning_rate": 1.741201482382983e-05, + "loss": 0.3437, + "step": 3247 + }, + { + "epoch": 0.26, + "learning_rate": 1.7410292047307054e-05, + "loss": 0.3645, + "step": 3248 + }, + { + "epoch": 0.26, + "learning_rate": 1.7408568782852204e-05, + "loss": 0.3553, + "step": 3249 + }, + { + "epoch": 0.26, + "learning_rate": 1.7406845030578747e-05, + "loss": 0.4897, + "step": 3250 + }, + { + "epoch": 0.26, + "learning_rate": 1.7405120790600185e-05, + "loss": 0.4219, + "step": 3251 + }, + { + "epoch": 0.26, + "learning_rate": 1.740339606303005e-05, + "loss": 0.4773, + "step": 3252 + }, + { + "epoch": 0.26, + "learning_rate": 1.7401670847981906e-05, + "loss": 0.4006, + "step": 3253 + }, + { + "epoch": 0.26, + "learning_rate": 1.7399945145569353e-05, + "loss": 0.3857, + "step": 3254 + }, + { + "epoch": 0.26, + "learning_rate": 1.7398218955906017e-05, + "loss": 0.3951, + "step": 3255 + }, + { + "epoch": 0.26, + "learning_rate": 1.7396492279105562e-05, + "loss": 0.379, + "step": 3256 + }, + { + "epoch": 0.26, + "learning_rate": 1.7394765115281678e-05, + "loss": 0.3867, + "step": 3257 + }, + { + "epoch": 0.26, + "learning_rate": 1.7393037464548094e-05, + "loss": 0.357, + "step": 3258 + }, + { + "epoch": 0.26, + "learning_rate": 1.7391309327018566e-05, + "loss": 0.3332, + "step": 3259 + }, + { + "epoch": 0.26, + "learning_rate": 1.7389580702806884e-05, + "loss": 0.3758, + "step": 3260 + }, + { + "epoch": 0.26, + "learning_rate": 1.7387851592026868e-05, + "loss": 0.3739, + "step": 3261 + }, + { + "epoch": 0.26, + "learning_rate": 1.738612199479237e-05, + "loss": 0.3985, + "step": 3262 + }, + { + "epoch": 0.26, + "learning_rate": 1.7384391911217283e-05, + "loss": 0.3876, + "step": 3263 + }, + { + "epoch": 0.26, + "learning_rate": 1.738266134141552e-05, + "loss": 0.4395, + "step": 3264 + }, + { + "epoch": 0.26, + "learning_rate": 1.738093028550103e-05, + "loss": 0.3177, + "step": 3265 + }, + { + "epoch": 0.26, + "learning_rate": 1.7379198743587794e-05, + "loss": 0.4019, + "step": 3266 + }, + { + "epoch": 0.26, + "learning_rate": 1.7377466715789828e-05, + "loss": 0.3905, + "step": 3267 + }, + { + "epoch": 0.26, + "learning_rate": 1.7375734202221174e-05, + "loss": 0.3716, + "step": 3268 + }, + { + "epoch": 0.26, + "learning_rate": 1.7374001202995918e-05, + "loss": 0.4072, + "step": 3269 + }, + { + "epoch": 0.26, + "learning_rate": 1.7372267718228163e-05, + "loss": 0.392, + "step": 3270 + }, + { + "epoch": 0.26, + "learning_rate": 1.7370533748032047e-05, + "loss": 0.3716, + "step": 3271 + }, + { + "epoch": 0.26, + "learning_rate": 1.7368799292521754e-05, + "loss": 0.2819, + "step": 3272 + }, + { + "epoch": 0.26, + "learning_rate": 1.736706435181148e-05, + "loss": 0.5185, + "step": 3273 + }, + { + "epoch": 0.26, + "learning_rate": 1.736532892601547e-05, + "loss": 0.3582, + "step": 3274 + }, + { + "epoch": 0.26, + "learning_rate": 1.7363593015247987e-05, + "loss": 0.474, + "step": 3275 + }, + { + "epoch": 0.26, + "learning_rate": 1.7361856619623338e-05, + "loss": 0.398, + "step": 3276 + }, + { + "epoch": 0.26, + "learning_rate": 1.736011973925585e-05, + "loss": 0.3113, + "step": 3277 + }, + { + "epoch": 0.26, + "learning_rate": 1.7358382374259895e-05, + "loss": 0.4075, + "step": 3278 + }, + { + "epoch": 0.26, + "learning_rate": 1.7356644524749867e-05, + "loss": 0.3786, + "step": 3279 + }, + { + "epoch": 0.26, + "learning_rate": 1.7354906190840194e-05, + "loss": 0.4366, + "step": 3280 + }, + { + "epoch": 0.26, + "learning_rate": 1.7353167372645337e-05, + "loss": 0.3858, + "step": 3281 + }, + { + "epoch": 0.26, + "learning_rate": 1.735142807027979e-05, + "loss": 0.3503, + "step": 3282 + }, + { + "epoch": 0.26, + "learning_rate": 1.734968828385808e-05, + "loss": 0.402, + "step": 3283 + }, + { + "epoch": 0.26, + "learning_rate": 1.7347948013494758e-05, + "loss": 0.4105, + "step": 3284 + }, + { + "epoch": 0.26, + "learning_rate": 1.7346207259304415e-05, + "loss": 0.4284, + "step": 3285 + }, + { + "epoch": 0.26, + "learning_rate": 1.7344466021401673e-05, + "loss": 0.4796, + "step": 3286 + }, + { + "epoch": 0.26, + "learning_rate": 1.734272429990118e-05, + "loss": 0.3375, + "step": 3287 + }, + { + "epoch": 0.26, + "learning_rate": 1.7340982094917627e-05, + "loss": 0.4194, + "step": 3288 + }, + { + "epoch": 0.26, + "learning_rate": 1.7339239406565723e-05, + "loss": 0.2992, + "step": 3289 + }, + { + "epoch": 0.26, + "learning_rate": 1.733749623496022e-05, + "loss": 0.3466, + "step": 3290 + }, + { + "epoch": 0.26, + "learning_rate": 1.7335752580215898e-05, + "loss": 0.3392, + "step": 3291 + }, + { + "epoch": 0.26, + "learning_rate": 1.733400844244756e-05, + "loss": 0.3791, + "step": 3292 + }, + { + "epoch": 0.26, + "learning_rate": 1.733226382177006e-05, + "loss": 0.3653, + "step": 3293 + }, + { + "epoch": 0.26, + "learning_rate": 1.7330518718298263e-05, + "loss": 0.4208, + "step": 3294 + }, + { + "epoch": 0.26, + "learning_rate": 1.7328773132147086e-05, + "loss": 0.3973, + "step": 3295 + }, + { + "epoch": 0.26, + "learning_rate": 1.732702706343146e-05, + "loss": 0.4315, + "step": 3296 + }, + { + "epoch": 0.26, + "learning_rate": 1.7325280512266357e-05, + "loss": 0.5514, + "step": 3297 + }, + { + "epoch": 0.26, + "learning_rate": 1.7323533478766777e-05, + "loss": 0.3315, + "step": 3298 + }, + { + "epoch": 0.26, + "learning_rate": 1.732178596304776e-05, + "loss": 0.3533, + "step": 3299 + }, + { + "epoch": 0.26, + "learning_rate": 1.7320037965224365e-05, + "loss": 0.3386, + "step": 3300 + }, + { + "epoch": 0.26, + "learning_rate": 1.731828948541169e-05, + "loss": 0.3585, + "step": 3301 + }, + { + "epoch": 0.26, + "learning_rate": 1.731654052372487e-05, + "loss": 0.3395, + "step": 3302 + }, + { + "epoch": 0.26, + "learning_rate": 1.731479108027906e-05, + "loss": 0.4566, + "step": 3303 + }, + { + "epoch": 0.26, + "learning_rate": 1.7313041155189454e-05, + "loss": 0.519, + "step": 3304 + }, + { + "epoch": 0.26, + "learning_rate": 1.7311290748571273e-05, + "loss": 0.3564, + "step": 3305 + }, + { + "epoch": 0.26, + "learning_rate": 1.7309539860539783e-05, + "loss": 0.3543, + "step": 3306 + }, + { + "epoch": 0.26, + "learning_rate": 1.7307788491210257e-05, + "loss": 0.3819, + "step": 3307 + }, + { + "epoch": 0.26, + "learning_rate": 1.7306036640698024e-05, + "loss": 0.3959, + "step": 3308 + }, + { + "epoch": 0.26, + "learning_rate": 1.7304284309118436e-05, + "loss": 0.5266, + "step": 3309 + }, + { + "epoch": 0.26, + "learning_rate": 1.7302531496586866e-05, + "loss": 0.4565, + "step": 3310 + }, + { + "epoch": 0.26, + "learning_rate": 1.730077820321874e-05, + "loss": 0.3276, + "step": 3311 + }, + { + "epoch": 0.26, + "learning_rate": 1.7299024429129497e-05, + "loss": 0.3711, + "step": 3312 + }, + { + "epoch": 0.26, + "learning_rate": 1.7297270174434613e-05, + "loss": 0.3365, + "step": 3313 + }, + { + "epoch": 0.26, + "learning_rate": 1.7295515439249608e-05, + "loss": 0.3959, + "step": 3314 + }, + { + "epoch": 0.26, + "learning_rate": 1.7293760223690008e-05, + "loss": 0.512, + "step": 3315 + }, + { + "epoch": 0.26, + "learning_rate": 1.729200452787139e-05, + "loss": 0.3925, + "step": 3316 + }, + { + "epoch": 0.26, + "learning_rate": 1.729024835190937e-05, + "loss": 0.2933, + "step": 3317 + }, + { + "epoch": 0.26, + "learning_rate": 1.7288491695919567e-05, + "loss": 0.2969, + "step": 3318 + }, + { + "epoch": 0.26, + "learning_rate": 1.728673456001766e-05, + "loss": 0.3919, + "step": 3319 + }, + { + "epoch": 0.26, + "learning_rate": 1.728497694431934e-05, + "loss": 0.3605, + "step": 3320 + }, + { + "epoch": 0.26, + "learning_rate": 1.7283218848940344e-05, + "loss": 0.3481, + "step": 3321 + }, + { + "epoch": 0.26, + "learning_rate": 1.728146027399643e-05, + "loss": 0.4478, + "step": 3322 + }, + { + "epoch": 0.26, + "learning_rate": 1.7279701219603394e-05, + "loss": 0.4366, + "step": 3323 + }, + { + "epoch": 0.26, + "learning_rate": 1.727794168587706e-05, + "loss": 0.3474, + "step": 3324 + }, + { + "epoch": 0.26, + "learning_rate": 1.7276181672933287e-05, + "loss": 0.403, + "step": 3325 + }, + { + "epoch": 0.26, + "learning_rate": 1.7274421180887958e-05, + "loss": 0.3663, + "step": 3326 + }, + { + "epoch": 0.26, + "learning_rate": 1.7272660209857e-05, + "loss": 0.3581, + "step": 3327 + }, + { + "epoch": 0.26, + "learning_rate": 1.727089875995636e-05, + "loss": 0.4596, + "step": 3328 + }, + { + "epoch": 0.26, + "learning_rate": 1.726913683130202e-05, + "loss": 0.4929, + "step": 3329 + }, + { + "epoch": 0.26, + "learning_rate": 1.7267374424009998e-05, + "loss": 0.3072, + "step": 3330 + }, + { + "epoch": 0.26, + "learning_rate": 1.726561153819634e-05, + "loss": 0.4292, + "step": 3331 + }, + { + "epoch": 0.26, + "learning_rate": 1.7263848173977122e-05, + "loss": 0.4261, + "step": 3332 + }, + { + "epoch": 0.26, + "learning_rate": 1.726208433146845e-05, + "loss": 0.3291, + "step": 3333 + }, + { + "epoch": 0.26, + "learning_rate": 1.726032001078647e-05, + "loss": 0.4102, + "step": 3334 + }, + { + "epoch": 0.26, + "learning_rate": 1.725855521204735e-05, + "loss": 0.3819, + "step": 3335 + }, + { + "epoch": 0.26, + "learning_rate": 1.7256789935367296e-05, + "loss": 0.3341, + "step": 3336 + }, + { + "epoch": 0.26, + "learning_rate": 1.7255024180862546e-05, + "loss": 0.307, + "step": 3337 + }, + { + "epoch": 0.26, + "learning_rate": 1.7253257948649357e-05, + "loss": 0.3835, + "step": 3338 + }, + { + "epoch": 0.26, + "learning_rate": 1.7251491238844038e-05, + "loss": 0.4387, + "step": 3339 + }, + { + "epoch": 0.26, + "learning_rate": 1.7249724051562905e-05, + "loss": 0.3258, + "step": 3340 + }, + { + "epoch": 0.26, + "learning_rate": 1.7247956386922334e-05, + "loss": 0.3981, + "step": 3341 + }, + { + "epoch": 0.26, + "learning_rate": 1.7246188245038705e-05, + "loss": 0.4817, + "step": 3342 + }, + { + "epoch": 0.26, + "learning_rate": 1.7244419626028454e-05, + "loss": 0.4945, + "step": 3343 + }, + { + "epoch": 0.26, + "learning_rate": 1.724265053000802e-05, + "loss": 0.2574, + "step": 3344 + }, + { + "epoch": 0.27, + "learning_rate": 1.7240880957093903e-05, + "loss": 0.3237, + "step": 3345 + }, + { + "epoch": 0.27, + "learning_rate": 1.7239110907402615e-05, + "loss": 0.266, + "step": 3346 + }, + { + "epoch": 0.27, + "learning_rate": 1.72373403810507e-05, + "loss": 0.4198, + "step": 3347 + }, + { + "epoch": 0.27, + "learning_rate": 1.7235569378154752e-05, + "loss": 0.3164, + "step": 3348 + }, + { + "epoch": 0.27, + "learning_rate": 1.7233797898831376e-05, + "loss": 0.3228, + "step": 3349 + }, + { + "epoch": 0.27, + "learning_rate": 1.7232025943197213e-05, + "loss": 0.3187, + "step": 3350 + }, + { + "epoch": 0.27, + "learning_rate": 1.723025351136894e-05, + "loss": 0.3614, + "step": 3351 + }, + { + "epoch": 0.27, + "learning_rate": 1.722848060346326e-05, + "loss": 0.4191, + "step": 3352 + }, + { + "epoch": 0.27, + "learning_rate": 1.7226707219596918e-05, + "loss": 0.3898, + "step": 3353 + }, + { + "epoch": 0.27, + "learning_rate": 1.7224933359886676e-05, + "loss": 0.5278, + "step": 3354 + }, + { + "epoch": 0.27, + "learning_rate": 1.7223159024449338e-05, + "loss": 0.6422, + "step": 3355 + }, + { + "epoch": 0.27, + "learning_rate": 1.7221384213401732e-05, + "loss": 0.416, + "step": 3356 + }, + { + "epoch": 0.27, + "learning_rate": 1.7219608926860726e-05, + "loss": 0.3167, + "step": 3357 + }, + { + "epoch": 0.27, + "learning_rate": 1.721783316494321e-05, + "loss": 0.3823, + "step": 3358 + }, + { + "epoch": 0.27, + "learning_rate": 1.7216056927766106e-05, + "loss": 0.4277, + "step": 3359 + }, + { + "epoch": 0.27, + "learning_rate": 1.721428021544638e-05, + "loss": 0.4613, + "step": 3360 + }, + { + "epoch": 0.27, + "learning_rate": 1.7212503028101012e-05, + "loss": 0.4012, + "step": 3361 + }, + { + "epoch": 0.27, + "learning_rate": 1.721072536584702e-05, + "loss": 0.4066, + "step": 3362 + }, + { + "epoch": 0.27, + "learning_rate": 1.7208947228801464e-05, + "loss": 0.4202, + "step": 3363 + }, + { + "epoch": 0.27, + "learning_rate": 1.7207168617081418e-05, + "loss": 0.4152, + "step": 3364 + }, + { + "epoch": 0.27, + "learning_rate": 1.7205389530804e-05, + "loss": 0.3997, + "step": 3365 + }, + { + "epoch": 0.27, + "learning_rate": 1.7203609970086347e-05, + "loss": 0.3062, + "step": 3366 + }, + { + "epoch": 0.27, + "learning_rate": 1.720182993504564e-05, + "loss": 0.3779, + "step": 3367 + }, + { + "epoch": 0.27, + "learning_rate": 1.7200049425799087e-05, + "loss": 0.4383, + "step": 3368 + }, + { + "epoch": 0.27, + "learning_rate": 1.7198268442463923e-05, + "loss": 0.4776, + "step": 3369 + }, + { + "epoch": 0.27, + "learning_rate": 1.719648698515742e-05, + "loss": 0.3027, + "step": 3370 + }, + { + "epoch": 0.27, + "learning_rate": 1.7194705053996873e-05, + "loss": 0.4034, + "step": 3371 + }, + { + "epoch": 0.27, + "learning_rate": 1.719292264909962e-05, + "loss": 0.3894, + "step": 3372 + }, + { + "epoch": 0.27, + "learning_rate": 1.7191139770583015e-05, + "loss": 0.3493, + "step": 3373 + }, + { + "epoch": 0.27, + "learning_rate": 1.7189356418564463e-05, + "loss": 0.3289, + "step": 3374 + }, + { + "epoch": 0.27, + "learning_rate": 1.7187572593161382e-05, + "loss": 0.3356, + "step": 3375 + }, + { + "epoch": 0.27, + "learning_rate": 1.7185788294491232e-05, + "loss": 0.4357, + "step": 3376 + }, + { + "epoch": 0.27, + "learning_rate": 1.7184003522671497e-05, + "loss": 0.446, + "step": 3377 + }, + { + "epoch": 0.27, + "learning_rate": 1.7182218277819697e-05, + "loss": 0.2298, + "step": 3378 + }, + { + "epoch": 0.27, + "learning_rate": 1.718043256005338e-05, + "loss": 0.3554, + "step": 3379 + }, + { + "epoch": 0.27, + "learning_rate": 1.717864636949013e-05, + "loss": 0.3291, + "step": 3380 + }, + { + "epoch": 0.27, + "learning_rate": 1.7176859706247563e-05, + "loss": 0.4846, + "step": 3381 + }, + { + "epoch": 0.27, + "learning_rate": 1.717507257044331e-05, + "loss": 0.4728, + "step": 3382 + }, + { + "epoch": 0.27, + "learning_rate": 1.717328496219506e-05, + "loss": 0.2659, + "step": 3383 + }, + { + "epoch": 0.27, + "learning_rate": 1.7171496881620507e-05, + "loss": 0.448, + "step": 3384 + }, + { + "epoch": 0.27, + "learning_rate": 1.716970832883739e-05, + "loss": 0.4299, + "step": 3385 + }, + { + "epoch": 0.27, + "learning_rate": 1.716791930396348e-05, + "loss": 0.4198, + "step": 3386 + }, + { + "epoch": 0.27, + "learning_rate": 1.716612980711657e-05, + "loss": 0.4144, + "step": 3387 + }, + { + "epoch": 0.27, + "learning_rate": 1.7164339838414496e-05, + "loss": 0.3213, + "step": 3388 + }, + { + "epoch": 0.27, + "learning_rate": 1.7162549397975118e-05, + "loss": 0.2968, + "step": 3389 + }, + { + "epoch": 0.27, + "learning_rate": 1.7160758485916325e-05, + "loss": 0.3306, + "step": 3390 + }, + { + "epoch": 0.27, + "learning_rate": 1.715896710235604e-05, + "loss": 0.3971, + "step": 3391 + }, + { + "epoch": 0.27, + "learning_rate": 1.715717524741222e-05, + "loss": 0.3367, + "step": 3392 + }, + { + "epoch": 0.27, + "learning_rate": 1.7155382921202844e-05, + "loss": 0.4066, + "step": 3393 + }, + { + "epoch": 0.27, + "learning_rate": 1.7153590123845938e-05, + "loss": 0.4048, + "step": 3394 + }, + { + "epoch": 0.27, + "learning_rate": 1.715179685545954e-05, + "loss": 0.4146, + "step": 3395 + }, + { + "epoch": 0.27, + "learning_rate": 1.7150003116161734e-05, + "loss": 0.3189, + "step": 3396 + }, + { + "epoch": 0.27, + "learning_rate": 1.714820890607062e-05, + "loss": 0.396, + "step": 3397 + }, + { + "epoch": 0.27, + "learning_rate": 1.714641422530435e-05, + "loss": 0.5177, + "step": 3398 + }, + { + "epoch": 0.27, + "learning_rate": 1.7144619073981088e-05, + "loss": 0.3662, + "step": 3399 + }, + { + "epoch": 0.27, + "learning_rate": 1.7142823452219036e-05, + "loss": 0.4217, + "step": 3400 + }, + { + "epoch": 0.27, + "learning_rate": 1.714102736013643e-05, + "loss": 0.2996, + "step": 3401 + }, + { + "epoch": 0.27, + "learning_rate": 1.7139230797851537e-05, + "loss": 0.3396, + "step": 3402 + }, + { + "epoch": 0.27, + "learning_rate": 1.7137433765482644e-05, + "loss": 0.4462, + "step": 3403 + }, + { + "epoch": 0.27, + "learning_rate": 1.713563626314808e-05, + "loss": 0.459, + "step": 3404 + }, + { + "epoch": 0.27, + "learning_rate": 1.71338382909662e-05, + "loss": 0.2785, + "step": 3405 + }, + { + "epoch": 0.27, + "learning_rate": 1.71320398490554e-05, + "loss": 0.3351, + "step": 3406 + }, + { + "epoch": 0.27, + "learning_rate": 1.713024093753409e-05, + "loss": 0.3877, + "step": 3407 + }, + { + "epoch": 0.27, + "learning_rate": 1.7128441556520723e-05, + "loss": 0.3957, + "step": 3408 + }, + { + "epoch": 0.27, + "learning_rate": 1.7126641706133782e-05, + "loss": 0.3437, + "step": 3409 + }, + { + "epoch": 0.27, + "learning_rate": 1.7124841386491774e-05, + "loss": 0.3872, + "step": 3410 + }, + { + "epoch": 0.27, + "learning_rate": 1.7123040597713242e-05, + "loss": 0.2675, + "step": 3411 + }, + { + "epoch": 0.27, + "learning_rate": 1.7121239339916763e-05, + "loss": 0.3251, + "step": 3412 + }, + { + "epoch": 0.27, + "learning_rate": 1.7119437613220936e-05, + "loss": 0.3928, + "step": 3413 + }, + { + "epoch": 0.27, + "learning_rate": 1.71176354177444e-05, + "loss": 0.454, + "step": 3414 + }, + { + "epoch": 0.27, + "learning_rate": 1.711583275360582e-05, + "loss": 0.2739, + "step": 3415 + }, + { + "epoch": 0.27, + "learning_rate": 1.711402962092389e-05, + "loss": 0.2913, + "step": 3416 + }, + { + "epoch": 0.27, + "learning_rate": 1.7112226019817345e-05, + "loss": 0.2917, + "step": 3417 + }, + { + "epoch": 0.27, + "learning_rate": 1.7110421950404935e-05, + "loss": 0.482, + "step": 3418 + }, + { + "epoch": 0.27, + "learning_rate": 1.710861741280545e-05, + "loss": 0.4827, + "step": 3419 + }, + { + "epoch": 0.27, + "learning_rate": 1.710681240713772e-05, + "loss": 0.3741, + "step": 3420 + }, + { + "epoch": 0.27, + "learning_rate": 1.7105006933520584e-05, + "loss": 0.275, + "step": 3421 + }, + { + "epoch": 0.27, + "learning_rate": 1.710320099207293e-05, + "loss": 0.3277, + "step": 3422 + }, + { + "epoch": 0.27, + "learning_rate": 1.7101394582913667e-05, + "loss": 0.386, + "step": 3423 + }, + { + "epoch": 0.27, + "learning_rate": 1.709958770616174e-05, + "loss": 0.4194, + "step": 3424 + }, + { + "epoch": 0.27, + "learning_rate": 1.7097780361936128e-05, + "loss": 0.2706, + "step": 3425 + }, + { + "epoch": 0.27, + "learning_rate": 1.709597255035583e-05, + "loss": 0.3555, + "step": 3426 + }, + { + "epoch": 0.27, + "learning_rate": 1.709416427153988e-05, + "loss": 0.3939, + "step": 3427 + }, + { + "epoch": 0.27, + "learning_rate": 1.7092355525607352e-05, + "loss": 0.433, + "step": 3428 + }, + { + "epoch": 0.27, + "learning_rate": 1.7090546312677335e-05, + "loss": 0.5283, + "step": 3429 + }, + { + "epoch": 0.27, + "learning_rate": 1.7088736632868964e-05, + "loss": 0.4819, + "step": 3430 + }, + { + "epoch": 0.27, + "learning_rate": 1.7086926486301393e-05, + "loss": 0.2987, + "step": 3431 + }, + { + "epoch": 0.27, + "learning_rate": 1.7085115873093814e-05, + "loss": 0.3547, + "step": 3432 + }, + { + "epoch": 0.27, + "learning_rate": 1.7083304793365445e-05, + "loss": 0.3253, + "step": 3433 + }, + { + "epoch": 0.27, + "learning_rate": 1.7081493247235537e-05, + "loss": 0.3927, + "step": 3434 + }, + { + "epoch": 0.27, + "learning_rate": 1.7079681234823374e-05, + "loss": 0.3894, + "step": 3435 + }, + { + "epoch": 0.27, + "learning_rate": 1.7077868756248265e-05, + "loss": 0.466, + "step": 3436 + }, + { + "epoch": 0.27, + "learning_rate": 1.7076055811629556e-05, + "loss": 0.3971, + "step": 3437 + }, + { + "epoch": 0.27, + "learning_rate": 1.7074242401086623e-05, + "loss": 0.4281, + "step": 3438 + }, + { + "epoch": 0.27, + "learning_rate": 1.7072428524738865e-05, + "loss": 0.3912, + "step": 3439 + }, + { + "epoch": 0.27, + "learning_rate": 1.707061418270572e-05, + "loss": 0.4395, + "step": 3440 + }, + { + "epoch": 0.27, + "learning_rate": 1.706879937510665e-05, + "loss": 0.4516, + "step": 3441 + }, + { + "epoch": 0.27, + "learning_rate": 1.7066984102061155e-05, + "loss": 0.4293, + "step": 3442 + }, + { + "epoch": 0.27, + "learning_rate": 1.706516836368876e-05, + "loss": 0.4337, + "step": 3443 + }, + { + "epoch": 0.27, + "learning_rate": 1.7063352160109026e-05, + "loss": 0.3861, + "step": 3444 + }, + { + "epoch": 0.27, + "learning_rate": 1.7061535491441538e-05, + "loss": 0.506, + "step": 3445 + }, + { + "epoch": 0.27, + "learning_rate": 1.7059718357805915e-05, + "loss": 0.487, + "step": 3446 + }, + { + "epoch": 0.27, + "learning_rate": 1.705790075932181e-05, + "loss": 0.3773, + "step": 3447 + }, + { + "epoch": 0.27, + "learning_rate": 1.7056082696108896e-05, + "loss": 0.4478, + "step": 3448 + }, + { + "epoch": 0.27, + "learning_rate": 1.7054264168286892e-05, + "loss": 0.4988, + "step": 3449 + }, + { + "epoch": 0.27, + "learning_rate": 1.7052445175975533e-05, + "loss": 0.3396, + "step": 3450 + }, + { + "epoch": 0.27, + "learning_rate": 1.7050625719294593e-05, + "loss": 0.4656, + "step": 3451 + }, + { + "epoch": 0.27, + "learning_rate": 1.7048805798363876e-05, + "loss": 0.3399, + "step": 3452 + }, + { + "epoch": 0.27, + "learning_rate": 1.7046985413303215e-05, + "loss": 0.4638, + "step": 3453 + }, + { + "epoch": 0.27, + "learning_rate": 1.7045164564232474e-05, + "loss": 0.3609, + "step": 3454 + }, + { + "epoch": 0.27, + "learning_rate": 1.704334325127154e-05, + "loss": 0.3244, + "step": 3455 + }, + { + "epoch": 0.27, + "learning_rate": 1.704152147454035e-05, + "loss": 0.2987, + "step": 3456 + }, + { + "epoch": 0.27, + "learning_rate": 1.7039699234158846e-05, + "loss": 0.4357, + "step": 3457 + }, + { + "epoch": 0.27, + "learning_rate": 1.7037876530247025e-05, + "loss": 0.3657, + "step": 3458 + }, + { + "epoch": 0.27, + "learning_rate": 1.7036053362924896e-05, + "loss": 0.3749, + "step": 3459 + }, + { + "epoch": 0.27, + "learning_rate": 1.7034229732312512e-05, + "loss": 0.4157, + "step": 3460 + }, + { + "epoch": 0.27, + "learning_rate": 1.703240563852994e-05, + "loss": 0.5076, + "step": 3461 + }, + { + "epoch": 0.27, + "learning_rate": 1.70305810816973e-05, + "loss": 0.358, + "step": 3462 + }, + { + "epoch": 0.27, + "learning_rate": 1.7028756061934722e-05, + "loss": 0.3353, + "step": 3463 + }, + { + "epoch": 0.27, + "learning_rate": 1.702693057936238e-05, + "loss": 0.436, + "step": 3464 + }, + { + "epoch": 0.27, + "learning_rate": 1.702510463410047e-05, + "loss": 0.5088, + "step": 3465 + }, + { + "epoch": 0.27, + "learning_rate": 1.7023278226269222e-05, + "loss": 0.439, + "step": 3466 + }, + { + "epoch": 0.27, + "learning_rate": 1.7021451355988895e-05, + "loss": 0.4563, + "step": 3467 + }, + { + "epoch": 0.27, + "learning_rate": 1.7019624023379784e-05, + "loss": 0.279, + "step": 3468 + }, + { + "epoch": 0.27, + "learning_rate": 1.7017796228562206e-05, + "loss": 0.4485, + "step": 3469 + }, + { + "epoch": 0.27, + "learning_rate": 1.7015967971656513e-05, + "loss": 0.4123, + "step": 3470 + }, + { + "epoch": 0.27, + "learning_rate": 1.7014139252783092e-05, + "loss": 0.3767, + "step": 3471 + }, + { + "epoch": 0.28, + "learning_rate": 1.7012310072062348e-05, + "loss": 0.2823, + "step": 3472 + }, + { + "epoch": 0.28, + "learning_rate": 1.7010480429614726e-05, + "loss": 0.3588, + "step": 3473 + }, + { + "epoch": 0.28, + "learning_rate": 1.70086503255607e-05, + "loss": 0.3402, + "step": 3474 + }, + { + "epoch": 0.28, + "learning_rate": 1.7006819760020773e-05, + "loss": 0.4213, + "step": 3475 + }, + { + "epoch": 0.28, + "learning_rate": 1.700498873311548e-05, + "loss": 0.3907, + "step": 3476 + }, + { + "epoch": 0.28, + "learning_rate": 1.7003157244965387e-05, + "loss": 0.4192, + "step": 3477 + }, + { + "epoch": 0.28, + "learning_rate": 1.700132529569109e-05, + "loss": 0.4065, + "step": 3478 + }, + { + "epoch": 0.28, + "learning_rate": 1.69994928854132e-05, + "loss": 0.3925, + "step": 3479 + }, + { + "epoch": 0.28, + "learning_rate": 1.6997660014252392e-05, + "loss": 0.4184, + "step": 3480 + }, + { + "epoch": 0.28, + "learning_rate": 1.699582668232934e-05, + "loss": 0.4316, + "step": 3481 + }, + { + "epoch": 0.28, + "learning_rate": 1.6993992889764758e-05, + "loss": 0.4591, + "step": 3482 + }, + { + "epoch": 0.28, + "learning_rate": 1.69921586366794e-05, + "loss": 0.433, + "step": 3483 + }, + { + "epoch": 0.28, + "learning_rate": 1.6990323923194042e-05, + "loss": 0.471, + "step": 3484 + }, + { + "epoch": 0.28, + "learning_rate": 1.698848874942949e-05, + "loss": 0.5225, + "step": 3485 + }, + { + "epoch": 0.28, + "learning_rate": 1.698665311550658e-05, + "loss": 0.3331, + "step": 3486 + }, + { + "epoch": 0.28, + "learning_rate": 1.6984817021546177e-05, + "loss": 0.4069, + "step": 3487 + }, + { + "epoch": 0.28, + "learning_rate": 1.6982980467669183e-05, + "loss": 0.4693, + "step": 3488 + }, + { + "epoch": 0.28, + "learning_rate": 1.6981143453996524e-05, + "loss": 0.4163, + "step": 3489 + }, + { + "epoch": 0.28, + "learning_rate": 1.697930598064916e-05, + "loss": 0.3771, + "step": 3490 + }, + { + "epoch": 0.28, + "learning_rate": 1.697746804774808e-05, + "loss": 0.4346, + "step": 3491 + }, + { + "epoch": 0.28, + "learning_rate": 1.6975629655414304e-05, + "loss": 0.397, + "step": 3492 + }, + { + "epoch": 0.28, + "learning_rate": 1.6973790803768875e-05, + "loss": 0.4662, + "step": 3493 + }, + { + "epoch": 0.28, + "learning_rate": 1.6971951492932882e-05, + "loss": 0.2277, + "step": 3494 + }, + { + "epoch": 0.28, + "learning_rate": 1.697011172302743e-05, + "loss": 0.4484, + "step": 3495 + }, + { + "epoch": 0.28, + "learning_rate": 1.696827149417366e-05, + "loss": 0.3825, + "step": 3496 + }, + { + "epoch": 0.28, + "learning_rate": 1.696643080649274e-05, + "loss": 0.3458, + "step": 3497 + }, + { + "epoch": 0.28, + "learning_rate": 1.696458966010587e-05, + "loss": 0.414, + "step": 3498 + }, + { + "epoch": 0.28, + "learning_rate": 1.6962748055134283e-05, + "loss": 0.424, + "step": 3499 + }, + { + "epoch": 0.28, + "learning_rate": 1.696090599169924e-05, + "loss": 0.4252, + "step": 3500 + }, + { + "epoch": 0.28, + "learning_rate": 1.695906346992203e-05, + "loss": 0.4235, + "step": 3501 + }, + { + "epoch": 0.28, + "learning_rate": 1.6957220489923978e-05, + "loss": 0.322, + "step": 3502 + }, + { + "epoch": 0.28, + "learning_rate": 1.695537705182643e-05, + "loss": 0.3873, + "step": 3503 + }, + { + "epoch": 0.28, + "learning_rate": 1.695353315575077e-05, + "loss": 0.3995, + "step": 3504 + }, + { + "epoch": 0.28, + "learning_rate": 1.6951688801818413e-05, + "loss": 0.3054, + "step": 3505 + }, + { + "epoch": 0.28, + "learning_rate": 1.6949843990150798e-05, + "loss": 0.4983, + "step": 3506 + }, + { + "epoch": 0.28, + "learning_rate": 1.6947998720869394e-05, + "loss": 0.3894, + "step": 3507 + }, + { + "epoch": 0.28, + "learning_rate": 1.6946152994095705e-05, + "loss": 0.3792, + "step": 3508 + }, + { + "epoch": 0.28, + "learning_rate": 1.6944306809951264e-05, + "loss": 0.3668, + "step": 3509 + }, + { + "epoch": 0.28, + "learning_rate": 1.694246016855764e-05, + "loss": 0.4343, + "step": 3510 + }, + { + "epoch": 0.28, + "learning_rate": 1.694061307003641e-05, + "loss": 0.337, + "step": 3511 + }, + { + "epoch": 0.28, + "learning_rate": 1.693876551450921e-05, + "loss": 0.3309, + "step": 3512 + }, + { + "epoch": 0.28, + "learning_rate": 1.693691750209769e-05, + "loss": 0.2797, + "step": 3513 + }, + { + "epoch": 0.28, + "learning_rate": 1.6935069032923525e-05, + "loss": 0.5012, + "step": 3514 + }, + { + "epoch": 0.28, + "learning_rate": 1.6933220107108438e-05, + "loss": 0.4969, + "step": 3515 + }, + { + "epoch": 0.28, + "learning_rate": 1.6931370724774166e-05, + "loss": 0.4063, + "step": 3516 + }, + { + "epoch": 0.28, + "learning_rate": 1.6929520886042486e-05, + "loss": 0.3859, + "step": 3517 + }, + { + "epoch": 0.28, + "learning_rate": 1.6927670591035195e-05, + "loss": 0.4312, + "step": 3518 + }, + { + "epoch": 0.28, + "learning_rate": 1.692581983987413e-05, + "loss": 0.4667, + "step": 3519 + }, + { + "epoch": 0.28, + "learning_rate": 1.6923968632681155e-05, + "loss": 0.4306, + "step": 3520 + }, + { + "epoch": 0.28, + "learning_rate": 1.6922116969578163e-05, + "loss": 0.2957, + "step": 3521 + }, + { + "epoch": 0.28, + "learning_rate": 1.692026485068707e-05, + "loss": 0.4781, + "step": 3522 + }, + { + "epoch": 0.28, + "learning_rate": 1.6918412276129837e-05, + "loss": 0.4673, + "step": 3523 + }, + { + "epoch": 0.28, + "learning_rate": 1.691655924602845e-05, + "loss": 0.361, + "step": 3524 + }, + { + "epoch": 0.28, + "learning_rate": 1.6914705760504913e-05, + "loss": 0.5083, + "step": 3525 + }, + { + "epoch": 0.28, + "learning_rate": 1.6912851819681272e-05, + "loss": 0.2854, + "step": 3526 + }, + { + "epoch": 0.28, + "learning_rate": 1.69109974236796e-05, + "loss": 0.4035, + "step": 3527 + }, + { + "epoch": 0.28, + "learning_rate": 1.6909142572622003e-05, + "loss": 0.3432, + "step": 3528 + }, + { + "epoch": 0.28, + "learning_rate": 1.6907287266630614e-05, + "loss": 0.4005, + "step": 3529 + }, + { + "epoch": 0.28, + "learning_rate": 1.6905431505827595e-05, + "loss": 0.2685, + "step": 3530 + }, + { + "epoch": 0.28, + "learning_rate": 1.6903575290335136e-05, + "loss": 0.3213, + "step": 3531 + }, + { + "epoch": 0.28, + "learning_rate": 1.690171862027546e-05, + "loss": 0.3523, + "step": 3532 + }, + { + "epoch": 0.28, + "learning_rate": 1.6899861495770827e-05, + "loss": 0.4781, + "step": 3533 + }, + { + "epoch": 0.28, + "learning_rate": 1.689800391694351e-05, + "loss": 0.3285, + "step": 3534 + }, + { + "epoch": 0.28, + "learning_rate": 1.689614588391583e-05, + "loss": 0.5778, + "step": 3535 + }, + { + "epoch": 0.28, + "learning_rate": 1.689428739681012e-05, + "loss": 0.3246, + "step": 3536 + }, + { + "epoch": 0.28, + "learning_rate": 1.6892428455748762e-05, + "loss": 0.3956, + "step": 3537 + }, + { + "epoch": 0.28, + "learning_rate": 1.6890569060854156e-05, + "loss": 0.2696, + "step": 3538 + }, + { + "epoch": 0.28, + "learning_rate": 1.6888709212248728e-05, + "loss": 0.4384, + "step": 3539 + }, + { + "epoch": 0.28, + "learning_rate": 1.6886848910054947e-05, + "loss": 0.4513, + "step": 3540 + }, + { + "epoch": 0.28, + "learning_rate": 1.6884988154395304e-05, + "loss": 0.4705, + "step": 3541 + }, + { + "epoch": 0.28, + "learning_rate": 1.688312694539232e-05, + "loss": 0.4328, + "step": 3542 + }, + { + "epoch": 0.28, + "learning_rate": 1.6881265283168543e-05, + "loss": 0.5742, + "step": 3543 + }, + { + "epoch": 0.28, + "learning_rate": 1.6879403167846556e-05, + "loss": 0.4224, + "step": 3544 + }, + { + "epoch": 0.28, + "learning_rate": 1.6877540599548977e-05, + "loss": 0.5061, + "step": 3545 + }, + { + "epoch": 0.28, + "learning_rate": 1.6875677578398442e-05, + "loss": 0.4282, + "step": 3546 + }, + { + "epoch": 0.28, + "learning_rate": 1.6873814104517617e-05, + "loss": 0.443, + "step": 3547 + }, + { + "epoch": 0.28, + "learning_rate": 1.6871950178029216e-05, + "loss": 0.4385, + "step": 3548 + }, + { + "epoch": 0.28, + "learning_rate": 1.6870085799055956e-05, + "loss": 0.4543, + "step": 3549 + }, + { + "epoch": 0.28, + "learning_rate": 1.6868220967720604e-05, + "loss": 0.3085, + "step": 3550 + }, + { + "epoch": 0.28, + "learning_rate": 1.686635568414595e-05, + "loss": 0.3851, + "step": 3551 + }, + { + "epoch": 0.28, + "learning_rate": 1.686448994845481e-05, + "loss": 0.3957, + "step": 3552 + }, + { + "epoch": 0.28, + "learning_rate": 1.6862623760770038e-05, + "loss": 0.5958, + "step": 3553 + }, + { + "epoch": 0.28, + "learning_rate": 1.6860757121214513e-05, + "loss": 0.2775, + "step": 3554 + }, + { + "epoch": 0.28, + "learning_rate": 1.685889002991114e-05, + "loss": 0.4419, + "step": 3555 + }, + { + "epoch": 0.28, + "learning_rate": 1.6857022486982865e-05, + "loss": 0.4725, + "step": 3556 + }, + { + "epoch": 0.28, + "learning_rate": 1.6855154492552656e-05, + "loss": 0.371, + "step": 3557 + }, + { + "epoch": 0.28, + "learning_rate": 1.6853286046743505e-05, + "loss": 0.4104, + "step": 3558 + }, + { + "epoch": 0.28, + "learning_rate": 1.6851417149678442e-05, + "loss": 0.4663, + "step": 3559 + }, + { + "epoch": 0.28, + "learning_rate": 1.684954780148053e-05, + "loss": 0.4037, + "step": 3560 + }, + { + "epoch": 0.28, + "learning_rate": 1.684767800227285e-05, + "loss": 0.3703, + "step": 3561 + }, + { + "epoch": 0.28, + "learning_rate": 1.6845807752178528e-05, + "loss": 0.3277, + "step": 3562 + }, + { + "epoch": 0.28, + "learning_rate": 1.68439370513207e-05, + "loss": 0.3736, + "step": 3563 + }, + { + "epoch": 0.28, + "learning_rate": 1.6842065899822548e-05, + "loss": 0.3426, + "step": 3564 + }, + { + "epoch": 0.28, + "learning_rate": 1.6840194297807283e-05, + "loss": 0.4396, + "step": 3565 + }, + { + "epoch": 0.28, + "learning_rate": 1.6838322245398135e-05, + "loss": 0.3904, + "step": 3566 + }, + { + "epoch": 0.28, + "learning_rate": 1.6836449742718367e-05, + "loss": 0.3822, + "step": 3567 + }, + { + "epoch": 0.28, + "learning_rate": 1.6834576789891282e-05, + "loss": 0.396, + "step": 3568 + }, + { + "epoch": 0.28, + "learning_rate": 1.68327033870402e-05, + "loss": 0.5366, + "step": 3569 + }, + { + "epoch": 0.28, + "learning_rate": 1.6830829534288475e-05, + "loss": 0.3474, + "step": 3570 + }, + { + "epoch": 0.28, + "learning_rate": 1.6828955231759495e-05, + "loss": 0.3583, + "step": 3571 + }, + { + "epoch": 0.28, + "learning_rate": 1.682708047957667e-05, + "loss": 0.496, + "step": 3572 + }, + { + "epoch": 0.28, + "learning_rate": 1.682520527786345e-05, + "loss": 0.4199, + "step": 3573 + }, + { + "epoch": 0.28, + "learning_rate": 1.6823329626743298e-05, + "loss": 0.3329, + "step": 3574 + }, + { + "epoch": 0.28, + "learning_rate": 1.6821453526339727e-05, + "loss": 0.3968, + "step": 3575 + }, + { + "epoch": 0.28, + "learning_rate": 1.6819576976776262e-05, + "loss": 0.4586, + "step": 3576 + }, + { + "epoch": 0.28, + "learning_rate": 1.6817699978176464e-05, + "loss": 0.4302, + "step": 3577 + }, + { + "epoch": 0.28, + "learning_rate": 1.681582253066393e-05, + "loss": 0.405, + "step": 3578 + }, + { + "epoch": 0.28, + "learning_rate": 1.681394463436228e-05, + "loss": 0.4138, + "step": 3579 + }, + { + "epoch": 0.28, + "learning_rate": 1.6812066289395157e-05, + "loss": 0.5807, + "step": 3580 + }, + { + "epoch": 0.28, + "learning_rate": 1.681018749588625e-05, + "loss": 0.318, + "step": 3581 + }, + { + "epoch": 0.28, + "learning_rate": 1.6808308253959263e-05, + "loss": 0.3267, + "step": 3582 + }, + { + "epoch": 0.28, + "learning_rate": 1.680642856373794e-05, + "loss": 0.453, + "step": 3583 + }, + { + "epoch": 0.28, + "learning_rate": 1.680454842534604e-05, + "loss": 0.3467, + "step": 3584 + }, + { + "epoch": 0.28, + "learning_rate": 1.6802667838907374e-05, + "loss": 0.4058, + "step": 3585 + }, + { + "epoch": 0.28, + "learning_rate": 1.680078680454576e-05, + "loss": 0.5408, + "step": 3586 + }, + { + "epoch": 0.28, + "learning_rate": 1.6798905322385063e-05, + "loss": 0.4066, + "step": 3587 + }, + { + "epoch": 0.28, + "learning_rate": 1.6797023392549157e-05, + "loss": 0.4653, + "step": 3588 + }, + { + "epoch": 0.28, + "learning_rate": 1.679514101516197e-05, + "loss": 0.3608, + "step": 3589 + }, + { + "epoch": 0.28, + "learning_rate": 1.6793258190347445e-05, + "loss": 0.3712, + "step": 3590 + }, + { + "epoch": 0.28, + "learning_rate": 1.679137491822955e-05, + "loss": 0.3756, + "step": 3591 + }, + { + "epoch": 0.28, + "learning_rate": 1.6789491198932302e-05, + "loss": 0.311, + "step": 3592 + }, + { + "epoch": 0.28, + "learning_rate": 1.6787607032579724e-05, + "loss": 0.4396, + "step": 3593 + }, + { + "epoch": 0.28, + "learning_rate": 1.678572241929588e-05, + "loss": 0.3611, + "step": 3594 + }, + { + "epoch": 0.28, + "learning_rate": 1.6783837359204868e-05, + "loss": 0.4246, + "step": 3595 + }, + { + "epoch": 0.28, + "learning_rate": 1.6781951852430813e-05, + "loss": 0.3412, + "step": 3596 + }, + { + "epoch": 0.28, + "learning_rate": 1.6780065899097853e-05, + "loss": 0.2863, + "step": 3597 + }, + { + "epoch": 0.29, + "learning_rate": 1.677817949933018e-05, + "loss": 0.4483, + "step": 3598 + }, + { + "epoch": 0.29, + "learning_rate": 1.6776292653252e-05, + "loss": 0.3179, + "step": 3599 + }, + { + "epoch": 0.29, + "learning_rate": 1.6774405360987556e-05, + "loss": 0.3623, + "step": 3600 + }, + { + "epoch": 0.29, + "learning_rate": 1.6772517622661115e-05, + "loss": 0.3119, + "step": 3601 + }, + { + "epoch": 0.29, + "learning_rate": 1.6770629438396973e-05, + "loss": 0.3621, + "step": 3602 + }, + { + "epoch": 0.29, + "learning_rate": 1.676874080831947e-05, + "loss": 0.4387, + "step": 3603 + }, + { + "epoch": 0.29, + "learning_rate": 1.676685173255294e-05, + "loss": 0.369, + "step": 3604 + }, + { + "epoch": 0.29, + "learning_rate": 1.6764962211221796e-05, + "loss": 0.4501, + "step": 3605 + }, + { + "epoch": 0.29, + "learning_rate": 1.6763072244450435e-05, + "loss": 0.3802, + "step": 3606 + }, + { + "epoch": 0.29, + "learning_rate": 1.676118183236331e-05, + "loss": 0.4244, + "step": 3607 + }, + { + "epoch": 0.29, + "learning_rate": 1.6759290975084894e-05, + "loss": 0.4121, + "step": 3608 + }, + { + "epoch": 0.29, + "learning_rate": 1.675739967273969e-05, + "loss": 0.3457, + "step": 3609 + }, + { + "epoch": 0.29, + "learning_rate": 1.675550792545223e-05, + "loss": 0.4177, + "step": 3610 + }, + { + "epoch": 0.29, + "learning_rate": 1.6753615733347085e-05, + "loss": 0.4657, + "step": 3611 + }, + { + "epoch": 0.29, + "learning_rate": 1.6751723096548834e-05, + "loss": 0.4516, + "step": 3612 + }, + { + "epoch": 0.29, + "learning_rate": 1.6749830015182106e-05, + "loss": 0.3791, + "step": 3613 + }, + { + "epoch": 0.29, + "learning_rate": 1.6747936489371552e-05, + "loss": 0.4206, + "step": 3614 + }, + { + "epoch": 0.29, + "learning_rate": 1.674604251924185e-05, + "loss": 0.372, + "step": 3615 + }, + { + "epoch": 0.29, + "learning_rate": 1.6744148104917705e-05, + "loss": 0.4493, + "step": 3616 + }, + { + "epoch": 0.29, + "learning_rate": 1.6742253246523856e-05, + "loss": 0.3437, + "step": 3617 + }, + { + "epoch": 0.29, + "learning_rate": 1.6740357944185074e-05, + "loss": 0.3445, + "step": 3618 + }, + { + "epoch": 0.29, + "learning_rate": 1.6738462198026154e-05, + "loss": 0.3321, + "step": 3619 + }, + { + "epoch": 0.29, + "learning_rate": 1.6736566008171925e-05, + "loss": 0.411, + "step": 3620 + }, + { + "epoch": 0.29, + "learning_rate": 1.6734669374747237e-05, + "loss": 0.3812, + "step": 3621 + }, + { + "epoch": 0.29, + "learning_rate": 1.6732772297876975e-05, + "loss": 0.364, + "step": 3622 + }, + { + "epoch": 0.29, + "learning_rate": 1.6730874777686053e-05, + "loss": 0.381, + "step": 3623 + }, + { + "epoch": 0.29, + "learning_rate": 1.6728976814299413e-05, + "loss": 0.3896, + "step": 3624 + }, + { + "epoch": 0.29, + "learning_rate": 1.6727078407842028e-05, + "loss": 0.3645, + "step": 3625 + }, + { + "epoch": 0.29, + "learning_rate": 1.67251795584389e-05, + "loss": 0.3172, + "step": 3626 + }, + { + "epoch": 0.29, + "learning_rate": 1.6723280266215057e-05, + "loss": 0.3205, + "step": 3627 + }, + { + "epoch": 0.29, + "learning_rate": 1.672138053129556e-05, + "loss": 0.3705, + "step": 3628 + }, + { + "epoch": 0.29, + "learning_rate": 1.6719480353805493e-05, + "loss": 0.422, + "step": 3629 + }, + { + "epoch": 0.29, + "learning_rate": 1.671757973386998e-05, + "loss": 0.4768, + "step": 3630 + }, + { + "epoch": 0.29, + "learning_rate": 1.6715678671614162e-05, + "loss": 0.4315, + "step": 3631 + }, + { + "epoch": 0.29, + "learning_rate": 1.6713777167163215e-05, + "loss": 0.3132, + "step": 3632 + }, + { + "epoch": 0.29, + "learning_rate": 1.6711875220642352e-05, + "loss": 0.4815, + "step": 3633 + }, + { + "epoch": 0.29, + "learning_rate": 1.6709972832176797e-05, + "loss": 0.3762, + "step": 3634 + }, + { + "epoch": 0.29, + "learning_rate": 1.670807000189182e-05, + "loss": 0.4959, + "step": 3635 + }, + { + "epoch": 0.29, + "learning_rate": 1.6706166729912712e-05, + "loss": 0.3818, + "step": 3636 + }, + { + "epoch": 0.29, + "learning_rate": 1.670426301636479e-05, + "loss": 0.4151, + "step": 3637 + }, + { + "epoch": 0.29, + "learning_rate": 1.6702358861373408e-05, + "loss": 0.3932, + "step": 3638 + }, + { + "epoch": 0.29, + "learning_rate": 1.6700454265063943e-05, + "loss": 0.3446, + "step": 3639 + }, + { + "epoch": 0.29, + "learning_rate": 1.6698549227561805e-05, + "loss": 0.3629, + "step": 3640 + }, + { + "epoch": 0.29, + "learning_rate": 1.6696643748992434e-05, + "loss": 0.3599, + "step": 3641 + }, + { + "epoch": 0.29, + "learning_rate": 1.6694737829481292e-05, + "loss": 0.3207, + "step": 3642 + }, + { + "epoch": 0.29, + "learning_rate": 1.669283146915388e-05, + "loss": 0.3187, + "step": 3643 + }, + { + "epoch": 0.29, + "learning_rate": 1.6690924668135718e-05, + "loss": 0.3898, + "step": 3644 + }, + { + "epoch": 0.29, + "learning_rate": 1.668901742655236e-05, + "loss": 0.3487, + "step": 3645 + }, + { + "epoch": 0.29, + "learning_rate": 1.6687109744529394e-05, + "loss": 0.4224, + "step": 3646 + }, + { + "epoch": 0.29, + "learning_rate": 1.6685201622192422e-05, + "loss": 0.4063, + "step": 3647 + }, + { + "epoch": 0.29, + "learning_rate": 1.6683293059667096e-05, + "loss": 0.3783, + "step": 3648 + }, + { + "epoch": 0.29, + "learning_rate": 1.6681384057079076e-05, + "loss": 0.4357, + "step": 3649 + }, + { + "epoch": 0.29, + "learning_rate": 1.6679474614554066e-05, + "loss": 0.4097, + "step": 3650 + }, + { + "epoch": 0.29, + "learning_rate": 1.667756473221779e-05, + "loss": 0.3976, + "step": 3651 + }, + { + "epoch": 0.29, + "learning_rate": 1.667565441019601e-05, + "loss": 0.4947, + "step": 3652 + }, + { + "epoch": 0.29, + "learning_rate": 1.6673743648614507e-05, + "loss": 0.3277, + "step": 3653 + }, + { + "epoch": 0.29, + "learning_rate": 1.66718324475991e-05, + "loss": 0.4358, + "step": 3654 + }, + { + "epoch": 0.29, + "learning_rate": 1.6669920807275622e-05, + "loss": 0.4945, + "step": 3655 + }, + { + "epoch": 0.29, + "learning_rate": 1.666800872776996e-05, + "loss": 0.3528, + "step": 3656 + }, + { + "epoch": 0.29, + "learning_rate": 1.6666096209208e-05, + "loss": 0.2642, + "step": 3657 + }, + { + "epoch": 0.29, + "learning_rate": 1.6664183251715687e-05, + "loss": 0.4808, + "step": 3658 + }, + { + "epoch": 0.29, + "learning_rate": 1.666226985541897e-05, + "loss": 0.3709, + "step": 3659 + }, + { + "epoch": 0.29, + "learning_rate": 1.666035602044384e-05, + "loss": 0.3158, + "step": 3660 + }, + { + "epoch": 0.29, + "learning_rate": 1.665844174691631e-05, + "loss": 0.4132, + "step": 3661 + }, + { + "epoch": 0.29, + "learning_rate": 1.6656527034962433e-05, + "loss": 0.384, + "step": 3662 + }, + { + "epoch": 0.29, + "learning_rate": 1.665461188470828e-05, + "loss": 0.297, + "step": 3663 + }, + { + "epoch": 0.29, + "learning_rate": 1.6652696296279954e-05, + "loss": 0.2988, + "step": 3664 + }, + { + "epoch": 0.29, + "learning_rate": 1.6650780269803587e-05, + "loss": 0.3685, + "step": 3665 + }, + { + "epoch": 0.29, + "learning_rate": 1.664886380540534e-05, + "loss": 0.4647, + "step": 3666 + }, + { + "epoch": 0.29, + "learning_rate": 1.664694690321141e-05, + "loss": 0.427, + "step": 3667 + }, + { + "epoch": 0.29, + "learning_rate": 1.6645029563348e-05, + "loss": 0.4792, + "step": 3668 + }, + { + "epoch": 0.29, + "learning_rate": 1.6643111785941374e-05, + "loss": 0.3683, + "step": 3669 + }, + { + "epoch": 0.29, + "learning_rate": 1.66411935711178e-05, + "loss": 0.3862, + "step": 3670 + }, + { + "epoch": 0.29, + "learning_rate": 1.6639274919003582e-05, + "loss": 0.3895, + "step": 3671 + }, + { + "epoch": 0.29, + "learning_rate": 1.6637355829725057e-05, + "loss": 0.4481, + "step": 3672 + }, + { + "epoch": 0.29, + "learning_rate": 1.663543630340859e-05, + "loss": 0.3375, + "step": 3673 + }, + { + "epoch": 0.29, + "learning_rate": 1.6633516340180568e-05, + "loss": 0.3855, + "step": 3674 + }, + { + "epoch": 0.29, + "learning_rate": 1.6631595940167416e-05, + "loss": 0.3559, + "step": 3675 + }, + { + "epoch": 0.29, + "learning_rate": 1.662967510349558e-05, + "loss": 0.357, + "step": 3676 + }, + { + "epoch": 0.29, + "learning_rate": 1.6627753830291536e-05, + "loss": 0.4254, + "step": 3677 + }, + { + "epoch": 0.29, + "learning_rate": 1.6625832120681795e-05, + "loss": 0.4208, + "step": 3678 + }, + { + "epoch": 0.29, + "learning_rate": 1.6623909974792888e-05, + "loss": 0.3747, + "step": 3679 + }, + { + "epoch": 0.29, + "learning_rate": 1.6621987392751385e-05, + "loss": 0.3881, + "step": 3680 + }, + { + "epoch": 0.29, + "learning_rate": 1.6620064374683874e-05, + "loss": 0.3663, + "step": 3681 + }, + { + "epoch": 0.29, + "learning_rate": 1.6618140920716976e-05, + "loss": 0.2979, + "step": 3682 + }, + { + "epoch": 0.29, + "learning_rate": 1.6616217030977345e-05, + "loss": 0.4197, + "step": 3683 + }, + { + "epoch": 0.29, + "learning_rate": 1.6614292705591658e-05, + "loss": 0.4481, + "step": 3684 + }, + { + "epoch": 0.29, + "learning_rate": 1.6612367944686617e-05, + "loss": 0.3044, + "step": 3685 + }, + { + "epoch": 0.29, + "learning_rate": 1.6610442748388972e-05, + "loss": 0.4358, + "step": 3686 + }, + { + "epoch": 0.29, + "learning_rate": 1.6608517116825473e-05, + "loss": 0.3585, + "step": 3687 + }, + { + "epoch": 0.29, + "learning_rate": 1.6606591050122924e-05, + "loss": 0.3625, + "step": 3688 + }, + { + "epoch": 0.29, + "learning_rate": 1.660466454840814e-05, + "loss": 0.3231, + "step": 3689 + }, + { + "epoch": 0.29, + "learning_rate": 1.6602737611807975e-05, + "loss": 0.405, + "step": 3690 + }, + { + "epoch": 0.29, + "learning_rate": 1.660081024044931e-05, + "loss": 0.3125, + "step": 3691 + }, + { + "epoch": 0.29, + "learning_rate": 1.659888243445905e-05, + "loss": 0.4542, + "step": 3692 + }, + { + "epoch": 0.29, + "learning_rate": 1.6596954193964136e-05, + "loss": 0.3228, + "step": 3693 + }, + { + "epoch": 0.29, + "learning_rate": 1.659502551909153e-05, + "loss": 0.2755, + "step": 3694 + }, + { + "epoch": 0.29, + "learning_rate": 1.6593096409968227e-05, + "loss": 0.4547, + "step": 3695 + }, + { + "epoch": 0.29, + "learning_rate": 1.6591166866721247e-05, + "loss": 0.3656, + "step": 3696 + }, + { + "epoch": 0.29, + "learning_rate": 1.658923688947765e-05, + "loss": 0.4185, + "step": 3697 + }, + { + "epoch": 0.29, + "learning_rate": 1.6587306478364502e-05, + "loss": 0.4013, + "step": 3698 + }, + { + "epoch": 0.29, + "learning_rate": 1.658537563350892e-05, + "loss": 0.4011, + "step": 3699 + }, + { + "epoch": 0.29, + "learning_rate": 1.6583444355038042e-05, + "loss": 0.4451, + "step": 3700 + }, + { + "epoch": 0.29, + "learning_rate": 1.6581512643079028e-05, + "loss": 0.2733, + "step": 3701 + }, + { + "epoch": 0.29, + "learning_rate": 1.657958049775908e-05, + "loss": 0.3837, + "step": 3702 + }, + { + "epoch": 0.29, + "learning_rate": 1.6577647919205407e-05, + "loss": 0.3006, + "step": 3703 + }, + { + "epoch": 0.29, + "learning_rate": 1.6575714907545272e-05, + "loss": 0.3967, + "step": 3704 + }, + { + "epoch": 0.29, + "learning_rate": 1.6573781462905954e-05, + "loss": 0.3781, + "step": 3705 + }, + { + "epoch": 0.29, + "learning_rate": 1.6571847585414754e-05, + "loss": 0.3663, + "step": 3706 + }, + { + "epoch": 0.29, + "learning_rate": 1.6569913275199013e-05, + "loss": 0.4475, + "step": 3707 + }, + { + "epoch": 0.29, + "learning_rate": 1.6567978532386094e-05, + "loss": 0.414, + "step": 3708 + }, + { + "epoch": 0.29, + "learning_rate": 1.6566043357103393e-05, + "loss": 0.3724, + "step": 3709 + }, + { + "epoch": 0.29, + "learning_rate": 1.656410774947833e-05, + "loss": 0.3568, + "step": 3710 + }, + { + "epoch": 0.29, + "learning_rate": 1.6562171709638355e-05, + "loss": 0.3685, + "step": 3711 + }, + { + "epoch": 0.29, + "learning_rate": 1.656023523771095e-05, + "loss": 0.4146, + "step": 3712 + }, + { + "epoch": 0.29, + "learning_rate": 1.655829833382362e-05, + "loss": 0.2958, + "step": 3713 + }, + { + "epoch": 0.29, + "learning_rate": 1.6556360998103903e-05, + "loss": 0.534, + "step": 3714 + }, + { + "epoch": 0.29, + "learning_rate": 1.655442323067936e-05, + "loss": 0.4345, + "step": 3715 + }, + { + "epoch": 0.29, + "learning_rate": 1.6552485031677586e-05, + "loss": 0.4081, + "step": 3716 + }, + { + "epoch": 0.29, + "learning_rate": 1.65505464012262e-05, + "loss": 0.3775, + "step": 3717 + }, + { + "epoch": 0.29, + "learning_rate": 1.6548607339452853e-05, + "loss": 0.3597, + "step": 3718 + }, + { + "epoch": 0.29, + "learning_rate": 1.6546667846485224e-05, + "loss": 0.3806, + "step": 3719 + }, + { + "epoch": 0.29, + "learning_rate": 1.6544727922451014e-05, + "loss": 0.3756, + "step": 3720 + }, + { + "epoch": 0.29, + "learning_rate": 1.654278756747796e-05, + "loss": 0.4238, + "step": 3721 + }, + { + "epoch": 0.29, + "learning_rate": 1.6540846781693837e-05, + "loss": 0.3529, + "step": 3722 + }, + { + "epoch": 0.29, + "learning_rate": 1.6538905565226416e-05, + "loss": 0.457, + "step": 3723 + }, + { + "epoch": 0.3, + "learning_rate": 1.6536963918203532e-05, + "loss": 0.3967, + "step": 3724 + }, + { + "epoch": 0.3, + "learning_rate": 1.6535021840753026e-05, + "loss": 0.3633, + "step": 3725 + }, + { + "epoch": 0.3, + "learning_rate": 1.6533079333002775e-05, + "loss": 0.5154, + "step": 3726 + }, + { + "epoch": 0.3, + "learning_rate": 1.6531136395080687e-05, + "loss": 0.3488, + "step": 3727 + }, + { + "epoch": 0.3, + "learning_rate": 1.6529193027114692e-05, + "loss": 0.3989, + "step": 3728 + }, + { + "epoch": 0.3, + "learning_rate": 1.6527249229232754e-05, + "loss": 0.4783, + "step": 3729 + }, + { + "epoch": 0.3, + "learning_rate": 1.652530500156286e-05, + "loss": 0.288, + "step": 3730 + }, + { + "epoch": 0.3, + "learning_rate": 1.652336034423303e-05, + "loss": 0.4485, + "step": 3731 + }, + { + "epoch": 0.3, + "learning_rate": 1.6521415257371312e-05, + "loss": 0.2781, + "step": 3732 + }, + { + "epoch": 0.3, + "learning_rate": 1.6519469741105777e-05, + "loss": 0.4559, + "step": 3733 + }, + { + "epoch": 0.3, + "learning_rate": 1.6517523795564527e-05, + "loss": 0.3527, + "step": 3734 + }, + { + "epoch": 0.3, + "learning_rate": 1.6515577420875698e-05, + "loss": 0.3216, + "step": 3735 + }, + { + "epoch": 0.3, + "learning_rate": 1.6513630617167446e-05, + "loss": 0.5126, + "step": 3736 + }, + { + "epoch": 0.3, + "learning_rate": 1.6511683384567957e-05, + "loss": 0.3661, + "step": 3737 + }, + { + "epoch": 0.3, + "learning_rate": 1.6509735723205453e-05, + "loss": 0.3779, + "step": 3738 + }, + { + "epoch": 0.3, + "learning_rate": 1.6507787633208173e-05, + "loss": 0.4777, + "step": 3739 + }, + { + "epoch": 0.3, + "learning_rate": 1.650583911470439e-05, + "loss": 0.2857, + "step": 3740 + }, + { + "epoch": 0.3, + "learning_rate": 1.6503890167822406e-05, + "loss": 0.4465, + "step": 3741 + }, + { + "epoch": 0.3, + "learning_rate": 1.6501940792690547e-05, + "loss": 0.3203, + "step": 3742 + }, + { + "epoch": 0.3, + "learning_rate": 1.6499990989437177e-05, + "loss": 0.4036, + "step": 3743 + }, + { + "epoch": 0.3, + "learning_rate": 1.6498040758190673e-05, + "loss": 0.3265, + "step": 3744 + }, + { + "epoch": 0.3, + "learning_rate": 1.6496090099079452e-05, + "loss": 0.2953, + "step": 3745 + }, + { + "epoch": 0.3, + "learning_rate": 1.6494139012231954e-05, + "loss": 0.3114, + "step": 3746 + }, + { + "epoch": 0.3, + "learning_rate": 1.6492187497776654e-05, + "loss": 0.5024, + "step": 3747 + }, + { + "epoch": 0.3, + "learning_rate": 1.6490235555842044e-05, + "loss": 0.3489, + "step": 3748 + }, + { + "epoch": 0.3, + "learning_rate": 1.6488283186556648e-05, + "loss": 0.4351, + "step": 3749 + }, + { + "epoch": 0.3, + "learning_rate": 1.6486330390049027e-05, + "loss": 0.4137, + "step": 3750 + }, + { + "epoch": 0.3, + "learning_rate": 1.648437716644776e-05, + "loss": 0.3345, + "step": 3751 + }, + { + "epoch": 0.3, + "learning_rate": 1.6482423515881455e-05, + "loss": 0.4807, + "step": 3752 + }, + { + "epoch": 0.3, + "learning_rate": 1.6480469438478756e-05, + "loss": 0.3585, + "step": 3753 + }, + { + "epoch": 0.3, + "learning_rate": 1.6478514934368326e-05, + "loss": 0.3712, + "step": 3754 + }, + { + "epoch": 0.3, + "learning_rate": 1.647656000367886e-05, + "loss": 0.4136, + "step": 3755 + }, + { + "epoch": 0.3, + "learning_rate": 1.647460464653908e-05, + "loss": 0.4786, + "step": 3756 + }, + { + "epoch": 0.3, + "learning_rate": 1.6472648863077737e-05, + "loss": 0.3053, + "step": 3757 + }, + { + "epoch": 0.3, + "learning_rate": 1.6470692653423614e-05, + "loss": 0.2857, + "step": 3758 + }, + { + "epoch": 0.3, + "learning_rate": 1.6468736017705515e-05, + "loss": 0.4749, + "step": 3759 + }, + { + "epoch": 0.3, + "learning_rate": 1.646677895605227e-05, + "loss": 0.4009, + "step": 3760 + }, + { + "epoch": 0.3, + "learning_rate": 1.6464821468592748e-05, + "loss": 0.4313, + "step": 3761 + }, + { + "epoch": 0.3, + "learning_rate": 1.646286355545584e-05, + "loss": 0.3737, + "step": 3762 + }, + { + "epoch": 0.3, + "learning_rate": 1.6460905216770467e-05, + "loss": 0.3234, + "step": 3763 + }, + { + "epoch": 0.3, + "learning_rate": 1.6458946452665573e-05, + "loss": 0.3812, + "step": 3764 + }, + { + "epoch": 0.3, + "learning_rate": 1.6456987263270132e-05, + "loss": 0.4864, + "step": 3765 + }, + { + "epoch": 0.3, + "learning_rate": 1.645502764871315e-05, + "loss": 0.523, + "step": 3766 + }, + { + "epoch": 0.3, + "learning_rate": 1.6453067609123656e-05, + "loss": 0.4447, + "step": 3767 + }, + { + "epoch": 0.3, + "learning_rate": 1.6451107144630708e-05, + "loss": 0.4154, + "step": 3768 + }, + { + "epoch": 0.3, + "learning_rate": 1.6449146255363395e-05, + "loss": 0.328, + "step": 3769 + }, + { + "epoch": 0.3, + "learning_rate": 1.6447184941450833e-05, + "loss": 0.2488, + "step": 3770 + }, + { + "epoch": 0.3, + "learning_rate": 1.644522320302217e-05, + "loss": 0.4382, + "step": 3771 + }, + { + "epoch": 0.3, + "learning_rate": 1.6443261040206566e-05, + "loss": 0.3443, + "step": 3772 + }, + { + "epoch": 0.3, + "learning_rate": 1.6441298453133224e-05, + "loss": 0.4301, + "step": 3773 + }, + { + "epoch": 0.3, + "learning_rate": 1.6439335441931376e-05, + "loss": 0.4809, + "step": 3774 + }, + { + "epoch": 0.3, + "learning_rate": 1.6437372006730276e-05, + "loss": 0.3264, + "step": 3775 + }, + { + "epoch": 0.3, + "learning_rate": 1.64354081476592e-05, + "loss": 0.4617, + "step": 3776 + }, + { + "epoch": 0.3, + "learning_rate": 1.643344386484746e-05, + "loss": 0.4875, + "step": 3777 + }, + { + "epoch": 0.3, + "learning_rate": 1.64314791584244e-05, + "loss": 0.3718, + "step": 3778 + }, + { + "epoch": 0.3, + "learning_rate": 1.6429514028519383e-05, + "loss": 0.3595, + "step": 3779 + }, + { + "epoch": 0.3, + "learning_rate": 1.6427548475261807e-05, + "loss": 0.3798, + "step": 3780 + }, + { + "epoch": 0.3, + "learning_rate": 1.642558249878109e-05, + "loss": 0.2808, + "step": 3781 + }, + { + "epoch": 0.3, + "learning_rate": 1.642361609920668e-05, + "loss": 0.3931, + "step": 3782 + }, + { + "epoch": 0.3, + "learning_rate": 1.6421649276668065e-05, + "loss": 0.2143, + "step": 3783 + }, + { + "epoch": 0.3, + "learning_rate": 1.641968203129474e-05, + "loss": 0.4045, + "step": 3784 + }, + { + "epoch": 0.3, + "learning_rate": 1.641771436321624e-05, + "loss": 0.3509, + "step": 3785 + }, + { + "epoch": 0.3, + "learning_rate": 1.6415746272562133e-05, + "loss": 0.4034, + "step": 3786 + }, + { + "epoch": 0.3, + "learning_rate": 1.6413777759462005e-05, + "loss": 0.4231, + "step": 3787 + }, + { + "epoch": 0.3, + "learning_rate": 1.6411808824045472e-05, + "loss": 0.4762, + "step": 3788 + }, + { + "epoch": 0.3, + "learning_rate": 1.640983946644218e-05, + "loss": 0.4323, + "step": 3789 + }, + { + "epoch": 0.3, + "learning_rate": 1.64078696867818e-05, + "loss": 0.3494, + "step": 3790 + }, + { + "epoch": 0.3, + "learning_rate": 1.6405899485194034e-05, + "loss": 0.3317, + "step": 3791 + }, + { + "epoch": 0.3, + "learning_rate": 1.640392886180861e-05, + "loss": 0.3728, + "step": 3792 + }, + { + "epoch": 0.3, + "learning_rate": 1.6401957816755286e-05, + "loss": 0.3594, + "step": 3793 + }, + { + "epoch": 0.3, + "learning_rate": 1.6399986350163844e-05, + "loss": 0.3645, + "step": 3794 + }, + { + "epoch": 0.3, + "learning_rate": 1.6398014462164093e-05, + "loss": 0.4086, + "step": 3795 + }, + { + "epoch": 0.3, + "learning_rate": 1.6396042152885874e-05, + "loss": 0.3687, + "step": 3796 + }, + { + "epoch": 0.3, + "learning_rate": 1.639406942245906e-05, + "loss": 0.3605, + "step": 3797 + }, + { + "epoch": 0.3, + "learning_rate": 1.639209627101354e-05, + "loss": 0.4945, + "step": 3798 + }, + { + "epoch": 0.3, + "learning_rate": 1.6390122698679234e-05, + "loss": 0.3318, + "step": 3799 + }, + { + "epoch": 0.3, + "learning_rate": 1.6388148705586097e-05, + "loss": 0.3531, + "step": 3800 + }, + { + "epoch": 0.3, + "learning_rate": 1.6386174291864106e-05, + "loss": 0.4464, + "step": 3801 + }, + { + "epoch": 0.3, + "learning_rate": 1.6384199457643264e-05, + "loss": 0.4458, + "step": 3802 + }, + { + "epoch": 0.3, + "learning_rate": 1.6382224203053607e-05, + "loss": 0.3563, + "step": 3803 + }, + { + "epoch": 0.3, + "learning_rate": 1.6380248528225197e-05, + "loss": 0.3668, + "step": 3804 + }, + { + "epoch": 0.3, + "learning_rate": 1.6378272433288122e-05, + "loss": 0.3502, + "step": 3805 + }, + { + "epoch": 0.3, + "learning_rate": 1.6376295918372495e-05, + "loss": 0.3945, + "step": 3806 + }, + { + "epoch": 0.3, + "learning_rate": 1.6374318983608464e-05, + "loss": 0.5723, + "step": 3807 + }, + { + "epoch": 0.3, + "learning_rate": 1.63723416291262e-05, + "loss": 0.3861, + "step": 3808 + }, + { + "epoch": 0.3, + "learning_rate": 1.63703638550559e-05, + "loss": 0.383, + "step": 3809 + }, + { + "epoch": 0.3, + "learning_rate": 1.6368385661527795e-05, + "loss": 0.4047, + "step": 3810 + }, + { + "epoch": 0.3, + "learning_rate": 1.6366407048672135e-05, + "loss": 0.3245, + "step": 3811 + }, + { + "epoch": 0.3, + "learning_rate": 1.6364428016619202e-05, + "loss": 0.324, + "step": 3812 + }, + { + "epoch": 0.3, + "learning_rate": 1.636244856549931e-05, + "loss": 0.2696, + "step": 3813 + }, + { + "epoch": 0.3, + "learning_rate": 1.6360468695442797e-05, + "loss": 0.3675, + "step": 3814 + }, + { + "epoch": 0.3, + "learning_rate": 1.6358488406580023e-05, + "loss": 0.4355, + "step": 3815 + }, + { + "epoch": 0.3, + "learning_rate": 1.635650769904138e-05, + "loss": 0.4028, + "step": 3816 + }, + { + "epoch": 0.3, + "learning_rate": 1.6354526572957292e-05, + "loss": 0.5307, + "step": 3817 + }, + { + "epoch": 0.3, + "learning_rate": 1.6352545028458206e-05, + "loss": 0.4625, + "step": 3818 + }, + { + "epoch": 0.3, + "learning_rate": 1.6350563065674596e-05, + "loss": 0.3263, + "step": 3819 + }, + { + "epoch": 0.3, + "learning_rate": 1.6348580684736962e-05, + "loss": 0.3229, + "step": 3820 + }, + { + "epoch": 0.3, + "learning_rate": 1.6346597885775843e-05, + "loss": 0.2735, + "step": 3821 + }, + { + "epoch": 0.3, + "learning_rate": 1.6344614668921787e-05, + "loss": 0.3688, + "step": 3822 + }, + { + "epoch": 0.3, + "learning_rate": 1.6342631034305386e-05, + "loss": 0.3645, + "step": 3823 + }, + { + "epoch": 0.3, + "learning_rate": 1.634064698205725e-05, + "loss": 0.3847, + "step": 3824 + }, + { + "epoch": 0.3, + "learning_rate": 1.6338662512308013e-05, + "loss": 0.3312, + "step": 3825 + }, + { + "epoch": 0.3, + "learning_rate": 1.6336677625188357e-05, + "loss": 0.3863, + "step": 3826 + }, + { + "epoch": 0.3, + "learning_rate": 1.6334692320828968e-05, + "loss": 0.3488, + "step": 3827 + }, + { + "epoch": 0.3, + "learning_rate": 1.6332706599360568e-05, + "loss": 0.2988, + "step": 3828 + }, + { + "epoch": 0.3, + "learning_rate": 1.633072046091391e-05, + "loss": 0.3618, + "step": 3829 + }, + { + "epoch": 0.3, + "learning_rate": 1.6328733905619775e-05, + "loss": 0.4129, + "step": 3830 + }, + { + "epoch": 0.3, + "learning_rate": 1.632674693360896e-05, + "loss": 0.4573, + "step": 3831 + }, + { + "epoch": 0.3, + "learning_rate": 1.6324759545012306e-05, + "loss": 0.4836, + "step": 3832 + }, + { + "epoch": 0.3, + "learning_rate": 1.6322771739960664e-05, + "loss": 0.2888, + "step": 3833 + }, + { + "epoch": 0.3, + "learning_rate": 1.6320783518584926e-05, + "loss": 0.3118, + "step": 3834 + }, + { + "epoch": 0.3, + "learning_rate": 1.631879488101601e-05, + "loss": 0.4753, + "step": 3835 + }, + { + "epoch": 0.3, + "learning_rate": 1.6316805827384856e-05, + "loss": 0.3794, + "step": 3836 + }, + { + "epoch": 0.3, + "learning_rate": 1.631481635782243e-05, + "loss": 0.3938, + "step": 3837 + }, + { + "epoch": 0.3, + "learning_rate": 1.631282647245973e-05, + "loss": 0.3237, + "step": 3838 + }, + { + "epoch": 0.3, + "learning_rate": 1.6310836171427788e-05, + "loss": 0.4194, + "step": 3839 + }, + { + "epoch": 0.3, + "learning_rate": 1.6308845454857647e-05, + "loss": 0.3726, + "step": 3840 + }, + { + "epoch": 0.3, + "learning_rate": 1.6306854322880386e-05, + "loss": 0.3582, + "step": 3841 + }, + { + "epoch": 0.3, + "learning_rate": 1.630486277562712e-05, + "loss": 0.4131, + "step": 3842 + }, + { + "epoch": 0.3, + "learning_rate": 1.6302870813228974e-05, + "loss": 0.4802, + "step": 3843 + }, + { + "epoch": 0.3, + "learning_rate": 1.6300878435817115e-05, + "loss": 0.3114, + "step": 3844 + }, + { + "epoch": 0.3, + "learning_rate": 1.6298885643522724e-05, + "loss": 0.4698, + "step": 3845 + }, + { + "epoch": 0.3, + "learning_rate": 1.6296892436477024e-05, + "loss": 0.2886, + "step": 3846 + }, + { + "epoch": 0.3, + "learning_rate": 1.6294898814811258e-05, + "loss": 0.3865, + "step": 3847 + }, + { + "epoch": 0.3, + "learning_rate": 1.629290477865669e-05, + "loss": 0.3828, + "step": 3848 + }, + { + "epoch": 0.3, + "learning_rate": 1.6290910328144627e-05, + "loss": 0.4441, + "step": 3849 + }, + { + "epoch": 0.31, + "learning_rate": 1.6288915463406386e-05, + "loss": 0.4142, + "step": 3850 + }, + { + "epoch": 0.31, + "learning_rate": 1.6286920184573324e-05, + "loss": 0.5069, + "step": 3851 + }, + { + "epoch": 0.31, + "learning_rate": 1.6284924491776815e-05, + "loss": 0.3152, + "step": 3852 + }, + { + "epoch": 0.31, + "learning_rate": 1.6282928385148273e-05, + "loss": 0.476, + "step": 3853 + }, + { + "epoch": 0.31, + "learning_rate": 1.6280931864819125e-05, + "loss": 0.3676, + "step": 3854 + }, + { + "epoch": 0.31, + "learning_rate": 1.6278934930920834e-05, + "loss": 0.5109, + "step": 3855 + }, + { + "epoch": 0.31, + "learning_rate": 1.6276937583584895e-05, + "loss": 0.3686, + "step": 3856 + }, + { + "epoch": 0.31, + "learning_rate": 1.6274939822942818e-05, + "loss": 0.4431, + "step": 3857 + }, + { + "epoch": 0.31, + "learning_rate": 1.6272941649126146e-05, + "loss": 0.438, + "step": 3858 + }, + { + "epoch": 0.31, + "learning_rate": 1.627094306226645e-05, + "loss": 0.4675, + "step": 3859 + }, + { + "epoch": 0.31, + "learning_rate": 1.6268944062495324e-05, + "loss": 0.4346, + "step": 3860 + }, + { + "epoch": 0.31, + "learning_rate": 1.62669446499444e-05, + "loss": 0.3743, + "step": 3861 + }, + { + "epoch": 0.31, + "learning_rate": 1.6264944824745326e-05, + "loss": 0.4583, + "step": 3862 + }, + { + "epoch": 0.31, + "learning_rate": 1.6262944587029777e-05, + "loss": 0.4081, + "step": 3863 + }, + { + "epoch": 0.31, + "learning_rate": 1.6260943936929462e-05, + "loss": 0.4014, + "step": 3864 + }, + { + "epoch": 0.31, + "learning_rate": 1.6258942874576117e-05, + "loss": 0.4127, + "step": 3865 + }, + { + "epoch": 0.31, + "learning_rate": 1.62569414001015e-05, + "loss": 0.4415, + "step": 3866 + }, + { + "epoch": 0.31, + "learning_rate": 1.6254939513637397e-05, + "loss": 0.3628, + "step": 3867 + }, + { + "epoch": 0.31, + "learning_rate": 1.6252937215315622e-05, + "loss": 0.3118, + "step": 3868 + }, + { + "epoch": 0.31, + "learning_rate": 1.6250934505268025e-05, + "loss": 0.4355, + "step": 3869 + }, + { + "epoch": 0.31, + "learning_rate": 1.6248931383626464e-05, + "loss": 0.458, + "step": 3870 + }, + { + "epoch": 0.31, + "learning_rate": 1.6246927850522837e-05, + "loss": 0.3556, + "step": 3871 + }, + { + "epoch": 0.31, + "learning_rate": 1.624492390608907e-05, + "loss": 0.3737, + "step": 3872 + }, + { + "epoch": 0.31, + "learning_rate": 1.6242919550457116e-05, + "loss": 0.3076, + "step": 3873 + }, + { + "epoch": 0.31, + "learning_rate": 1.6240914783758946e-05, + "loss": 0.5028, + "step": 3874 + }, + { + "epoch": 0.31, + "learning_rate": 1.6238909606126568e-05, + "loss": 0.5033, + "step": 3875 + }, + { + "epoch": 0.31, + "learning_rate": 1.6236904017692016e-05, + "loss": 0.3266, + "step": 3876 + }, + { + "epoch": 0.31, + "learning_rate": 1.6234898018587336e-05, + "loss": 0.2731, + "step": 3877 + }, + { + "epoch": 0.31, + "learning_rate": 1.6232891608944627e-05, + "loss": 0.5527, + "step": 3878 + }, + { + "epoch": 0.31, + "learning_rate": 1.6230884788895998e-05, + "loss": 0.4325, + "step": 3879 + }, + { + "epoch": 0.31, + "learning_rate": 1.622887755857358e-05, + "loss": 0.501, + "step": 3880 + }, + { + "epoch": 0.31, + "learning_rate": 1.6226869918109553e-05, + "loss": 0.4569, + "step": 3881 + }, + { + "epoch": 0.31, + "learning_rate": 1.62248618676361e-05, + "loss": 0.363, + "step": 3882 + }, + { + "epoch": 0.31, + "learning_rate": 1.6222853407285447e-05, + "loss": 0.3484, + "step": 3883 + }, + { + "epoch": 0.31, + "learning_rate": 1.622084453718984e-05, + "loss": 0.3608, + "step": 3884 + }, + { + "epoch": 0.31, + "learning_rate": 1.621883525748155e-05, + "loss": 0.5152, + "step": 3885 + }, + { + "epoch": 0.31, + "learning_rate": 1.6216825568292885e-05, + "loss": 0.2701, + "step": 3886 + }, + { + "epoch": 0.31, + "learning_rate": 1.6214815469756165e-05, + "loss": 0.3885, + "step": 3887 + }, + { + "epoch": 0.31, + "learning_rate": 1.6212804962003757e-05, + "loss": 0.3302, + "step": 3888 + }, + { + "epoch": 0.31, + "learning_rate": 1.6210794045168033e-05, + "loss": 0.4754, + "step": 3889 + }, + { + "epoch": 0.31, + "learning_rate": 1.6208782719381403e-05, + "loss": 0.4343, + "step": 3890 + }, + { + "epoch": 0.31, + "learning_rate": 1.6206770984776307e-05, + "loss": 0.4345, + "step": 3891 + }, + { + "epoch": 0.31, + "learning_rate": 1.620475884148521e-05, + "loss": 0.4948, + "step": 3892 + }, + { + "epoch": 0.31, + "learning_rate": 1.6202746289640594e-05, + "loss": 0.3056, + "step": 3893 + }, + { + "epoch": 0.31, + "learning_rate": 1.620073332937498e-05, + "loss": 0.4197, + "step": 3894 + }, + { + "epoch": 0.31, + "learning_rate": 1.6198719960820917e-05, + "loss": 0.2995, + "step": 3895 + }, + { + "epoch": 0.31, + "learning_rate": 1.619670618411097e-05, + "loss": 0.4452, + "step": 3896 + }, + { + "epoch": 0.31, + "learning_rate": 1.6194691999377736e-05, + "loss": 0.3009, + "step": 3897 + }, + { + "epoch": 0.31, + "learning_rate": 1.619267740675384e-05, + "loss": 0.4656, + "step": 3898 + }, + { + "epoch": 0.31, + "learning_rate": 1.6190662406371937e-05, + "loss": 0.2403, + "step": 3899 + }, + { + "epoch": 0.31, + "learning_rate": 1.6188646998364703e-05, + "loss": 0.4265, + "step": 3900 + }, + { + "epoch": 0.31, + "learning_rate": 1.6186631182864835e-05, + "loss": 0.3497, + "step": 3901 + }, + { + "epoch": 0.31, + "learning_rate": 1.6184614960005078e-05, + "loss": 0.358, + "step": 3902 + }, + { + "epoch": 0.31, + "learning_rate": 1.6182598329918185e-05, + "loss": 0.3655, + "step": 3903 + }, + { + "epoch": 0.31, + "learning_rate": 1.6180581292736938e-05, + "loss": 0.3343, + "step": 3904 + }, + { + "epoch": 0.31, + "learning_rate": 1.617856384859415e-05, + "loss": 0.3619, + "step": 3905 + }, + { + "epoch": 0.31, + "learning_rate": 1.6176545997622662e-05, + "loss": 0.3557, + "step": 3906 + }, + { + "epoch": 0.31, + "learning_rate": 1.6174527739955345e-05, + "loss": 0.3957, + "step": 3907 + }, + { + "epoch": 0.31, + "learning_rate": 1.6172509075725084e-05, + "loss": 0.4111, + "step": 3908 + }, + { + "epoch": 0.31, + "learning_rate": 1.61704900050648e-05, + "loss": 0.3001, + "step": 3909 + }, + { + "epoch": 0.31, + "learning_rate": 1.616847052810744e-05, + "loss": 0.4999, + "step": 3910 + }, + { + "epoch": 0.31, + "learning_rate": 1.6166450644985975e-05, + "loss": 0.3603, + "step": 3911 + }, + { + "epoch": 0.31, + "learning_rate": 1.6164430355833407e-05, + "loss": 0.3089, + "step": 3912 + }, + { + "epoch": 0.31, + "learning_rate": 1.616240966078276e-05, + "loss": 0.4429, + "step": 3913 + }, + { + "epoch": 0.31, + "learning_rate": 1.616038855996709e-05, + "loss": 0.2318, + "step": 3914 + }, + { + "epoch": 0.31, + "learning_rate": 1.6158367053519476e-05, + "loss": 0.3074, + "step": 3915 + }, + { + "epoch": 0.31, + "learning_rate": 1.6156345141573022e-05, + "loss": 0.442, + "step": 3916 + }, + { + "epoch": 0.31, + "learning_rate": 1.6154322824260865e-05, + "loss": 0.5281, + "step": 3917 + }, + { + "epoch": 0.31, + "learning_rate": 1.615230010171616e-05, + "loss": 0.4617, + "step": 3918 + }, + { + "epoch": 0.31, + "learning_rate": 1.61502769740721e-05, + "loss": 0.361, + "step": 3919 + }, + { + "epoch": 0.31, + "learning_rate": 1.6148253441461887e-05, + "loss": 0.361, + "step": 3920 + }, + { + "epoch": 0.31, + "learning_rate": 1.6146229504018777e-05, + "loss": 0.3569, + "step": 3921 + }, + { + "epoch": 0.31, + "learning_rate": 1.6144205161876023e-05, + "loss": 0.5045, + "step": 3922 + }, + { + "epoch": 0.31, + "learning_rate": 1.6142180415166926e-05, + "loss": 0.3246, + "step": 3923 + }, + { + "epoch": 0.31, + "learning_rate": 1.61401552640248e-05, + "loss": 0.4448, + "step": 3924 + }, + { + "epoch": 0.31, + "learning_rate": 1.6138129708582996e-05, + "loss": 0.2934, + "step": 3925 + }, + { + "epoch": 0.31, + "learning_rate": 1.6136103748974885e-05, + "loss": 0.2892, + "step": 3926 + }, + { + "epoch": 0.31, + "learning_rate": 1.6134077385333867e-05, + "loss": 0.4102, + "step": 3927 + }, + { + "epoch": 0.31, + "learning_rate": 1.613205061779337e-05, + "loss": 0.3184, + "step": 3928 + }, + { + "epoch": 0.31, + "learning_rate": 1.6130023446486844e-05, + "loss": 0.4278, + "step": 3929 + }, + { + "epoch": 0.31, + "learning_rate": 1.612799587154777e-05, + "loss": 0.4166, + "step": 3930 + }, + { + "epoch": 0.31, + "learning_rate": 1.6125967893109657e-05, + "loss": 0.3537, + "step": 3931 + }, + { + "epoch": 0.31, + "learning_rate": 1.6123939511306028e-05, + "loss": 0.3385, + "step": 3932 + }, + { + "epoch": 0.31, + "learning_rate": 1.6121910726270453e-05, + "loss": 0.396, + "step": 3933 + }, + { + "epoch": 0.31, + "learning_rate": 1.6119881538136514e-05, + "loss": 0.3638, + "step": 3934 + }, + { + "epoch": 0.31, + "learning_rate": 1.611785194703782e-05, + "loss": 0.42, + "step": 3935 + }, + { + "epoch": 0.31, + "learning_rate": 1.6115821953108015e-05, + "loss": 0.3648, + "step": 3936 + }, + { + "epoch": 0.31, + "learning_rate": 1.611379155648076e-05, + "loss": 0.4262, + "step": 3937 + }, + { + "epoch": 0.31, + "learning_rate": 1.611176075728975e-05, + "loss": 0.3446, + "step": 3938 + }, + { + "epoch": 0.31, + "learning_rate": 1.61097295556687e-05, + "loss": 0.3998, + "step": 3939 + }, + { + "epoch": 0.31, + "learning_rate": 1.610769795175136e-05, + "loss": 0.3231, + "step": 3940 + }, + { + "epoch": 0.31, + "learning_rate": 1.6105665945671497e-05, + "loss": 0.3293, + "step": 3941 + }, + { + "epoch": 0.31, + "learning_rate": 1.610363353756291e-05, + "loss": 0.3622, + "step": 3942 + }, + { + "epoch": 0.31, + "learning_rate": 1.6101600727559423e-05, + "loss": 0.2223, + "step": 3943 + }, + { + "epoch": 0.31, + "learning_rate": 1.6099567515794886e-05, + "loss": 0.4157, + "step": 3944 + }, + { + "epoch": 0.31, + "learning_rate": 1.609753390240318e-05, + "loss": 0.2454, + "step": 3945 + }, + { + "epoch": 0.31, + "learning_rate": 1.6095499887518204e-05, + "loss": 0.3586, + "step": 3946 + }, + { + "epoch": 0.31, + "learning_rate": 1.6093465471273894e-05, + "loss": 0.4347, + "step": 3947 + }, + { + "epoch": 0.31, + "learning_rate": 1.60914306538042e-05, + "loss": 0.4207, + "step": 3948 + }, + { + "epoch": 0.31, + "learning_rate": 1.6089395435243105e-05, + "loss": 0.4856, + "step": 3949 + }, + { + "epoch": 0.31, + "learning_rate": 1.6087359815724623e-05, + "loss": 0.4255, + "step": 3950 + }, + { + "epoch": 0.31, + "learning_rate": 1.6085323795382785e-05, + "loss": 0.454, + "step": 3951 + }, + { + "epoch": 0.31, + "learning_rate": 1.608328737435166e-05, + "loss": 0.4065, + "step": 3952 + }, + { + "epoch": 0.31, + "learning_rate": 1.608125055276533e-05, + "loss": 0.3922, + "step": 3953 + }, + { + "epoch": 0.31, + "learning_rate": 1.607921333075791e-05, + "loss": 0.4391, + "step": 3954 + }, + { + "epoch": 0.31, + "learning_rate": 1.607717570846355e-05, + "loss": 0.5842, + "step": 3955 + }, + { + "epoch": 0.31, + "learning_rate": 1.6075137686016408e-05, + "loss": 0.3744, + "step": 3956 + }, + { + "epoch": 0.31, + "learning_rate": 1.6073099263550677e-05, + "loss": 0.3824, + "step": 3957 + }, + { + "epoch": 0.31, + "learning_rate": 1.6071060441200587e-05, + "loss": 0.2831, + "step": 3958 + }, + { + "epoch": 0.31, + "learning_rate": 1.6069021219100375e-05, + "loss": 0.2809, + "step": 3959 + }, + { + "epoch": 0.31, + "learning_rate": 1.606698159738432e-05, + "loss": 0.4213, + "step": 3960 + }, + { + "epoch": 0.31, + "learning_rate": 1.606494157618672e-05, + "loss": 0.4321, + "step": 3961 + }, + { + "epoch": 0.31, + "learning_rate": 1.60629011556419e-05, + "loss": 0.3179, + "step": 3962 + }, + { + "epoch": 0.31, + "learning_rate": 1.6060860335884208e-05, + "loss": 0.3017, + "step": 3963 + }, + { + "epoch": 0.31, + "learning_rate": 1.605881911704803e-05, + "loss": 0.4476, + "step": 3964 + }, + { + "epoch": 0.31, + "learning_rate": 1.6056777499267764e-05, + "loss": 0.4402, + "step": 3965 + }, + { + "epoch": 0.31, + "learning_rate": 1.6054735482677842e-05, + "loss": 0.3733, + "step": 3966 + }, + { + "epoch": 0.31, + "learning_rate": 1.6052693067412724e-05, + "loss": 0.252, + "step": 3967 + }, + { + "epoch": 0.31, + "learning_rate": 1.605065025360689e-05, + "loss": 0.3107, + "step": 3968 + }, + { + "epoch": 0.31, + "learning_rate": 1.6048607041394856e-05, + "loss": 0.2646, + "step": 3969 + }, + { + "epoch": 0.31, + "learning_rate": 1.6046563430911148e-05, + "loss": 0.3403, + "step": 3970 + }, + { + "epoch": 0.31, + "learning_rate": 1.6044519422290333e-05, + "loss": 0.4026, + "step": 3971 + }, + { + "epoch": 0.31, + "learning_rate": 1.6042475015666995e-05, + "loss": 0.3324, + "step": 3972 + }, + { + "epoch": 0.31, + "learning_rate": 1.604043021117575e-05, + "loss": 0.2989, + "step": 3973 + }, + { + "epoch": 0.31, + "learning_rate": 1.603838500895125e-05, + "loss": 0.3689, + "step": 3974 + }, + { + "epoch": 0.31, + "learning_rate": 1.6036339409128146e-05, + "loss": 0.4692, + "step": 3975 + }, + { + "epoch": 0.31, + "learning_rate": 1.603429341184114e-05, + "loss": 0.292, + "step": 3976 + }, + { + "epoch": 0.32, + "learning_rate": 1.6032247017224944e-05, + "loss": 0.3163, + "step": 3977 + }, + { + "epoch": 0.32, + "learning_rate": 1.603020022541431e-05, + "loss": 0.3179, + "step": 3978 + }, + { + "epoch": 0.32, + "learning_rate": 1.6028153036544005e-05, + "loss": 0.4448, + "step": 3979 + }, + { + "epoch": 0.32, + "learning_rate": 1.6026105450748826e-05, + "loss": 0.4003, + "step": 3980 + }, + { + "epoch": 0.32, + "learning_rate": 1.6024057468163604e-05, + "loss": 0.3249, + "step": 3981 + }, + { + "epoch": 0.32, + "learning_rate": 1.602200908892318e-05, + "loss": 0.35, + "step": 3982 + }, + { + "epoch": 0.32, + "learning_rate": 1.6019960313162436e-05, + "loss": 0.3609, + "step": 3983 + }, + { + "epoch": 0.32, + "learning_rate": 1.601791114101627e-05, + "loss": 0.4053, + "step": 3984 + }, + { + "epoch": 0.32, + "learning_rate": 1.6015861572619612e-05, + "loss": 0.3888, + "step": 3985 + }, + { + "epoch": 0.32, + "learning_rate": 1.6013811608107415e-05, + "loss": 0.391, + "step": 3986 + }, + { + "epoch": 0.32, + "learning_rate": 1.6011761247614664e-05, + "loss": 0.3863, + "step": 3987 + }, + { + "epoch": 0.32, + "learning_rate": 1.600971049127636e-05, + "loss": 0.2883, + "step": 3988 + }, + { + "epoch": 0.32, + "learning_rate": 1.6007659339227534e-05, + "loss": 0.3601, + "step": 3989 + }, + { + "epoch": 0.32, + "learning_rate": 1.6005607791603247e-05, + "loss": 0.4042, + "step": 3990 + }, + { + "epoch": 0.32, + "learning_rate": 1.6003555848538586e-05, + "loss": 0.3917, + "step": 3991 + }, + { + "epoch": 0.32, + "learning_rate": 1.600150351016866e-05, + "loss": 0.3971, + "step": 3992 + }, + { + "epoch": 0.32, + "learning_rate": 1.5999450776628607e-05, + "loss": 0.4545, + "step": 3993 + }, + { + "epoch": 0.32, + "learning_rate": 1.5997397648053587e-05, + "loss": 0.4982, + "step": 3994 + }, + { + "epoch": 0.32, + "learning_rate": 1.599534412457879e-05, + "loss": 0.406, + "step": 3995 + }, + { + "epoch": 0.32, + "learning_rate": 1.5993290206339426e-05, + "loss": 0.3235, + "step": 3996 + }, + { + "epoch": 0.32, + "learning_rate": 1.5991235893470745e-05, + "loss": 0.5409, + "step": 3997 + }, + { + "epoch": 0.32, + "learning_rate": 1.5989181186108003e-05, + "loss": 0.4354, + "step": 3998 + }, + { + "epoch": 0.32, + "learning_rate": 1.59871260843865e-05, + "loss": 0.3246, + "step": 3999 + }, + { + "epoch": 0.32, + "learning_rate": 1.5985070588441556e-05, + "loss": 0.407, + "step": 4000 + }, + { + "epoch": 0.32, + "learning_rate": 1.598301469840851e-05, + "loss": 0.3885, + "step": 4001 + }, + { + "epoch": 0.32, + "learning_rate": 1.598095841442273e-05, + "loss": 0.3204, + "step": 4002 + }, + { + "epoch": 0.32, + "learning_rate": 1.5978901736619624e-05, + "loss": 0.3429, + "step": 4003 + }, + { + "epoch": 0.32, + "learning_rate": 1.5976844665134607e-05, + "loss": 0.3739, + "step": 4004 + }, + { + "epoch": 0.32, + "learning_rate": 1.5974787200103124e-05, + "loss": 0.4011, + "step": 4005 + }, + { + "epoch": 0.32, + "learning_rate": 1.5972729341660653e-05, + "loss": 0.4526, + "step": 4006 + }, + { + "epoch": 0.32, + "learning_rate": 1.597067108994269e-05, + "loss": 0.3499, + "step": 4007 + }, + { + "epoch": 0.32, + "learning_rate": 1.5968612445084773e-05, + "loss": 0.3963, + "step": 4008 + }, + { + "epoch": 0.32, + "learning_rate": 1.596655340722244e-05, + "loss": 0.3595, + "step": 4009 + }, + { + "epoch": 0.32, + "learning_rate": 1.5964493976491278e-05, + "loss": 0.3162, + "step": 4010 + }, + { + "epoch": 0.32, + "learning_rate": 1.5962434153026884e-05, + "loss": 0.3535, + "step": 4011 + }, + { + "epoch": 0.32, + "learning_rate": 1.596037393696489e-05, + "loss": 0.3963, + "step": 4012 + }, + { + "epoch": 0.32, + "learning_rate": 1.5958313328440954e-05, + "loss": 0.2685, + "step": 4013 + }, + { + "epoch": 0.32, + "learning_rate": 1.595625232759076e-05, + "loss": 0.6723, + "step": 4014 + }, + { + "epoch": 0.32, + "learning_rate": 1.595419093455e-05, + "loss": 0.2335, + "step": 4015 + }, + { + "epoch": 0.32, + "learning_rate": 1.5952129149454422e-05, + "loss": 0.519, + "step": 4016 + }, + { + "epoch": 0.32, + "learning_rate": 1.595006697243978e-05, + "loss": 0.4117, + "step": 4017 + }, + { + "epoch": 0.32, + "learning_rate": 1.5948004403641853e-05, + "loss": 0.4196, + "step": 4018 + }, + { + "epoch": 0.32, + "learning_rate": 1.594594144319646e-05, + "loss": 0.3838, + "step": 4019 + }, + { + "epoch": 0.32, + "learning_rate": 1.594387809123943e-05, + "loss": 0.381, + "step": 4020 + }, + { + "epoch": 0.32, + "learning_rate": 1.594181434790663e-05, + "loss": 0.3541, + "step": 4021 + }, + { + "epoch": 0.32, + "learning_rate": 1.5939750213333948e-05, + "loss": 0.4621, + "step": 4022 + }, + { + "epoch": 0.32, + "learning_rate": 1.593768568765729e-05, + "loss": 0.3036, + "step": 4023 + }, + { + "epoch": 0.32, + "learning_rate": 1.5935620771012603e-05, + "loss": 0.4107, + "step": 4024 + }, + { + "epoch": 0.32, + "learning_rate": 1.5933555463535846e-05, + "loss": 0.3488, + "step": 4025 + }, + { + "epoch": 0.32, + "learning_rate": 1.5931489765363014e-05, + "loss": 0.2804, + "step": 4026 + }, + { + "epoch": 0.32, + "learning_rate": 1.592942367663012e-05, + "loss": 0.4871, + "step": 4027 + }, + { + "epoch": 0.32, + "learning_rate": 1.5927357197473207e-05, + "loss": 0.4143, + "step": 4028 + }, + { + "epoch": 0.32, + "learning_rate": 1.5925290328028346e-05, + "loss": 0.2905, + "step": 4029 + }, + { + "epoch": 0.32, + "learning_rate": 1.5923223068431626e-05, + "loss": 0.4246, + "step": 4030 + }, + { + "epoch": 0.32, + "learning_rate": 1.592115541881917e-05, + "loss": 0.5062, + "step": 4031 + }, + { + "epoch": 0.32, + "learning_rate": 1.5919087379327116e-05, + "loss": 0.4372, + "step": 4032 + }, + { + "epoch": 0.32, + "learning_rate": 1.5917018950091642e-05, + "loss": 0.3046, + "step": 4033 + }, + { + "epoch": 0.32, + "learning_rate": 1.591495013124894e-05, + "loss": 0.3604, + "step": 4034 + }, + { + "epoch": 0.32, + "learning_rate": 1.591288092293523e-05, + "loss": 0.4021, + "step": 4035 + }, + { + "epoch": 0.32, + "learning_rate": 1.5910811325286768e-05, + "loss": 0.4663, + "step": 4036 + }, + { + "epoch": 0.32, + "learning_rate": 1.5908741338439818e-05, + "loss": 0.4209, + "step": 4037 + }, + { + "epoch": 0.32, + "learning_rate": 1.5906670962530683e-05, + "loss": 0.4377, + "step": 4038 + }, + { + "epoch": 0.32, + "learning_rate": 1.5904600197695684e-05, + "loss": 0.4172, + "step": 4039 + }, + { + "epoch": 0.32, + "learning_rate": 1.5902529044071173e-05, + "loss": 0.426, + "step": 4040 + }, + { + "epoch": 0.32, + "learning_rate": 1.590045750179353e-05, + "loss": 0.4147, + "step": 4041 + }, + { + "epoch": 0.32, + "learning_rate": 1.5898385570999146e-05, + "loss": 0.305, + "step": 4042 + }, + { + "epoch": 0.32, + "learning_rate": 1.589631325182446e-05, + "loss": 0.3733, + "step": 4043 + }, + { + "epoch": 0.32, + "learning_rate": 1.589424054440591e-05, + "loss": 0.4896, + "step": 4044 + }, + { + "epoch": 0.32, + "learning_rate": 1.5892167448879984e-05, + "loss": 0.2743, + "step": 4045 + }, + { + "epoch": 0.32, + "learning_rate": 1.5890093965383186e-05, + "loss": 0.4946, + "step": 4046 + }, + { + "epoch": 0.32, + "learning_rate": 1.588802009405204e-05, + "loss": 0.4613, + "step": 4047 + }, + { + "epoch": 0.32, + "learning_rate": 1.5885945835023104e-05, + "loss": 0.5413, + "step": 4048 + }, + { + "epoch": 0.32, + "learning_rate": 1.5883871188432955e-05, + "loss": 0.4722, + "step": 4049 + }, + { + "epoch": 0.32, + "learning_rate": 1.5881796154418196e-05, + "loss": 0.2338, + "step": 4050 + }, + { + "epoch": 0.32, + "learning_rate": 1.5879720733115464e-05, + "loss": 0.3846, + "step": 4051 + }, + { + "epoch": 0.32, + "learning_rate": 1.5877644924661412e-05, + "loss": 0.3352, + "step": 4052 + }, + { + "epoch": 0.32, + "learning_rate": 1.5875568729192728e-05, + "loss": 0.2651, + "step": 4053 + }, + { + "epoch": 0.32, + "learning_rate": 1.587349214684611e-05, + "loss": 0.2961, + "step": 4054 + }, + { + "epoch": 0.32, + "learning_rate": 1.5871415177758297e-05, + "loss": 0.3735, + "step": 4055 + }, + { + "epoch": 0.32, + "learning_rate": 1.5869337822066043e-05, + "loss": 0.41, + "step": 4056 + }, + { + "epoch": 0.32, + "learning_rate": 1.586726007990614e-05, + "loss": 0.4383, + "step": 4057 + }, + { + "epoch": 0.32, + "learning_rate": 1.586518195141539e-05, + "loss": 0.3217, + "step": 4058 + }, + { + "epoch": 0.32, + "learning_rate": 1.5863103436730627e-05, + "loss": 0.3566, + "step": 4059 + }, + { + "epoch": 0.32, + "learning_rate": 1.586102453598872e-05, + "loss": 0.3609, + "step": 4060 + }, + { + "epoch": 0.32, + "learning_rate": 1.5858945249326545e-05, + "loss": 0.3402, + "step": 4061 + }, + { + "epoch": 0.32, + "learning_rate": 1.5856865576881016e-05, + "loss": 0.3896, + "step": 4062 + }, + { + "epoch": 0.32, + "learning_rate": 1.5854785518789074e-05, + "loss": 0.4865, + "step": 4063 + }, + { + "epoch": 0.32, + "learning_rate": 1.5852705075187674e-05, + "loss": 0.3829, + "step": 4064 + }, + { + "epoch": 0.32, + "learning_rate": 1.5850624246213805e-05, + "loss": 0.3752, + "step": 4065 + }, + { + "epoch": 0.32, + "learning_rate": 1.5848543032004483e-05, + "loss": 0.5193, + "step": 4066 + }, + { + "epoch": 0.32, + "learning_rate": 1.5846461432696744e-05, + "loss": 0.4241, + "step": 4067 + }, + { + "epoch": 0.32, + "learning_rate": 1.5844379448427648e-05, + "loss": 0.5836, + "step": 4068 + }, + { + "epoch": 0.32, + "learning_rate": 1.5842297079334293e-05, + "loss": 0.3291, + "step": 4069 + }, + { + "epoch": 0.32, + "learning_rate": 1.5840214325553782e-05, + "loss": 0.4188, + "step": 4070 + }, + { + "epoch": 0.32, + "learning_rate": 1.583813118722326e-05, + "loss": 0.5066, + "step": 4071 + }, + { + "epoch": 0.32, + "learning_rate": 1.583604766447989e-05, + "loss": 0.4439, + "step": 4072 + }, + { + "epoch": 0.32, + "learning_rate": 1.5833963757460863e-05, + "loss": 0.4937, + "step": 4073 + }, + { + "epoch": 0.32, + "learning_rate": 1.5831879466303393e-05, + "loss": 0.4279, + "step": 4074 + }, + { + "epoch": 0.32, + "learning_rate": 1.5829794791144723e-05, + "loss": 0.4023, + "step": 4075 + }, + { + "epoch": 0.32, + "learning_rate": 1.5827709732122115e-05, + "loss": 0.3791, + "step": 4076 + }, + { + "epoch": 0.32, + "learning_rate": 1.5825624289372864e-05, + "loss": 0.4959, + "step": 4077 + }, + { + "epoch": 0.32, + "learning_rate": 1.5823538463034283e-05, + "loss": 0.3836, + "step": 4078 + }, + { + "epoch": 0.32, + "learning_rate": 1.5821452253243718e-05, + "loss": 0.4124, + "step": 4079 + }, + { + "epoch": 0.32, + "learning_rate": 1.581936566013853e-05, + "loss": 0.4488, + "step": 4080 + }, + { + "epoch": 0.32, + "learning_rate": 1.5817278683856117e-05, + "loss": 0.3194, + "step": 4081 + }, + { + "epoch": 0.32, + "learning_rate": 1.5815191324533893e-05, + "loss": 0.4364, + "step": 4082 + }, + { + "epoch": 0.32, + "learning_rate": 1.58131035823093e-05, + "loss": 0.4484, + "step": 4083 + }, + { + "epoch": 0.32, + "learning_rate": 1.581101545731981e-05, + "loss": 0.375, + "step": 4084 + }, + { + "epoch": 0.32, + "learning_rate": 1.580892694970291e-05, + "loss": 0.4116, + "step": 4085 + }, + { + "epoch": 0.32, + "learning_rate": 1.580683805959612e-05, + "loss": 0.3166, + "step": 4086 + }, + { + "epoch": 0.32, + "learning_rate": 1.5804748787136987e-05, + "loss": 0.4234, + "step": 4087 + }, + { + "epoch": 0.32, + "learning_rate": 1.5802659132463076e-05, + "loss": 0.3104, + "step": 4088 + }, + { + "epoch": 0.32, + "learning_rate": 1.5800569095711983e-05, + "loss": 0.323, + "step": 4089 + }, + { + "epoch": 0.32, + "learning_rate": 1.5798478677021327e-05, + "loss": 0.48, + "step": 4090 + }, + { + "epoch": 0.32, + "learning_rate": 1.5796387876528746e-05, + "loss": 0.3683, + "step": 4091 + }, + { + "epoch": 0.32, + "learning_rate": 1.579429669437192e-05, + "loss": 0.3604, + "step": 4092 + }, + { + "epoch": 0.32, + "learning_rate": 1.579220513068853e-05, + "loss": 0.4864, + "step": 4093 + }, + { + "epoch": 0.32, + "learning_rate": 1.5790113185616305e-05, + "loss": 0.3199, + "step": 4094 + }, + { + "epoch": 0.32, + "learning_rate": 1.5788020859292987e-05, + "loss": 0.3623, + "step": 4095 + }, + { + "epoch": 0.32, + "learning_rate": 1.5785928151856345e-05, + "loss": 0.3448, + "step": 4096 + }, + { + "epoch": 0.32, + "learning_rate": 1.5783835063444176e-05, + "loss": 0.3154, + "step": 4097 + }, + { + "epoch": 0.32, + "learning_rate": 1.57817415941943e-05, + "loss": 0.4089, + "step": 4098 + }, + { + "epoch": 0.32, + "learning_rate": 1.5779647744244556e-05, + "loss": 0.4147, + "step": 4099 + }, + { + "epoch": 0.32, + "learning_rate": 1.577755351373282e-05, + "loss": 0.3799, + "step": 4100 + }, + { + "epoch": 0.32, + "learning_rate": 1.5775458902796982e-05, + "loss": 0.3224, + "step": 4101 + }, + { + "epoch": 0.32, + "learning_rate": 1.577336391157497e-05, + "loss": 0.4043, + "step": 4102 + }, + { + "epoch": 0.33, + "learning_rate": 1.5771268540204724e-05, + "loss": 0.4262, + "step": 4103 + }, + { + "epoch": 0.33, + "learning_rate": 1.576917278882421e-05, + "loss": 0.3558, + "step": 4104 + }, + { + "epoch": 0.33, + "learning_rate": 1.576707665757143e-05, + "loss": 0.3475, + "step": 4105 + }, + { + "epoch": 0.33, + "learning_rate": 1.5764980146584402e-05, + "loss": 0.3469, + "step": 4106 + }, + { + "epoch": 0.33, + "learning_rate": 1.5762883256001168e-05, + "loss": 0.3347, + "step": 4107 + }, + { + "epoch": 0.33, + "learning_rate": 1.57607859859598e-05, + "loss": 0.3961, + "step": 4108 + }, + { + "epoch": 0.33, + "learning_rate": 1.5758688336598397e-05, + "loss": 0.4293, + "step": 4109 + }, + { + "epoch": 0.33, + "learning_rate": 1.5756590308055075e-05, + "loss": 0.3415, + "step": 4110 + }, + { + "epoch": 0.33, + "learning_rate": 1.5754491900467982e-05, + "loss": 0.3812, + "step": 4111 + }, + { + "epoch": 0.33, + "learning_rate": 1.5752393113975282e-05, + "loss": 0.4778, + "step": 4112 + }, + { + "epoch": 0.33, + "learning_rate": 1.5750293948715178e-05, + "loss": 0.3152, + "step": 4113 + }, + { + "epoch": 0.33, + "learning_rate": 1.5748194404825885e-05, + "loss": 0.45, + "step": 4114 + }, + { + "epoch": 0.33, + "learning_rate": 1.574609448244565e-05, + "loss": 0.4239, + "step": 4115 + }, + { + "epoch": 0.33, + "learning_rate": 1.574399418171274e-05, + "loss": 0.4398, + "step": 4116 + }, + { + "epoch": 0.33, + "learning_rate": 1.5741893502765452e-05, + "loss": 0.3838, + "step": 4117 + }, + { + "epoch": 0.33, + "learning_rate": 1.5739792445742103e-05, + "loss": 0.3513, + "step": 4118 + }, + { + "epoch": 0.33, + "learning_rate": 1.573769101078104e-05, + "loss": 0.456, + "step": 4119 + }, + { + "epoch": 0.33, + "learning_rate": 1.573558919802064e-05, + "loss": 0.3602, + "step": 4120 + }, + { + "epoch": 0.33, + "learning_rate": 1.573348700759928e-05, + "loss": 0.41, + "step": 4121 + }, + { + "epoch": 0.33, + "learning_rate": 1.573138443965539e-05, + "loss": 0.3903, + "step": 4122 + }, + { + "epoch": 0.33, + "learning_rate": 1.572928149432741e-05, + "loss": 0.4295, + "step": 4123 + }, + { + "epoch": 0.33, + "learning_rate": 1.5727178171753817e-05, + "loss": 0.3569, + "step": 4124 + }, + { + "epoch": 0.33, + "learning_rate": 1.57250744720731e-05, + "loss": 0.3485, + "step": 4125 + }, + { + "epoch": 0.33, + "learning_rate": 1.572297039542377e-05, + "loss": 0.3468, + "step": 4126 + }, + { + "epoch": 0.33, + "learning_rate": 1.572086594194438e-05, + "loss": 0.3927, + "step": 4127 + }, + { + "epoch": 0.33, + "learning_rate": 1.571876111177349e-05, + "loss": 0.3043, + "step": 4128 + }, + { + "epoch": 0.33, + "learning_rate": 1.571665590504971e-05, + "loss": 0.3083, + "step": 4129 + }, + { + "epoch": 0.33, + "learning_rate": 1.5714550321911636e-05, + "loss": 0.3931, + "step": 4130 + }, + { + "epoch": 0.33, + "learning_rate": 1.5712444362497917e-05, + "loss": 0.2831, + "step": 4131 + }, + { + "epoch": 0.33, + "learning_rate": 1.5710338026947227e-05, + "loss": 0.5664, + "step": 4132 + }, + { + "epoch": 0.33, + "learning_rate": 1.5708231315398255e-05, + "loss": 0.3412, + "step": 4133 + }, + { + "epoch": 0.33, + "learning_rate": 1.570612422798972e-05, + "loss": 0.257, + "step": 4134 + }, + { + "epoch": 0.33, + "learning_rate": 1.5704016764860358e-05, + "loss": 0.334, + "step": 4135 + }, + { + "epoch": 0.33, + "learning_rate": 1.5701908926148933e-05, + "loss": 0.2846, + "step": 4136 + }, + { + "epoch": 0.33, + "learning_rate": 1.5699800711994247e-05, + "loss": 0.3247, + "step": 4137 + }, + { + "epoch": 0.33, + "learning_rate": 1.569769212253511e-05, + "loss": 0.3969, + "step": 4138 + }, + { + "epoch": 0.33, + "learning_rate": 1.569558315791036e-05, + "loss": 0.4876, + "step": 4139 + }, + { + "epoch": 0.33, + "learning_rate": 1.5693473818258866e-05, + "loss": 0.3927, + "step": 4140 + }, + { + "epoch": 0.33, + "learning_rate": 1.5691364103719515e-05, + "loss": 0.3905, + "step": 4141 + }, + { + "epoch": 0.33, + "learning_rate": 1.5689254014431225e-05, + "loss": 0.3682, + "step": 4142 + }, + { + "epoch": 0.33, + "learning_rate": 1.5687143550532932e-05, + "loss": 0.3792, + "step": 4143 + }, + { + "epoch": 0.33, + "learning_rate": 1.56850327121636e-05, + "loss": 0.3538, + "step": 4144 + }, + { + "epoch": 0.33, + "learning_rate": 1.568292149946222e-05, + "loss": 0.4166, + "step": 4145 + }, + { + "epoch": 0.33, + "learning_rate": 1.56808099125678e-05, + "loss": 0.3547, + "step": 4146 + }, + { + "epoch": 0.33, + "learning_rate": 1.5678697951619386e-05, + "loss": 0.3511, + "step": 4147 + }, + { + "epoch": 0.33, + "learning_rate": 1.5676585616756037e-05, + "loss": 0.4387, + "step": 4148 + }, + { + "epoch": 0.33, + "learning_rate": 1.5674472908116834e-05, + "loss": 0.4227, + "step": 4149 + }, + { + "epoch": 0.33, + "learning_rate": 1.5672359825840895e-05, + "loss": 0.3855, + "step": 4150 + }, + { + "epoch": 0.33, + "learning_rate": 1.567024637006736e-05, + "loss": 0.3158, + "step": 4151 + }, + { + "epoch": 0.33, + "learning_rate": 1.566813254093538e-05, + "loss": 0.378, + "step": 4152 + }, + { + "epoch": 0.33, + "learning_rate": 1.566601833858415e-05, + "loss": 0.3729, + "step": 4153 + }, + { + "epoch": 0.33, + "learning_rate": 1.566390376315287e-05, + "loss": 0.3762, + "step": 4154 + }, + { + "epoch": 0.33, + "learning_rate": 1.5661788814780782e-05, + "loss": 0.3661, + "step": 4155 + }, + { + "epoch": 0.33, + "learning_rate": 1.5659673493607144e-05, + "loss": 0.3505, + "step": 4156 + }, + { + "epoch": 0.33, + "learning_rate": 1.565755779977124e-05, + "loss": 0.3618, + "step": 4157 + }, + { + "epoch": 0.33, + "learning_rate": 1.5655441733412376e-05, + "loss": 0.3183, + "step": 4158 + }, + { + "epoch": 0.33, + "learning_rate": 1.5653325294669884e-05, + "loss": 0.2777, + "step": 4159 + }, + { + "epoch": 0.33, + "learning_rate": 1.565120848368313e-05, + "loss": 0.3096, + "step": 4160 + }, + { + "epoch": 0.33, + "learning_rate": 1.5649091300591482e-05, + "loss": 0.2072, + "step": 4161 + }, + { + "epoch": 0.33, + "learning_rate": 1.564697374553436e-05, + "loss": 0.2873, + "step": 4162 + }, + { + "epoch": 0.33, + "learning_rate": 1.5644855818651184e-05, + "loss": 0.4542, + "step": 4163 + }, + { + "epoch": 0.33, + "learning_rate": 1.564273752008141e-05, + "loss": 0.5235, + "step": 4164 + }, + { + "epoch": 0.33, + "learning_rate": 1.5640618849964528e-05, + "loss": 0.2544, + "step": 4165 + }, + { + "epoch": 0.33, + "learning_rate": 1.5638499808440036e-05, + "loss": 0.4013, + "step": 4166 + }, + { + "epoch": 0.33, + "learning_rate": 1.563638039564746e-05, + "loss": 0.2805, + "step": 4167 + }, + { + "epoch": 0.33, + "learning_rate": 1.5634260611726355e-05, + "loss": 0.3858, + "step": 4168 + }, + { + "epoch": 0.33, + "learning_rate": 1.5632140456816302e-05, + "loss": 0.3501, + "step": 4169 + }, + { + "epoch": 0.33, + "learning_rate": 1.5630019931056894e-05, + "loss": 0.4189, + "step": 4170 + }, + { + "epoch": 0.33, + "learning_rate": 1.5627899034587768e-05, + "loss": 0.3955, + "step": 4171 + }, + { + "epoch": 0.33, + "learning_rate": 1.562577776754857e-05, + "loss": 0.4211, + "step": 4172 + }, + { + "epoch": 0.33, + "learning_rate": 1.5623656130078976e-05, + "loss": 0.3873, + "step": 4173 + }, + { + "epoch": 0.33, + "learning_rate": 1.5621534122318682e-05, + "loss": 0.3535, + "step": 4174 + }, + { + "epoch": 0.33, + "learning_rate": 1.5619411744407416e-05, + "loss": 0.3675, + "step": 4175 + }, + { + "epoch": 0.33, + "learning_rate": 1.561728899648493e-05, + "loss": 0.5141, + "step": 4176 + }, + { + "epoch": 0.33, + "learning_rate": 1.561516587869099e-05, + "loss": 0.3348, + "step": 4177 + }, + { + "epoch": 0.33, + "learning_rate": 1.5613042391165395e-05, + "loss": 0.5207, + "step": 4178 + }, + { + "epoch": 0.33, + "learning_rate": 1.5610918534047964e-05, + "loss": 0.399, + "step": 4179 + }, + { + "epoch": 0.33, + "learning_rate": 1.5608794307478546e-05, + "loss": 0.4458, + "step": 4180 + }, + { + "epoch": 0.33, + "learning_rate": 1.5606669711597017e-05, + "loss": 0.3893, + "step": 4181 + }, + { + "epoch": 0.33, + "learning_rate": 1.560454474654326e-05, + "loss": 0.3072, + "step": 4182 + }, + { + "epoch": 0.33, + "learning_rate": 1.56024194124572e-05, + "loss": 0.4436, + "step": 4183 + }, + { + "epoch": 0.33, + "learning_rate": 1.5600293709478776e-05, + "loss": 0.3324, + "step": 4184 + }, + { + "epoch": 0.33, + "learning_rate": 1.559816763774796e-05, + "loss": 0.4012, + "step": 4185 + }, + { + "epoch": 0.33, + "learning_rate": 1.559604119740474e-05, + "loss": 0.1951, + "step": 4186 + }, + { + "epoch": 0.33, + "learning_rate": 1.5593914388589136e-05, + "loss": 0.3446, + "step": 4187 + }, + { + "epoch": 0.33, + "learning_rate": 1.559178721144119e-05, + "loss": 0.4079, + "step": 4188 + }, + { + "epoch": 0.33, + "learning_rate": 1.5589659666100952e-05, + "loss": 0.4762, + "step": 4189 + }, + { + "epoch": 0.33, + "learning_rate": 1.5587531752708528e-05, + "loss": 0.3888, + "step": 4190 + }, + { + "epoch": 0.33, + "learning_rate": 1.558540347140402e-05, + "loss": 0.362, + "step": 4191 + }, + { + "epoch": 0.33, + "learning_rate": 1.558327482232757e-05, + "loss": 0.3217, + "step": 4192 + }, + { + "epoch": 0.33, + "learning_rate": 1.558114580561934e-05, + "loss": 0.3531, + "step": 4193 + }, + { + "epoch": 0.33, + "learning_rate": 1.557901642141951e-05, + "loss": 0.3434, + "step": 4194 + }, + { + "epoch": 0.33, + "learning_rate": 1.5576886669868297e-05, + "loss": 0.3881, + "step": 4195 + }, + { + "epoch": 0.33, + "learning_rate": 1.5574756551105926e-05, + "loss": 0.3949, + "step": 4196 + }, + { + "epoch": 0.33, + "learning_rate": 1.5572626065272666e-05, + "loss": 0.2733, + "step": 4197 + }, + { + "epoch": 0.33, + "learning_rate": 1.557049521250879e-05, + "loss": 0.331, + "step": 4198 + }, + { + "epoch": 0.33, + "learning_rate": 1.5568363992954607e-05, + "loss": 0.4913, + "step": 4199 + }, + { + "epoch": 0.33, + "learning_rate": 1.556623240675045e-05, + "loss": 0.2867, + "step": 4200 + }, + { + "epoch": 0.33, + "learning_rate": 1.556410045403667e-05, + "loss": 0.3622, + "step": 4201 + }, + { + "epoch": 0.33, + "learning_rate": 1.556196813495365e-05, + "loss": 0.5271, + "step": 4202 + }, + { + "epoch": 0.33, + "learning_rate": 1.555983544964179e-05, + "loss": 0.4037, + "step": 4203 + }, + { + "epoch": 0.33, + "learning_rate": 1.555770239824152e-05, + "loss": 0.3313, + "step": 4204 + }, + { + "epoch": 0.33, + "learning_rate": 1.5555568980893284e-05, + "loss": 0.321, + "step": 4205 + }, + { + "epoch": 0.33, + "learning_rate": 1.5553435197737566e-05, + "loss": 0.4006, + "step": 4206 + }, + { + "epoch": 0.33, + "learning_rate": 1.5551301048914863e-05, + "loss": 0.4433, + "step": 4207 + }, + { + "epoch": 0.33, + "learning_rate": 1.5549166534565695e-05, + "loss": 0.4443, + "step": 4208 + }, + { + "epoch": 0.33, + "learning_rate": 1.554703165483061e-05, + "loss": 0.4245, + "step": 4209 + }, + { + "epoch": 0.33, + "learning_rate": 1.5544896409850183e-05, + "loss": 0.3634, + "step": 4210 + }, + { + "epoch": 0.33, + "learning_rate": 1.554276079976501e-05, + "loss": 0.3527, + "step": 4211 + }, + { + "epoch": 0.33, + "learning_rate": 1.5540624824715703e-05, + "loss": 0.352, + "step": 4212 + }, + { + "epoch": 0.33, + "learning_rate": 1.5538488484842914e-05, + "loss": 0.3256, + "step": 4213 + }, + { + "epoch": 0.33, + "learning_rate": 1.553635178028731e-05, + "loss": 0.3522, + "step": 4214 + }, + { + "epoch": 0.33, + "learning_rate": 1.5534214711189574e-05, + "loss": 0.4184, + "step": 4215 + }, + { + "epoch": 0.33, + "learning_rate": 1.5532077277690435e-05, + "loss": 0.4489, + "step": 4216 + }, + { + "epoch": 0.33, + "learning_rate": 1.552993947993062e-05, + "loss": 0.354, + "step": 4217 + }, + { + "epoch": 0.33, + "learning_rate": 1.5527801318050904e-05, + "loss": 0.3464, + "step": 4218 + }, + { + "epoch": 0.33, + "learning_rate": 1.5525662792192066e-05, + "loss": 0.3024, + "step": 4219 + }, + { + "epoch": 0.33, + "learning_rate": 1.5523523902494927e-05, + "loss": 0.4741, + "step": 4220 + }, + { + "epoch": 0.33, + "learning_rate": 1.552138464910031e-05, + "loss": 0.366, + "step": 4221 + }, + { + "epoch": 0.33, + "learning_rate": 1.5519245032149083e-05, + "loss": 0.4624, + "step": 4222 + }, + { + "epoch": 0.33, + "learning_rate": 1.5517105051782127e-05, + "loss": 0.2954, + "step": 4223 + }, + { + "epoch": 0.33, + "learning_rate": 1.551496470814035e-05, + "loss": 0.3654, + "step": 4224 + }, + { + "epoch": 0.33, + "learning_rate": 1.5512824001364686e-05, + "loss": 0.3405, + "step": 4225 + }, + { + "epoch": 0.33, + "learning_rate": 1.5510682931596083e-05, + "loss": 0.38, + "step": 4226 + }, + { + "epoch": 0.33, + "learning_rate": 1.550854149897553e-05, + "loss": 0.4756, + "step": 4227 + }, + { + "epoch": 0.33, + "learning_rate": 1.5506399703644017e-05, + "loss": 0.38, + "step": 4228 + }, + { + "epoch": 0.34, + "learning_rate": 1.5504257545742585e-05, + "loss": 0.4255, + "step": 4229 + }, + { + "epoch": 0.34, + "learning_rate": 1.5502115025412275e-05, + "loss": 0.4808, + "step": 4230 + }, + { + "epoch": 0.34, + "learning_rate": 1.5499972142794167e-05, + "loss": 0.4107, + "step": 4231 + }, + { + "epoch": 0.34, + "learning_rate": 1.5497828898029358e-05, + "loss": 0.3145, + "step": 4232 + }, + { + "epoch": 0.34, + "learning_rate": 1.5495685291258967e-05, + "loss": 0.3569, + "step": 4233 + }, + { + "epoch": 0.34, + "learning_rate": 1.5493541322624145e-05, + "loss": 0.3965, + "step": 4234 + }, + { + "epoch": 0.34, + "learning_rate": 1.5491396992266065e-05, + "loss": 0.3148, + "step": 4235 + }, + { + "epoch": 0.34, + "learning_rate": 1.548925230032591e-05, + "loss": 0.3715, + "step": 4236 + }, + { + "epoch": 0.34, + "learning_rate": 1.5487107246944902e-05, + "loss": 0.4254, + "step": 4237 + }, + { + "epoch": 0.34, + "learning_rate": 1.548496183226429e-05, + "loss": 0.4634, + "step": 4238 + }, + { + "epoch": 0.34, + "learning_rate": 1.548281605642533e-05, + "loss": 0.3021, + "step": 4239 + }, + { + "epoch": 0.34, + "learning_rate": 1.5480669919569313e-05, + "loss": 0.3698, + "step": 4240 + }, + { + "epoch": 0.34, + "learning_rate": 1.5478523421837553e-05, + "loss": 0.347, + "step": 4241 + }, + { + "epoch": 0.34, + "learning_rate": 1.5476376563371392e-05, + "loss": 0.3656, + "step": 4242 + }, + { + "epoch": 0.34, + "learning_rate": 1.547422934431218e-05, + "loss": 0.3649, + "step": 4243 + }, + { + "epoch": 0.34, + "learning_rate": 1.5472081764801307e-05, + "loss": 0.4811, + "step": 4244 + }, + { + "epoch": 0.34, + "learning_rate": 1.546993382498018e-05, + "loss": 0.273, + "step": 4245 + }, + { + "epoch": 0.34, + "learning_rate": 1.546778552499023e-05, + "loss": 0.3106, + "step": 4246 + }, + { + "epoch": 0.34, + "learning_rate": 1.5465636864972914e-05, + "loss": 0.4742, + "step": 4247 + }, + { + "epoch": 0.34, + "learning_rate": 1.5463487845069708e-05, + "loss": 0.5235, + "step": 4248 + }, + { + "epoch": 0.34, + "learning_rate": 1.546133846542212e-05, + "loss": 0.3998, + "step": 4249 + }, + { + "epoch": 0.34, + "learning_rate": 1.5459188726171666e-05, + "loss": 0.3124, + "step": 4250 + }, + { + "epoch": 0.34, + "learning_rate": 1.5457038627459905e-05, + "loss": 0.4622, + "step": 4251 + }, + { + "epoch": 0.34, + "learning_rate": 1.545488816942841e-05, + "loss": 0.241, + "step": 4252 + }, + { + "epoch": 0.34, + "learning_rate": 1.5452737352218773e-05, + "loss": 0.3801, + "step": 4253 + }, + { + "epoch": 0.34, + "learning_rate": 1.545058617597262e-05, + "loss": 0.4065, + "step": 4254 + }, + { + "epoch": 0.34, + "learning_rate": 1.544843464083159e-05, + "loss": 0.3174, + "step": 4255 + }, + { + "epoch": 0.34, + "learning_rate": 1.544628274693736e-05, + "loss": 0.3642, + "step": 4256 + }, + { + "epoch": 0.34, + "learning_rate": 1.5444130494431612e-05, + "loss": 0.3013, + "step": 4257 + }, + { + "epoch": 0.34, + "learning_rate": 1.544197788345607e-05, + "loss": 0.3543, + "step": 4258 + }, + { + "epoch": 0.34, + "learning_rate": 1.543982491415247e-05, + "loss": 0.4302, + "step": 4259 + }, + { + "epoch": 0.34, + "learning_rate": 1.5437671586662575e-05, + "loss": 0.2833, + "step": 4260 + }, + { + "epoch": 0.34, + "learning_rate": 1.543551790112817e-05, + "loss": 0.3812, + "step": 4261 + }, + { + "epoch": 0.34, + "learning_rate": 1.5433363857691067e-05, + "loss": 0.2855, + "step": 4262 + }, + { + "epoch": 0.34, + "learning_rate": 1.5431209456493093e-05, + "loss": 0.3121, + "step": 4263 + }, + { + "epoch": 0.34, + "learning_rate": 1.542905469767611e-05, + "loss": 0.352, + "step": 4264 + }, + { + "epoch": 0.34, + "learning_rate": 1.5426899581382e-05, + "loss": 0.2329, + "step": 4265 + }, + { + "epoch": 0.34, + "learning_rate": 1.5424744107752666e-05, + "loss": 0.3697, + "step": 4266 + }, + { + "epoch": 0.34, + "learning_rate": 1.542258827693003e-05, + "loss": 0.3075, + "step": 4267 + }, + { + "epoch": 0.34, + "learning_rate": 1.542043208905605e-05, + "loss": 0.3091, + "step": 4268 + }, + { + "epoch": 0.34, + "learning_rate": 1.5418275544272702e-05, + "loss": 0.2696, + "step": 4269 + }, + { + "epoch": 0.34, + "learning_rate": 1.541611864272198e-05, + "loss": 0.4129, + "step": 4270 + }, + { + "epoch": 0.34, + "learning_rate": 1.5413961384545902e-05, + "loss": 0.4036, + "step": 4271 + }, + { + "epoch": 0.34, + "learning_rate": 1.541180376988652e-05, + "loss": 0.3967, + "step": 4272 + }, + { + "epoch": 0.34, + "learning_rate": 1.54096457988859e-05, + "loss": 0.5067, + "step": 4273 + }, + { + "epoch": 0.34, + "learning_rate": 1.540748747168613e-05, + "loss": 0.3218, + "step": 4274 + }, + { + "epoch": 0.34, + "learning_rate": 1.5405328788429333e-05, + "loss": 0.3824, + "step": 4275 + }, + { + "epoch": 0.34, + "learning_rate": 1.5403169749257644e-05, + "loss": 0.4639, + "step": 4276 + }, + { + "epoch": 0.34, + "learning_rate": 1.5401010354313222e-05, + "loss": 0.3719, + "step": 4277 + }, + { + "epoch": 0.34, + "learning_rate": 1.539885060373826e-05, + "loss": 0.4903, + "step": 4278 + }, + { + "epoch": 0.34, + "learning_rate": 1.539669049767496e-05, + "loss": 0.3788, + "step": 4279 + }, + { + "epoch": 0.34, + "learning_rate": 1.539453003626556e-05, + "loss": 0.3217, + "step": 4280 + }, + { + "epoch": 0.34, + "learning_rate": 1.5392369219652313e-05, + "loss": 0.3945, + "step": 4281 + }, + { + "epoch": 0.34, + "learning_rate": 1.53902080479775e-05, + "loss": 0.3128, + "step": 4282 + }, + { + "epoch": 0.34, + "learning_rate": 1.5388046521383424e-05, + "loss": 0.3388, + "step": 4283 + }, + { + "epoch": 0.34, + "learning_rate": 1.538588464001241e-05, + "loss": 0.4534, + "step": 4284 + }, + { + "epoch": 0.34, + "learning_rate": 1.5383722404006808e-05, + "loss": 0.4432, + "step": 4285 + }, + { + "epoch": 0.34, + "learning_rate": 1.5381559813508986e-05, + "loss": 0.4769, + "step": 4286 + }, + { + "epoch": 0.34, + "learning_rate": 1.537939686866135e-05, + "loss": 0.2587, + "step": 4287 + }, + { + "epoch": 0.34, + "learning_rate": 1.5377233569606312e-05, + "loss": 0.4046, + "step": 4288 + }, + { + "epoch": 0.34, + "learning_rate": 1.5375069916486318e-05, + "loss": 0.4021, + "step": 4289 + }, + { + "epoch": 0.34, + "learning_rate": 1.5372905909443833e-05, + "loss": 0.4086, + "step": 4290 + }, + { + "epoch": 0.34, + "learning_rate": 1.5370741548621343e-05, + "loss": 0.4188, + "step": 4291 + }, + { + "epoch": 0.34, + "learning_rate": 1.5368576834161372e-05, + "loss": 0.3543, + "step": 4292 + }, + { + "epoch": 0.34, + "learning_rate": 1.536641176620644e-05, + "loss": 0.4383, + "step": 4293 + }, + { + "epoch": 0.34, + "learning_rate": 1.536424634489912e-05, + "loss": 0.3103, + "step": 4294 + }, + { + "epoch": 0.34, + "learning_rate": 1.536208057038199e-05, + "loss": 0.4522, + "step": 4295 + }, + { + "epoch": 0.34, + "learning_rate": 1.535991444279765e-05, + "loss": 0.378, + "step": 4296 + }, + { + "epoch": 0.34, + "learning_rate": 1.535774796228874e-05, + "loss": 0.3628, + "step": 4297 + }, + { + "epoch": 0.34, + "learning_rate": 1.5355581128997904e-05, + "loss": 0.3322, + "step": 4298 + }, + { + "epoch": 0.34, + "learning_rate": 1.5353413943067818e-05, + "loss": 0.3873, + "step": 4299 + }, + { + "epoch": 0.34, + "learning_rate": 1.5351246404641183e-05, + "loss": 0.2579, + "step": 4300 + }, + { + "epoch": 0.34, + "learning_rate": 1.5349078513860728e-05, + "loss": 0.3746, + "step": 4301 + }, + { + "epoch": 0.34, + "learning_rate": 1.534691027086918e-05, + "loss": 0.3827, + "step": 4302 + }, + { + "epoch": 0.34, + "learning_rate": 1.5344741675809328e-05, + "loss": 0.4069, + "step": 4303 + }, + { + "epoch": 0.34, + "learning_rate": 1.534257272882395e-05, + "loss": 0.309, + "step": 4304 + }, + { + "epoch": 0.34, + "learning_rate": 1.5340403430055864e-05, + "loss": 0.3389, + "step": 4305 + }, + { + "epoch": 0.34, + "learning_rate": 1.533823377964791e-05, + "loss": 0.3838, + "step": 4306 + }, + { + "epoch": 0.34, + "learning_rate": 1.5336063777742944e-05, + "loss": 0.3636, + "step": 4307 + }, + { + "epoch": 0.34, + "learning_rate": 1.5333893424483856e-05, + "loss": 0.3913, + "step": 4308 + }, + { + "epoch": 0.34, + "learning_rate": 1.5331722720013555e-05, + "loss": 0.3702, + "step": 4309 + }, + { + "epoch": 0.34, + "learning_rate": 1.532955166447496e-05, + "loss": 0.4484, + "step": 4310 + }, + { + "epoch": 0.34, + "learning_rate": 1.5327380258011037e-05, + "loss": 0.4913, + "step": 4311 + }, + { + "epoch": 0.34, + "learning_rate": 1.5325208500764756e-05, + "loss": 0.3171, + "step": 4312 + }, + { + "epoch": 0.34, + "learning_rate": 1.532303639287912e-05, + "loss": 0.3768, + "step": 4313 + }, + { + "epoch": 0.34, + "learning_rate": 1.532086393449715e-05, + "loss": 0.412, + "step": 4314 + }, + { + "epoch": 0.34, + "learning_rate": 1.531869112576189e-05, + "loss": 0.3418, + "step": 4315 + }, + { + "epoch": 0.34, + "learning_rate": 1.5316517966816414e-05, + "loss": 0.3932, + "step": 4316 + }, + { + "epoch": 0.34, + "learning_rate": 1.5314344457803812e-05, + "loss": 0.3251, + "step": 4317 + }, + { + "epoch": 0.34, + "learning_rate": 1.5312170598867195e-05, + "loss": 0.2839, + "step": 4318 + }, + { + "epoch": 0.34, + "learning_rate": 1.5309996390149708e-05, + "loss": 0.2607, + "step": 4319 + }, + { + "epoch": 0.34, + "learning_rate": 1.5307821831794506e-05, + "loss": 0.4676, + "step": 4320 + }, + { + "epoch": 0.34, + "learning_rate": 1.5305646923944776e-05, + "loss": 0.3608, + "step": 4321 + }, + { + "epoch": 0.34, + "learning_rate": 1.5303471666743727e-05, + "loss": 0.2802, + "step": 4322 + }, + { + "epoch": 0.34, + "learning_rate": 1.5301296060334588e-05, + "loss": 0.2923, + "step": 4323 + }, + { + "epoch": 0.34, + "learning_rate": 1.529912010486061e-05, + "loss": 0.3139, + "step": 4324 + }, + { + "epoch": 0.34, + "learning_rate": 1.5296943800465068e-05, + "loss": 0.3518, + "step": 4325 + }, + { + "epoch": 0.34, + "learning_rate": 1.529476714729127e-05, + "loss": 0.4242, + "step": 4326 + }, + { + "epoch": 0.34, + "learning_rate": 1.529259014548253e-05, + "loss": 0.3954, + "step": 4327 + }, + { + "epoch": 0.34, + "learning_rate": 1.5290412795182193e-05, + "loss": 0.3605, + "step": 4328 + }, + { + "epoch": 0.34, + "learning_rate": 1.528823509653363e-05, + "loss": 0.5317, + "step": 4329 + }, + { + "epoch": 0.34, + "learning_rate": 1.5286057049680236e-05, + "loss": 0.399, + "step": 4330 + }, + { + "epoch": 0.34, + "learning_rate": 1.5283878654765414e-05, + "loss": 0.3346, + "step": 4331 + }, + { + "epoch": 0.34, + "learning_rate": 1.5281699911932612e-05, + "loss": 0.2561, + "step": 4332 + }, + { + "epoch": 0.34, + "learning_rate": 1.527952082132528e-05, + "loss": 0.4135, + "step": 4333 + }, + { + "epoch": 0.34, + "learning_rate": 1.5277341383086906e-05, + "loss": 0.4589, + "step": 4334 + }, + { + "epoch": 0.34, + "learning_rate": 1.5275161597360996e-05, + "loss": 0.3363, + "step": 4335 + }, + { + "epoch": 0.34, + "learning_rate": 1.5272981464291077e-05, + "loss": 0.3886, + "step": 4336 + }, + { + "epoch": 0.34, + "learning_rate": 1.5270800984020705e-05, + "loss": 0.4144, + "step": 4337 + }, + { + "epoch": 0.34, + "learning_rate": 1.5268620156693444e-05, + "loss": 0.4174, + "step": 4338 + }, + { + "epoch": 0.34, + "learning_rate": 1.52664389824529e-05, + "loss": 0.4167, + "step": 4339 + }, + { + "epoch": 0.34, + "learning_rate": 1.5264257461442687e-05, + "loss": 0.2476, + "step": 4340 + }, + { + "epoch": 0.34, + "learning_rate": 1.526207559380645e-05, + "loss": 0.3668, + "step": 4341 + }, + { + "epoch": 0.34, + "learning_rate": 1.5259893379687855e-05, + "loss": 0.3119, + "step": 4342 + }, + { + "epoch": 0.34, + "learning_rate": 1.525771081923059e-05, + "loss": 0.4254, + "step": 4343 + }, + { + "epoch": 0.34, + "learning_rate": 1.525552791257837e-05, + "loss": 0.5503, + "step": 4344 + }, + { + "epoch": 0.34, + "learning_rate": 1.525334465987492e-05, + "loss": 0.2859, + "step": 4345 + }, + { + "epoch": 0.34, + "learning_rate": 1.5251161061264003e-05, + "loss": 0.424, + "step": 4346 + }, + { + "epoch": 0.34, + "learning_rate": 1.5248977116889396e-05, + "loss": 0.3517, + "step": 4347 + }, + { + "epoch": 0.34, + "learning_rate": 1.5246792826894906e-05, + "loss": 0.338, + "step": 4348 + }, + { + "epoch": 0.34, + "learning_rate": 1.5244608191424352e-05, + "loss": 0.3669, + "step": 4349 + }, + { + "epoch": 0.34, + "learning_rate": 1.5242423210621584e-05, + "loss": 0.2655, + "step": 4350 + }, + { + "epoch": 0.34, + "learning_rate": 1.5240237884630471e-05, + "loss": 0.4279, + "step": 4351 + }, + { + "epoch": 0.34, + "learning_rate": 1.5238052213594912e-05, + "loss": 0.4402, + "step": 4352 + }, + { + "epoch": 0.34, + "learning_rate": 1.5235866197658812e-05, + "loss": 0.4339, + "step": 4353 + }, + { + "epoch": 0.34, + "learning_rate": 1.5233679836966122e-05, + "loss": 0.3755, + "step": 4354 + }, + { + "epoch": 0.35, + "learning_rate": 1.5231493131660794e-05, + "loss": 0.4106, + "step": 4355 + }, + { + "epoch": 0.35, + "learning_rate": 1.5229306081886818e-05, + "loss": 0.3918, + "step": 4356 + }, + { + "epoch": 0.35, + "learning_rate": 1.5227118687788198e-05, + "loss": 0.3466, + "step": 4357 + }, + { + "epoch": 0.35, + "learning_rate": 1.5224930949508964e-05, + "loss": 0.3496, + "step": 4358 + }, + { + "epoch": 0.35, + "learning_rate": 1.5222742867193167e-05, + "loss": 0.3182, + "step": 4359 + }, + { + "epoch": 0.35, + "learning_rate": 1.5220554440984882e-05, + "loss": 0.3383, + "step": 4360 + }, + { + "epoch": 0.35, + "learning_rate": 1.5218365671028207e-05, + "loss": 0.4012, + "step": 4361 + }, + { + "epoch": 0.35, + "learning_rate": 1.5216176557467265e-05, + "loss": 0.467, + "step": 4362 + }, + { + "epoch": 0.35, + "learning_rate": 1.521398710044619e-05, + "loss": 0.4546, + "step": 4363 + }, + { + "epoch": 0.35, + "learning_rate": 1.5211797300109154e-05, + "loss": 0.346, + "step": 4364 + }, + { + "epoch": 0.35, + "learning_rate": 1.5209607156600346e-05, + "loss": 0.3652, + "step": 4365 + }, + { + "epoch": 0.35, + "learning_rate": 1.520741667006397e-05, + "loss": 0.4054, + "step": 4366 + }, + { + "epoch": 0.35, + "learning_rate": 1.5205225840644264e-05, + "loss": 0.3118, + "step": 4367 + }, + { + "epoch": 0.35, + "learning_rate": 1.5203034668485486e-05, + "loss": 0.3255, + "step": 4368 + }, + { + "epoch": 0.35, + "learning_rate": 1.5200843153731905e-05, + "loss": 0.5049, + "step": 4369 + }, + { + "epoch": 0.35, + "learning_rate": 1.519865129652783e-05, + "loss": 0.3378, + "step": 4370 + }, + { + "epoch": 0.35, + "learning_rate": 1.5196459097017582e-05, + "loss": 0.349, + "step": 4371 + }, + { + "epoch": 0.35, + "learning_rate": 1.5194266555345505e-05, + "loss": 0.3712, + "step": 4372 + }, + { + "epoch": 0.35, + "learning_rate": 1.5192073671655969e-05, + "loss": 0.3871, + "step": 4373 + }, + { + "epoch": 0.35, + "learning_rate": 1.5189880446093366e-05, + "loss": 0.3889, + "step": 4374 + }, + { + "epoch": 0.35, + "learning_rate": 1.5187686878802108e-05, + "loss": 0.2952, + "step": 4375 + }, + { + "epoch": 0.35, + "learning_rate": 1.5185492969926627e-05, + "loss": 0.4032, + "step": 4376 + }, + { + "epoch": 0.35, + "learning_rate": 1.5183298719611388e-05, + "loss": 0.5085, + "step": 4377 + }, + { + "epoch": 0.35, + "learning_rate": 1.5181104128000868e-05, + "loss": 0.3632, + "step": 4378 + }, + { + "epoch": 0.35, + "learning_rate": 1.517890919523957e-05, + "loss": 0.4635, + "step": 4379 + }, + { + "epoch": 0.35, + "learning_rate": 1.517671392147202e-05, + "loss": 0.3964, + "step": 4380 + }, + { + "epoch": 0.35, + "learning_rate": 1.517451830684277e-05, + "loss": 0.5332, + "step": 4381 + }, + { + "epoch": 0.35, + "learning_rate": 1.5172322351496385e-05, + "loss": 0.4038, + "step": 4382 + }, + { + "epoch": 0.35, + "learning_rate": 1.517012605557746e-05, + "loss": 0.3276, + "step": 4383 + }, + { + "epoch": 0.35, + "learning_rate": 1.5167929419230616e-05, + "loss": 0.4459, + "step": 4384 + }, + { + "epoch": 0.35, + "learning_rate": 1.516573244260048e-05, + "loss": 0.3845, + "step": 4385 + }, + { + "epoch": 0.35, + "learning_rate": 1.5163535125831724e-05, + "loss": 0.3698, + "step": 4386 + }, + { + "epoch": 0.35, + "learning_rate": 1.5161337469069024e-05, + "loss": 0.4213, + "step": 4387 + }, + { + "epoch": 0.35, + "learning_rate": 1.5159139472457086e-05, + "loss": 0.3375, + "step": 4388 + }, + { + "epoch": 0.35, + "learning_rate": 1.5156941136140637e-05, + "loss": 0.3847, + "step": 4389 + }, + { + "epoch": 0.35, + "learning_rate": 1.5154742460264426e-05, + "loss": 0.3505, + "step": 4390 + }, + { + "epoch": 0.35, + "learning_rate": 1.515254344497323e-05, + "loss": 0.3219, + "step": 4391 + }, + { + "epoch": 0.35, + "learning_rate": 1.5150344090411841e-05, + "loss": 0.333, + "step": 4392 + }, + { + "epoch": 0.35, + "learning_rate": 1.5148144396725072e-05, + "loss": 0.28, + "step": 4393 + }, + { + "epoch": 0.35, + "learning_rate": 1.514594436405777e-05, + "loss": 0.3509, + "step": 4394 + }, + { + "epoch": 0.35, + "learning_rate": 1.5143743992554791e-05, + "loss": 0.3962, + "step": 4395 + }, + { + "epoch": 0.35, + "learning_rate": 1.514154328236102e-05, + "loss": 0.3886, + "step": 4396 + }, + { + "epoch": 0.35, + "learning_rate": 1.5139342233621364e-05, + "loss": 0.2702, + "step": 4397 + }, + { + "epoch": 0.35, + "learning_rate": 1.5137140846480752e-05, + "loss": 0.2519, + "step": 4398 + }, + { + "epoch": 0.35, + "learning_rate": 1.5134939121084129e-05, + "loss": 0.3797, + "step": 4399 + }, + { + "epoch": 0.35, + "learning_rate": 1.5132737057576476e-05, + "loss": 0.4479, + "step": 4400 + }, + { + "epoch": 0.35, + "learning_rate": 1.5130534656102783e-05, + "loss": 0.3888, + "step": 4401 + }, + { + "epoch": 0.35, + "learning_rate": 1.512833191680807e-05, + "loss": 0.3596, + "step": 4402 + }, + { + "epoch": 0.35, + "learning_rate": 1.5126128839837378e-05, + "loss": 0.2822, + "step": 4403 + }, + { + "epoch": 0.35, + "learning_rate": 1.5123925425335766e-05, + "loss": 0.2913, + "step": 4404 + }, + { + "epoch": 0.35, + "learning_rate": 1.5121721673448319e-05, + "loss": 0.3993, + "step": 4405 + }, + { + "epoch": 0.35, + "learning_rate": 1.5119517584320146e-05, + "loss": 0.4033, + "step": 4406 + }, + { + "epoch": 0.35, + "learning_rate": 1.5117313158096371e-05, + "loss": 0.381, + "step": 4407 + }, + { + "epoch": 0.35, + "learning_rate": 1.511510839492215e-05, + "loss": 0.4427, + "step": 4408 + }, + { + "epoch": 0.35, + "learning_rate": 1.5112903294942651e-05, + "loss": 0.2648, + "step": 4409 + }, + { + "epoch": 0.35, + "learning_rate": 1.5110697858303072e-05, + "loss": 0.3514, + "step": 4410 + }, + { + "epoch": 0.35, + "learning_rate": 1.5108492085148632e-05, + "loss": 0.4411, + "step": 4411 + }, + { + "epoch": 0.35, + "learning_rate": 1.5106285975624568e-05, + "loss": 0.5103, + "step": 4412 + }, + { + "epoch": 0.35, + "learning_rate": 1.5104079529876143e-05, + "loss": 0.3637, + "step": 4413 + }, + { + "epoch": 0.35, + "learning_rate": 1.510187274804864e-05, + "loss": 0.3129, + "step": 4414 + }, + { + "epoch": 0.35, + "learning_rate": 1.5099665630287365e-05, + "loss": 0.5134, + "step": 4415 + }, + { + "epoch": 0.35, + "learning_rate": 1.5097458176737647e-05, + "loss": 0.3371, + "step": 4416 + }, + { + "epoch": 0.35, + "learning_rate": 1.5095250387544833e-05, + "loss": 0.4092, + "step": 4417 + }, + { + "epoch": 0.35, + "learning_rate": 1.5093042262854297e-05, + "loss": 0.3307, + "step": 4418 + }, + { + "epoch": 0.35, + "learning_rate": 1.509083380281144e-05, + "loss": 0.3922, + "step": 4419 + }, + { + "epoch": 0.35, + "learning_rate": 1.5088625007561668e-05, + "loss": 0.3821, + "step": 4420 + }, + { + "epoch": 0.35, + "learning_rate": 1.5086415877250424e-05, + "loss": 0.3635, + "step": 4421 + }, + { + "epoch": 0.35, + "learning_rate": 1.5084206412023172e-05, + "loss": 0.3417, + "step": 4422 + }, + { + "epoch": 0.35, + "learning_rate": 1.5081996612025387e-05, + "loss": 0.3376, + "step": 4423 + }, + { + "epoch": 0.35, + "learning_rate": 1.5079786477402581e-05, + "loss": 0.3674, + "step": 4424 + }, + { + "epoch": 0.35, + "learning_rate": 1.5077576008300278e-05, + "loss": 0.4715, + "step": 4425 + }, + { + "epoch": 0.35, + "learning_rate": 1.5075365204864025e-05, + "loss": 0.3958, + "step": 4426 + }, + { + "epoch": 0.35, + "learning_rate": 1.5073154067239396e-05, + "loss": 0.4995, + "step": 4427 + }, + { + "epoch": 0.35, + "learning_rate": 1.507094259557198e-05, + "loss": 0.4157, + "step": 4428 + }, + { + "epoch": 0.35, + "learning_rate": 1.5068730790007395e-05, + "loss": 0.3895, + "step": 4429 + }, + { + "epoch": 0.35, + "learning_rate": 1.5066518650691277e-05, + "loss": 0.3378, + "step": 4430 + }, + { + "epoch": 0.35, + "learning_rate": 1.5064306177769284e-05, + "loss": 0.3654, + "step": 4431 + }, + { + "epoch": 0.35, + "learning_rate": 1.5062093371387097e-05, + "loss": 0.4683, + "step": 4432 + }, + { + "epoch": 0.35, + "learning_rate": 1.5059880231690418e-05, + "loss": 0.2795, + "step": 4433 + }, + { + "epoch": 0.35, + "learning_rate": 1.5057666758824974e-05, + "loss": 0.4365, + "step": 4434 + }, + { + "epoch": 0.35, + "learning_rate": 1.5055452952936512e-05, + "loss": 0.4089, + "step": 4435 + }, + { + "epoch": 0.35, + "learning_rate": 1.5053238814170792e-05, + "loss": 0.3009, + "step": 4436 + }, + { + "epoch": 0.35, + "learning_rate": 1.5051024342673614e-05, + "loss": 0.2986, + "step": 4437 + }, + { + "epoch": 0.35, + "learning_rate": 1.5048809538590789e-05, + "loss": 0.3501, + "step": 4438 + }, + { + "epoch": 0.35, + "learning_rate": 1.5046594402068147e-05, + "loss": 0.3964, + "step": 4439 + }, + { + "epoch": 0.35, + "learning_rate": 1.5044378933251546e-05, + "loss": 0.3697, + "step": 4440 + }, + { + "epoch": 0.35, + "learning_rate": 1.5042163132286867e-05, + "loss": 0.3423, + "step": 4441 + }, + { + "epoch": 0.35, + "learning_rate": 1.5039946999320004e-05, + "loss": 0.3524, + "step": 4442 + }, + { + "epoch": 0.35, + "learning_rate": 1.5037730534496882e-05, + "loss": 0.3403, + "step": 4443 + }, + { + "epoch": 0.35, + "learning_rate": 1.5035513737963445e-05, + "loss": 0.3982, + "step": 4444 + }, + { + "epoch": 0.35, + "learning_rate": 1.5033296609865658e-05, + "loss": 0.2669, + "step": 4445 + }, + { + "epoch": 0.35, + "learning_rate": 1.503107915034951e-05, + "loss": 0.3006, + "step": 4446 + }, + { + "epoch": 0.35, + "learning_rate": 1.5028861359561005e-05, + "loss": 0.419, + "step": 4447 + }, + { + "epoch": 0.35, + "learning_rate": 1.5026643237646176e-05, + "loss": 0.3343, + "step": 4448 + }, + { + "epoch": 0.35, + "learning_rate": 1.5024424784751079e-05, + "loss": 0.4115, + "step": 4449 + }, + { + "epoch": 0.35, + "learning_rate": 1.5022206001021784e-05, + "loss": 0.3087, + "step": 4450 + }, + { + "epoch": 0.35, + "learning_rate": 1.501998688660439e-05, + "loss": 0.3132, + "step": 4451 + }, + { + "epoch": 0.35, + "learning_rate": 1.5017767441645015e-05, + "loss": 0.3309, + "step": 4452 + }, + { + "epoch": 0.35, + "learning_rate": 1.5015547666289798e-05, + "loss": 0.3543, + "step": 4453 + }, + { + "epoch": 0.35, + "learning_rate": 1.50133275606849e-05, + "loss": 0.4689, + "step": 4454 + }, + { + "epoch": 0.35, + "learning_rate": 1.5011107124976505e-05, + "loss": 0.3892, + "step": 4455 + }, + { + "epoch": 0.35, + "learning_rate": 1.5008886359310815e-05, + "loss": 0.373, + "step": 4456 + }, + { + "epoch": 0.35, + "learning_rate": 1.5006665263834062e-05, + "loss": 0.2792, + "step": 4457 + }, + { + "epoch": 0.35, + "learning_rate": 1.5004443838692492e-05, + "loss": 0.4641, + "step": 4458 + }, + { + "epoch": 0.35, + "learning_rate": 1.5002222084032374e-05, + "loss": 0.3265, + "step": 4459 + }, + { + "epoch": 0.35, + "learning_rate": 1.5000000000000002e-05, + "loss": 0.2737, + "step": 4460 + }, + { + "epoch": 0.35, + "learning_rate": 1.4997777586741689e-05, + "loss": 0.4221, + "step": 4461 + }, + { + "epoch": 0.35, + "learning_rate": 1.4995554844403767e-05, + "loss": 0.4463, + "step": 4462 + }, + { + "epoch": 0.35, + "learning_rate": 1.4993331773132598e-05, + "loss": 0.3237, + "step": 4463 + }, + { + "epoch": 0.35, + "learning_rate": 1.4991108373074557e-05, + "loss": 0.3187, + "step": 4464 + }, + { + "epoch": 0.35, + "learning_rate": 1.4988884644376045e-05, + "loss": 0.3961, + "step": 4465 + }, + { + "epoch": 0.35, + "learning_rate": 1.4986660587183485e-05, + "loss": 0.2854, + "step": 4466 + }, + { + "epoch": 0.35, + "learning_rate": 1.498443620164332e-05, + "loss": 0.3357, + "step": 4467 + }, + { + "epoch": 0.35, + "learning_rate": 1.4982211487902015e-05, + "loss": 0.5021, + "step": 4468 + }, + { + "epoch": 0.35, + "learning_rate": 1.4979986446106054e-05, + "loss": 0.3182, + "step": 4469 + }, + { + "epoch": 0.35, + "learning_rate": 1.4977761076401949e-05, + "loss": 0.4034, + "step": 4470 + }, + { + "epoch": 0.35, + "learning_rate": 1.4975535378936228e-05, + "loss": 0.4223, + "step": 4471 + }, + { + "epoch": 0.35, + "learning_rate": 1.4973309353855443e-05, + "loss": 0.3206, + "step": 4472 + }, + { + "epoch": 0.35, + "learning_rate": 1.497108300130617e-05, + "loss": 0.3612, + "step": 4473 + }, + { + "epoch": 0.35, + "learning_rate": 1.4968856321434997e-05, + "loss": 0.3678, + "step": 4474 + }, + { + "epoch": 0.35, + "learning_rate": 1.4966629314388548e-05, + "loss": 0.311, + "step": 4475 + }, + { + "epoch": 0.35, + "learning_rate": 1.4964401980313452e-05, + "loss": 0.4311, + "step": 4476 + }, + { + "epoch": 0.35, + "learning_rate": 1.4962174319356372e-05, + "loss": 0.4215, + "step": 4477 + }, + { + "epoch": 0.35, + "learning_rate": 1.4959946331663995e-05, + "loss": 0.3612, + "step": 4478 + }, + { + "epoch": 0.35, + "learning_rate": 1.4957718017383013e-05, + "loss": 0.3252, + "step": 4479 + }, + { + "epoch": 0.35, + "learning_rate": 1.4955489376660157e-05, + "loss": 0.426, + "step": 4480 + }, + { + "epoch": 0.36, + "learning_rate": 1.4953260409642172e-05, + "loss": 0.5287, + "step": 4481 + }, + { + "epoch": 0.36, + "learning_rate": 1.4951031116475819e-05, + "loss": 0.3383, + "step": 4482 + }, + { + "epoch": 0.36, + "learning_rate": 1.4948801497307893e-05, + "loss": 0.3529, + "step": 4483 + }, + { + "epoch": 0.36, + "learning_rate": 1.4946571552285196e-05, + "loss": 0.4439, + "step": 4484 + }, + { + "epoch": 0.36, + "learning_rate": 1.4944341281554566e-05, + "loss": 0.3457, + "step": 4485 + }, + { + "epoch": 0.36, + "learning_rate": 1.4942110685262854e-05, + "loss": 0.4003, + "step": 4486 + }, + { + "epoch": 0.36, + "learning_rate": 1.493987976355693e-05, + "loss": 0.3482, + "step": 4487 + }, + { + "epoch": 0.36, + "learning_rate": 1.4937648516583696e-05, + "loss": 0.3308, + "step": 4488 + }, + { + "epoch": 0.36, + "learning_rate": 1.4935416944490066e-05, + "loss": 0.4776, + "step": 4489 + }, + { + "epoch": 0.36, + "learning_rate": 1.4933185047422976e-05, + "loss": 0.3529, + "step": 4490 + }, + { + "epoch": 0.36, + "learning_rate": 1.493095282552939e-05, + "loss": 0.4388, + "step": 4491 + }, + { + "epoch": 0.36, + "learning_rate": 1.4928720278956284e-05, + "loss": 0.3696, + "step": 4492 + }, + { + "epoch": 0.36, + "learning_rate": 1.4926487407850667e-05, + "loss": 0.4121, + "step": 4493 + }, + { + "epoch": 0.36, + "learning_rate": 1.4924254212359557e-05, + "loss": 0.4267, + "step": 4494 + }, + { + "epoch": 0.36, + "learning_rate": 1.492202069263e-05, + "loss": 0.2967, + "step": 4495 + }, + { + "epoch": 0.36, + "learning_rate": 1.4919786848809061e-05, + "loss": 0.3331, + "step": 4496 + }, + { + "epoch": 0.36, + "learning_rate": 1.4917552681043837e-05, + "loss": 0.3167, + "step": 4497 + }, + { + "epoch": 0.36, + "learning_rate": 1.4915318189481425e-05, + "loss": 0.5474, + "step": 4498 + }, + { + "epoch": 0.36, + "learning_rate": 1.4913083374268965e-05, + "loss": 0.2716, + "step": 4499 + }, + { + "epoch": 0.36, + "learning_rate": 1.4910848235553604e-05, + "loss": 0.407, + "step": 4500 + }, + { + "epoch": 0.36, + "learning_rate": 1.4908612773482514e-05, + "loss": 0.2681, + "step": 4501 + }, + { + "epoch": 0.36, + "learning_rate": 1.4906376988202893e-05, + "loss": 0.3012, + "step": 4502 + }, + { + "epoch": 0.36, + "learning_rate": 1.4904140879861957e-05, + "loss": 0.4082, + "step": 4503 + }, + { + "epoch": 0.36, + "learning_rate": 1.490190444860694e-05, + "loss": 0.2497, + "step": 4504 + }, + { + "epoch": 0.36, + "learning_rate": 1.48996676945851e-05, + "loss": 0.3772, + "step": 4505 + }, + { + "epoch": 0.36, + "learning_rate": 1.4897430617943718e-05, + "loss": 0.4483, + "step": 4506 + }, + { + "epoch": 0.36, + "learning_rate": 1.4895193218830098e-05, + "loss": 0.2484, + "step": 4507 + }, + { + "epoch": 0.36, + "learning_rate": 1.4892955497391556e-05, + "loss": 0.2892, + "step": 4508 + }, + { + "epoch": 0.36, + "learning_rate": 1.4890717453775438e-05, + "loss": 0.3648, + "step": 4509 + }, + { + "epoch": 0.36, + "learning_rate": 1.488847908812911e-05, + "loss": 0.2026, + "step": 4510 + }, + { + "epoch": 0.36, + "learning_rate": 1.4886240400599954e-05, + "loss": 0.3822, + "step": 4511 + }, + { + "epoch": 0.36, + "learning_rate": 1.488400139133538e-05, + "loss": 0.3525, + "step": 4512 + }, + { + "epoch": 0.36, + "learning_rate": 1.4881762060482814e-05, + "loss": 0.366, + "step": 4513 + }, + { + "epoch": 0.36, + "learning_rate": 1.4879522408189706e-05, + "loss": 0.3838, + "step": 4514 + }, + { + "epoch": 0.36, + "learning_rate": 1.4877282434603527e-05, + "loss": 0.2548, + "step": 4515 + }, + { + "epoch": 0.36, + "learning_rate": 1.4875042139871768e-05, + "loss": 0.4634, + "step": 4516 + }, + { + "epoch": 0.36, + "learning_rate": 1.487280152414194e-05, + "loss": 0.3491, + "step": 4517 + }, + { + "epoch": 0.36, + "learning_rate": 1.4870560587561578e-05, + "loss": 0.3592, + "step": 4518 + }, + { + "epoch": 0.36, + "learning_rate": 1.4868319330278236e-05, + "loss": 0.5435, + "step": 4519 + }, + { + "epoch": 0.36, + "learning_rate": 1.4866077752439495e-05, + "loss": 0.2156, + "step": 4520 + }, + { + "epoch": 0.36, + "learning_rate": 1.4863835854192945e-05, + "loss": 0.3613, + "step": 4521 + }, + { + "epoch": 0.36, + "learning_rate": 1.4861593635686207e-05, + "loss": 0.3138, + "step": 4522 + }, + { + "epoch": 0.36, + "learning_rate": 1.485935109706692e-05, + "loss": 0.4005, + "step": 4523 + }, + { + "epoch": 0.36, + "learning_rate": 1.4857108238482747e-05, + "loss": 0.3261, + "step": 4524 + }, + { + "epoch": 0.36, + "learning_rate": 1.4854865060081367e-05, + "loss": 0.4448, + "step": 4525 + }, + { + "epoch": 0.36, + "learning_rate": 1.4852621562010484e-05, + "loss": 0.4395, + "step": 4526 + }, + { + "epoch": 0.36, + "learning_rate": 1.4850377744417816e-05, + "loss": 0.3991, + "step": 4527 + }, + { + "epoch": 0.36, + "learning_rate": 1.4848133607451116e-05, + "loss": 0.318, + "step": 4528 + }, + { + "epoch": 0.36, + "learning_rate": 1.4845889151258144e-05, + "loss": 0.4001, + "step": 4529 + }, + { + "epoch": 0.36, + "learning_rate": 1.484364437598669e-05, + "loss": 0.3701, + "step": 4530 + }, + { + "epoch": 0.36, + "learning_rate": 1.4841399281784558e-05, + "loss": 0.3413, + "step": 4531 + }, + { + "epoch": 0.36, + "learning_rate": 1.4839153868799583e-05, + "loss": 0.3027, + "step": 4532 + }, + { + "epoch": 0.36, + "learning_rate": 1.4836908137179607e-05, + "loss": 0.3737, + "step": 4533 + }, + { + "epoch": 0.36, + "learning_rate": 1.4834662087072502e-05, + "loss": 0.3774, + "step": 4534 + }, + { + "epoch": 0.36, + "learning_rate": 1.4832415718626166e-05, + "loss": 0.3233, + "step": 4535 + }, + { + "epoch": 0.36, + "learning_rate": 1.4830169031988502e-05, + "loss": 0.4019, + "step": 4536 + }, + { + "epoch": 0.36, + "learning_rate": 1.482792202730745e-05, + "loss": 0.4066, + "step": 4537 + }, + { + "epoch": 0.36, + "learning_rate": 1.4825674704730966e-05, + "loss": 0.4072, + "step": 4538 + }, + { + "epoch": 0.36, + "learning_rate": 1.4823427064407018e-05, + "loss": 0.3073, + "step": 4539 + }, + { + "epoch": 0.36, + "learning_rate": 1.4821179106483609e-05, + "loss": 0.3466, + "step": 4540 + }, + { + "epoch": 0.36, + "learning_rate": 1.4818930831108755e-05, + "loss": 0.3361, + "step": 4541 + }, + { + "epoch": 0.36, + "learning_rate": 1.481668223843049e-05, + "loss": 0.4862, + "step": 4542 + }, + { + "epoch": 0.36, + "learning_rate": 1.481443332859688e-05, + "loss": 0.3674, + "step": 4543 + }, + { + "epoch": 0.36, + "learning_rate": 1.4812184101755997e-05, + "loss": 0.3916, + "step": 4544 + }, + { + "epoch": 0.36, + "learning_rate": 1.480993455805595e-05, + "loss": 0.4475, + "step": 4545 + }, + { + "epoch": 0.36, + "learning_rate": 1.480768469764485e-05, + "loss": 0.4479, + "step": 4546 + }, + { + "epoch": 0.36, + "learning_rate": 1.480543452067085e-05, + "loss": 0.4172, + "step": 4547 + }, + { + "epoch": 0.36, + "learning_rate": 1.480318402728211e-05, + "loss": 0.3806, + "step": 4548 + }, + { + "epoch": 0.36, + "learning_rate": 1.480093321762681e-05, + "loss": 0.438, + "step": 4549 + }, + { + "epoch": 0.36, + "learning_rate": 1.4798682091853161e-05, + "loss": 0.2699, + "step": 4550 + }, + { + "epoch": 0.36, + "learning_rate": 1.4796430650109383e-05, + "loss": 0.5026, + "step": 4551 + }, + { + "epoch": 0.36, + "learning_rate": 1.4794178892543727e-05, + "loss": 0.3868, + "step": 4552 + }, + { + "epoch": 0.36, + "learning_rate": 1.4791926819304462e-05, + "loss": 0.4423, + "step": 4553 + }, + { + "epoch": 0.36, + "learning_rate": 1.4789674430539868e-05, + "loss": 0.331, + "step": 4554 + }, + { + "epoch": 0.36, + "learning_rate": 1.4787421726398263e-05, + "loss": 0.3517, + "step": 4555 + }, + { + "epoch": 0.36, + "learning_rate": 1.4785168707027972e-05, + "loss": 0.386, + "step": 4556 + }, + { + "epoch": 0.36, + "learning_rate": 1.4782915372577347e-05, + "loss": 0.3324, + "step": 4557 + }, + { + "epoch": 0.36, + "learning_rate": 1.4780661723194757e-05, + "loss": 0.4171, + "step": 4558 + }, + { + "epoch": 0.36, + "learning_rate": 1.4778407759028599e-05, + "loss": 0.3687, + "step": 4559 + }, + { + "epoch": 0.36, + "learning_rate": 1.4776153480227278e-05, + "loss": 0.4377, + "step": 4560 + }, + { + "epoch": 0.36, + "learning_rate": 1.4773898886939235e-05, + "loss": 0.3657, + "step": 4561 + }, + { + "epoch": 0.36, + "learning_rate": 1.4771643979312917e-05, + "loss": 0.416, + "step": 4562 + }, + { + "epoch": 0.36, + "learning_rate": 1.4769388757496806e-05, + "loss": 0.288, + "step": 4563 + }, + { + "epoch": 0.36, + "learning_rate": 1.4767133221639394e-05, + "loss": 0.3623, + "step": 4564 + }, + { + "epoch": 0.36, + "learning_rate": 1.4764877371889194e-05, + "loss": 0.3755, + "step": 4565 + }, + { + "epoch": 0.36, + "learning_rate": 1.476262120839475e-05, + "loss": 0.3243, + "step": 4566 + }, + { + "epoch": 0.36, + "learning_rate": 1.4760364731304614e-05, + "loss": 0.416, + "step": 4567 + }, + { + "epoch": 0.36, + "learning_rate": 1.4758107940767368e-05, + "loss": 0.2954, + "step": 4568 + }, + { + "epoch": 0.36, + "learning_rate": 1.4755850836931607e-05, + "loss": 0.3212, + "step": 4569 + }, + { + "epoch": 0.36, + "learning_rate": 1.475359341994595e-05, + "loss": 0.4921, + "step": 4570 + }, + { + "epoch": 0.36, + "learning_rate": 1.4751335689959044e-05, + "loss": 0.4235, + "step": 4571 + }, + { + "epoch": 0.36, + "learning_rate": 1.4749077647119542e-05, + "loss": 0.2791, + "step": 4572 + }, + { + "epoch": 0.36, + "learning_rate": 1.474681929157613e-05, + "loss": 0.4522, + "step": 4573 + }, + { + "epoch": 0.36, + "learning_rate": 1.4744560623477502e-05, + "loss": 0.4161, + "step": 4574 + }, + { + "epoch": 0.36, + "learning_rate": 1.4742301642972392e-05, + "loss": 0.3834, + "step": 4575 + }, + { + "epoch": 0.36, + "learning_rate": 1.4740042350209536e-05, + "loss": 0.3781, + "step": 4576 + }, + { + "epoch": 0.36, + "learning_rate": 1.4737782745337696e-05, + "loss": 0.3531, + "step": 4577 + }, + { + "epoch": 0.36, + "learning_rate": 1.4735522828505663e-05, + "loss": 0.4147, + "step": 4578 + }, + { + "epoch": 0.36, + "learning_rate": 1.4733262599862234e-05, + "loss": 0.359, + "step": 4579 + }, + { + "epoch": 0.36, + "learning_rate": 1.4731002059556242e-05, + "loss": 0.3298, + "step": 4580 + }, + { + "epoch": 0.36, + "learning_rate": 1.4728741207736525e-05, + "loss": 0.379, + "step": 4581 + }, + { + "epoch": 0.36, + "learning_rate": 1.4726480044551953e-05, + "loss": 0.431, + "step": 4582 + }, + { + "epoch": 0.36, + "learning_rate": 1.4724218570151415e-05, + "loss": 0.4556, + "step": 4583 + }, + { + "epoch": 0.36, + "learning_rate": 1.4721956784683813e-05, + "loss": 0.5208, + "step": 4584 + }, + { + "epoch": 0.36, + "learning_rate": 1.4719694688298078e-05, + "loss": 0.4488, + "step": 4585 + }, + { + "epoch": 0.36, + "learning_rate": 1.4717432281143161e-05, + "loss": 0.2527, + "step": 4586 + }, + { + "epoch": 0.36, + "learning_rate": 1.4715169563368021e-05, + "loss": 0.4116, + "step": 4587 + }, + { + "epoch": 0.36, + "learning_rate": 1.4712906535121658e-05, + "loss": 0.2697, + "step": 4588 + }, + { + "epoch": 0.36, + "learning_rate": 1.4710643196553074e-05, + "loss": 0.4261, + "step": 4589 + }, + { + "epoch": 0.36, + "learning_rate": 1.4708379547811302e-05, + "loss": 0.3057, + "step": 4590 + }, + { + "epoch": 0.36, + "learning_rate": 1.4706115589045396e-05, + "loss": 0.3614, + "step": 4591 + }, + { + "epoch": 0.36, + "learning_rate": 1.4703851320404416e-05, + "loss": 0.4889, + "step": 4592 + }, + { + "epoch": 0.36, + "learning_rate": 1.4701586742037464e-05, + "loss": 0.3305, + "step": 4593 + }, + { + "epoch": 0.36, + "learning_rate": 1.4699321854093649e-05, + "loss": 0.406, + "step": 4594 + }, + { + "epoch": 0.36, + "learning_rate": 1.46970566567221e-05, + "loss": 0.442, + "step": 4595 + }, + { + "epoch": 0.36, + "learning_rate": 1.469479115007197e-05, + "loss": 0.467, + "step": 4596 + }, + { + "epoch": 0.36, + "learning_rate": 1.4692525334292434e-05, + "loss": 0.2784, + "step": 4597 + }, + { + "epoch": 0.36, + "learning_rate": 1.4690259209532682e-05, + "loss": 0.278, + "step": 4598 + }, + { + "epoch": 0.36, + "learning_rate": 1.468799277594193e-05, + "loss": 0.3662, + "step": 4599 + }, + { + "epoch": 0.36, + "learning_rate": 1.4685726033669412e-05, + "loss": 0.4355, + "step": 4600 + }, + { + "epoch": 0.36, + "learning_rate": 1.468345898286438e-05, + "loss": 0.3507, + "step": 4601 + }, + { + "epoch": 0.36, + "learning_rate": 1.468119162367611e-05, + "loss": 0.2824, + "step": 4602 + }, + { + "epoch": 0.36, + "learning_rate": 1.4678923956253894e-05, + "loss": 0.5299, + "step": 4603 + }, + { + "epoch": 0.36, + "learning_rate": 1.4676655980747052e-05, + "loss": 0.3477, + "step": 4604 + }, + { + "epoch": 0.36, + "learning_rate": 1.4674387697304914e-05, + "loss": 0.2926, + "step": 4605 + }, + { + "epoch": 0.36, + "learning_rate": 1.4672119106076838e-05, + "loss": 0.5394, + "step": 4606 + }, + { + "epoch": 0.36, + "learning_rate": 1.4669850207212202e-05, + "loss": 0.3839, + "step": 4607 + }, + { + "epoch": 0.37, + "learning_rate": 1.4667581000860395e-05, + "loss": 0.4277, + "step": 4608 + }, + { + "epoch": 0.37, + "learning_rate": 1.4665311487170844e-05, + "loss": 0.5102, + "step": 4609 + }, + { + "epoch": 0.37, + "learning_rate": 1.4663041666292978e-05, + "loss": 0.4354, + "step": 4610 + }, + { + "epoch": 0.37, + "learning_rate": 1.4660771538376253e-05, + "loss": 0.4371, + "step": 4611 + }, + { + "epoch": 0.37, + "learning_rate": 1.4658501103570149e-05, + "loss": 0.3802, + "step": 4612 + }, + { + "epoch": 0.37, + "learning_rate": 1.4656230362024166e-05, + "loss": 0.4065, + "step": 4613 + }, + { + "epoch": 0.37, + "learning_rate": 1.4653959313887813e-05, + "loss": 0.3477, + "step": 4614 + }, + { + "epoch": 0.37, + "learning_rate": 1.4651687959310636e-05, + "loss": 0.3369, + "step": 4615 + }, + { + "epoch": 0.37, + "learning_rate": 1.4649416298442187e-05, + "loss": 0.3052, + "step": 4616 + }, + { + "epoch": 0.37, + "learning_rate": 1.4647144331432049e-05, + "loss": 0.4264, + "step": 4617 + }, + { + "epoch": 0.37, + "learning_rate": 1.4644872058429816e-05, + "loss": 0.2995, + "step": 4618 + }, + { + "epoch": 0.37, + "learning_rate": 1.4642599479585106e-05, + "loss": 0.4138, + "step": 4619 + }, + { + "epoch": 0.37, + "learning_rate": 1.4640326595047561e-05, + "loss": 0.4928, + "step": 4620 + }, + { + "epoch": 0.37, + "learning_rate": 1.4638053404966836e-05, + "loss": 0.4441, + "step": 4621 + }, + { + "epoch": 0.37, + "learning_rate": 1.4635779909492614e-05, + "loss": 0.304, + "step": 4622 + }, + { + "epoch": 0.37, + "learning_rate": 1.4633506108774588e-05, + "loss": 0.3656, + "step": 4623 + }, + { + "epoch": 0.37, + "learning_rate": 1.4631232002962481e-05, + "loss": 0.3893, + "step": 4624 + }, + { + "epoch": 0.37, + "learning_rate": 1.462895759220603e-05, + "loss": 0.2778, + "step": 4625 + }, + { + "epoch": 0.37, + "learning_rate": 1.4626682876654998e-05, + "loss": 0.3708, + "step": 4626 + }, + { + "epoch": 0.37, + "learning_rate": 1.4624407856459154e-05, + "loss": 0.4219, + "step": 4627 + }, + { + "epoch": 0.37, + "learning_rate": 1.4622132531768309e-05, + "loss": 0.4148, + "step": 4628 + }, + { + "epoch": 0.37, + "learning_rate": 1.4619856902732279e-05, + "loss": 0.3372, + "step": 4629 + }, + { + "epoch": 0.37, + "learning_rate": 1.4617580969500895e-05, + "loss": 0.4078, + "step": 4630 + }, + { + "epoch": 0.37, + "learning_rate": 1.461530473222403e-05, + "loss": 0.3335, + "step": 4631 + }, + { + "epoch": 0.37, + "learning_rate": 1.4613028191051548e-05, + "loss": 0.3473, + "step": 4632 + }, + { + "epoch": 0.37, + "learning_rate": 1.4610751346133361e-05, + "loss": 0.3274, + "step": 4633 + }, + { + "epoch": 0.37, + "learning_rate": 1.4608474197619383e-05, + "loss": 0.4041, + "step": 4634 + }, + { + "epoch": 0.37, + "learning_rate": 1.4606196745659551e-05, + "loss": 0.3641, + "step": 4635 + }, + { + "epoch": 0.37, + "learning_rate": 1.460391899040383e-05, + "loss": 0.3325, + "step": 4636 + }, + { + "epoch": 0.37, + "learning_rate": 1.4601640932002194e-05, + "loss": 0.4305, + "step": 4637 + }, + { + "epoch": 0.37, + "learning_rate": 1.4599362570604645e-05, + "loss": 0.2968, + "step": 4638 + }, + { + "epoch": 0.37, + "learning_rate": 1.4597083906361203e-05, + "loss": 0.4511, + "step": 4639 + }, + { + "epoch": 0.37, + "learning_rate": 1.4594804939421903e-05, + "loss": 0.3455, + "step": 4640 + }, + { + "epoch": 0.37, + "learning_rate": 1.4592525669936808e-05, + "loss": 0.3798, + "step": 4641 + }, + { + "epoch": 0.37, + "learning_rate": 1.4590246098055995e-05, + "loss": 0.4892, + "step": 4642 + }, + { + "epoch": 0.37, + "learning_rate": 1.4587966223929562e-05, + "loss": 0.3697, + "step": 4643 + }, + { + "epoch": 0.37, + "learning_rate": 1.458568604770763e-05, + "loss": 0.3723, + "step": 4644 + }, + { + "epoch": 0.37, + "learning_rate": 1.458340556954034e-05, + "loss": 0.3387, + "step": 4645 + }, + { + "epoch": 0.37, + "learning_rate": 1.4581124789577841e-05, + "loss": 0.3969, + "step": 4646 + }, + { + "epoch": 0.37, + "learning_rate": 1.4578843707970323e-05, + "loss": 0.3845, + "step": 4647 + }, + { + "epoch": 0.37, + "learning_rate": 1.4576562324867975e-05, + "loss": 0.3114, + "step": 4648 + }, + { + "epoch": 0.37, + "learning_rate": 1.457428064042102e-05, + "loss": 0.434, + "step": 4649 + }, + { + "epoch": 0.37, + "learning_rate": 1.45719986547797e-05, + "loss": 0.2643, + "step": 4650 + }, + { + "epoch": 0.37, + "learning_rate": 1.4569716368094262e-05, + "loss": 0.3174, + "step": 4651 + }, + { + "epoch": 0.37, + "learning_rate": 1.456743378051499e-05, + "loss": 0.3815, + "step": 4652 + }, + { + "epoch": 0.37, + "learning_rate": 1.456515089219218e-05, + "loss": 0.3104, + "step": 4653 + }, + { + "epoch": 0.37, + "learning_rate": 1.456286770327615e-05, + "loss": 0.4539, + "step": 4654 + }, + { + "epoch": 0.37, + "learning_rate": 1.456058421391724e-05, + "loss": 0.2625, + "step": 4655 + }, + { + "epoch": 0.37, + "learning_rate": 1.45583004242658e-05, + "loss": 0.414, + "step": 4656 + }, + { + "epoch": 0.37, + "learning_rate": 1.4556016334472211e-05, + "loss": 0.3729, + "step": 4657 + }, + { + "epoch": 0.37, + "learning_rate": 1.455373194468687e-05, + "loss": 0.3201, + "step": 4658 + }, + { + "epoch": 0.37, + "learning_rate": 1.4551447255060192e-05, + "loss": 0.3165, + "step": 4659 + }, + { + "epoch": 0.37, + "learning_rate": 1.4549162265742608e-05, + "loss": 0.2455, + "step": 4660 + }, + { + "epoch": 0.37, + "learning_rate": 1.4546876976884583e-05, + "loss": 0.3496, + "step": 4661 + }, + { + "epoch": 0.37, + "learning_rate": 1.4544591388636584e-05, + "loss": 0.2901, + "step": 4662 + }, + { + "epoch": 0.37, + "learning_rate": 1.454230550114911e-05, + "loss": 0.2412, + "step": 4663 + }, + { + "epoch": 0.37, + "learning_rate": 1.4540019314572678e-05, + "loss": 0.3362, + "step": 4664 + }, + { + "epoch": 0.37, + "learning_rate": 1.4537732829057816e-05, + "loss": 0.5096, + "step": 4665 + }, + { + "epoch": 0.37, + "learning_rate": 1.4535446044755082e-05, + "loss": 0.411, + "step": 4666 + }, + { + "epoch": 0.37, + "learning_rate": 1.4533158961815048e-05, + "loss": 0.395, + "step": 4667 + }, + { + "epoch": 0.37, + "learning_rate": 1.4530871580388311e-05, + "loss": 0.2166, + "step": 4668 + }, + { + "epoch": 0.37, + "learning_rate": 1.4528583900625481e-05, + "loss": 0.4227, + "step": 4669 + }, + { + "epoch": 0.37, + "learning_rate": 1.4526295922677189e-05, + "loss": 0.3894, + "step": 4670 + }, + { + "epoch": 0.37, + "learning_rate": 1.4524007646694091e-05, + "loss": 0.4363, + "step": 4671 + }, + { + "epoch": 0.37, + "learning_rate": 1.4521719072826858e-05, + "loss": 0.3228, + "step": 4672 + }, + { + "epoch": 0.37, + "learning_rate": 1.451943020122618e-05, + "loss": 0.2931, + "step": 4673 + }, + { + "epoch": 0.37, + "learning_rate": 1.4517141032042773e-05, + "loss": 0.3022, + "step": 4674 + }, + { + "epoch": 0.37, + "learning_rate": 1.4514851565427362e-05, + "loss": 0.3303, + "step": 4675 + }, + { + "epoch": 0.37, + "learning_rate": 1.4512561801530699e-05, + "loss": 0.3847, + "step": 4676 + }, + { + "epoch": 0.37, + "learning_rate": 1.4510271740503555e-05, + "loss": 0.3269, + "step": 4677 + }, + { + "epoch": 0.37, + "learning_rate": 1.4507981382496716e-05, + "loss": 0.3952, + "step": 4678 + }, + { + "epoch": 0.37, + "learning_rate": 1.4505690727660997e-05, + "loss": 0.4134, + "step": 4679 + }, + { + "epoch": 0.37, + "learning_rate": 1.4503399776147223e-05, + "loss": 0.3465, + "step": 4680 + }, + { + "epoch": 0.37, + "learning_rate": 1.4501108528106243e-05, + "loss": 0.3999, + "step": 4681 + }, + { + "epoch": 0.37, + "learning_rate": 1.4498816983688926e-05, + "loss": 0.529, + "step": 4682 + }, + { + "epoch": 0.37, + "learning_rate": 1.4496525143046154e-05, + "loss": 0.4157, + "step": 4683 + }, + { + "epoch": 0.37, + "learning_rate": 1.4494233006328837e-05, + "loss": 0.415, + "step": 4684 + }, + { + "epoch": 0.37, + "learning_rate": 1.4491940573687906e-05, + "loss": 0.3111, + "step": 4685 + }, + { + "epoch": 0.37, + "learning_rate": 1.44896478452743e-05, + "loss": 0.3317, + "step": 4686 + }, + { + "epoch": 0.37, + "learning_rate": 1.4487354821238983e-05, + "loss": 0.3521, + "step": 4687 + }, + { + "epoch": 0.37, + "learning_rate": 1.4485061501732949e-05, + "loss": 0.3744, + "step": 4688 + }, + { + "epoch": 0.37, + "learning_rate": 1.448276788690719e-05, + "loss": 0.2974, + "step": 4689 + }, + { + "epoch": 0.37, + "learning_rate": 1.4480473976912737e-05, + "loss": 0.2951, + "step": 4690 + }, + { + "epoch": 0.37, + "learning_rate": 1.4478179771900634e-05, + "loss": 0.301, + "step": 4691 + }, + { + "epoch": 0.37, + "learning_rate": 1.4475885272021936e-05, + "loss": 0.3571, + "step": 4692 + }, + { + "epoch": 0.37, + "learning_rate": 1.4473590477427735e-05, + "loss": 0.2719, + "step": 4693 + }, + { + "epoch": 0.37, + "learning_rate": 1.4471295388269121e-05, + "loss": 0.4249, + "step": 4694 + }, + { + "epoch": 0.37, + "learning_rate": 1.4469000004697224e-05, + "loss": 0.3262, + "step": 4695 + }, + { + "epoch": 0.37, + "learning_rate": 1.446670432686318e-05, + "loss": 0.312, + "step": 4696 + }, + { + "epoch": 0.37, + "learning_rate": 1.4464408354918145e-05, + "loss": 0.4009, + "step": 4697 + }, + { + "epoch": 0.37, + "learning_rate": 1.4462112089013304e-05, + "loss": 0.3575, + "step": 4698 + }, + { + "epoch": 0.37, + "learning_rate": 1.4459815529299851e-05, + "loss": 0.3327, + "step": 4699 + }, + { + "epoch": 0.37, + "learning_rate": 1.4457518675929008e-05, + "loss": 0.3468, + "step": 4700 + }, + { + "epoch": 0.37, + "learning_rate": 1.4455221529052006e-05, + "loss": 0.3185, + "step": 4701 + }, + { + "epoch": 0.37, + "learning_rate": 1.4452924088820101e-05, + "loss": 0.3743, + "step": 4702 + }, + { + "epoch": 0.37, + "learning_rate": 1.4450626355384573e-05, + "loss": 0.4268, + "step": 4703 + }, + { + "epoch": 0.37, + "learning_rate": 1.4448328328896717e-05, + "loss": 0.2639, + "step": 4704 + }, + { + "epoch": 0.37, + "learning_rate": 1.444603000950784e-05, + "loss": 0.3399, + "step": 4705 + }, + { + "epoch": 0.37, + "learning_rate": 1.4443731397369283e-05, + "loss": 0.3253, + "step": 4706 + }, + { + "epoch": 0.37, + "learning_rate": 1.4441432492632395e-05, + "loss": 0.3744, + "step": 4707 + }, + { + "epoch": 0.37, + "learning_rate": 1.4439133295448547e-05, + "loss": 0.3672, + "step": 4708 + }, + { + "epoch": 0.37, + "learning_rate": 1.4436833805969133e-05, + "loss": 0.3364, + "step": 4709 + }, + { + "epoch": 0.37, + "learning_rate": 1.4434534024345558e-05, + "loss": 0.3104, + "step": 4710 + }, + { + "epoch": 0.37, + "learning_rate": 1.4432233950729257e-05, + "loss": 0.3611, + "step": 4711 + }, + { + "epoch": 0.37, + "learning_rate": 1.442993358527168e-05, + "loss": 0.4458, + "step": 4712 + }, + { + "epoch": 0.37, + "learning_rate": 1.4427632928124288e-05, + "loss": 0.4283, + "step": 4713 + }, + { + "epoch": 0.37, + "learning_rate": 1.4425331979438573e-05, + "loss": 0.2868, + "step": 4714 + }, + { + "epoch": 0.37, + "learning_rate": 1.4423030739366042e-05, + "loss": 0.2551, + "step": 4715 + }, + { + "epoch": 0.37, + "learning_rate": 1.4420729208058217e-05, + "loss": 0.3909, + "step": 4716 + }, + { + "epoch": 0.37, + "learning_rate": 1.4418427385666647e-05, + "loss": 0.5098, + "step": 4717 + }, + { + "epoch": 0.37, + "learning_rate": 1.4416125272342891e-05, + "loss": 0.4247, + "step": 4718 + }, + { + "epoch": 0.37, + "learning_rate": 1.4413822868238537e-05, + "loss": 0.3665, + "step": 4719 + }, + { + "epoch": 0.37, + "learning_rate": 1.4411520173505184e-05, + "loss": 0.4522, + "step": 4720 + }, + { + "epoch": 0.37, + "learning_rate": 1.4409217188294456e-05, + "loss": 0.343, + "step": 4721 + }, + { + "epoch": 0.37, + "learning_rate": 1.440691391275799e-05, + "loss": 0.3746, + "step": 4722 + }, + { + "epoch": 0.37, + "learning_rate": 1.440461034704745e-05, + "loss": 0.3402, + "step": 4723 + }, + { + "epoch": 0.37, + "learning_rate": 1.4402306491314508e-05, + "loss": 0.542, + "step": 4724 + }, + { + "epoch": 0.37, + "learning_rate": 1.4400002345710871e-05, + "loss": 0.2061, + "step": 4725 + }, + { + "epoch": 0.37, + "learning_rate": 1.4397697910388248e-05, + "loss": 0.2991, + "step": 4726 + }, + { + "epoch": 0.37, + "learning_rate": 1.4395393185498381e-05, + "loss": 0.404, + "step": 4727 + }, + { + "epoch": 0.37, + "learning_rate": 1.4393088171193021e-05, + "loss": 0.4232, + "step": 4728 + }, + { + "epoch": 0.37, + "learning_rate": 1.439078286762394e-05, + "loss": 0.4145, + "step": 4729 + }, + { + "epoch": 0.37, + "learning_rate": 1.4388477274942936e-05, + "loss": 0.4395, + "step": 4730 + }, + { + "epoch": 0.37, + "learning_rate": 1.438617139330182e-05, + "loss": 0.4631, + "step": 4731 + }, + { + "epoch": 0.37, + "learning_rate": 1.4383865222852423e-05, + "loss": 0.4233, + "step": 4732 + }, + { + "epoch": 0.37, + "learning_rate": 1.4381558763746593e-05, + "loss": 0.351, + "step": 4733 + }, + { + "epoch": 0.38, + "learning_rate": 1.4379252016136203e-05, + "loss": 0.3444, + "step": 4734 + }, + { + "epoch": 0.38, + "learning_rate": 1.4376944980173138e-05, + "loss": 0.3635, + "step": 4735 + }, + { + "epoch": 0.38, + "learning_rate": 1.4374637656009309e-05, + "loss": 0.3845, + "step": 4736 + }, + { + "epoch": 0.38, + "learning_rate": 1.4372330043796636e-05, + "loss": 0.3877, + "step": 4737 + }, + { + "epoch": 0.38, + "learning_rate": 1.437002214368707e-05, + "loss": 0.4021, + "step": 4738 + }, + { + "epoch": 0.38, + "learning_rate": 1.4367713955832575e-05, + "loss": 0.46, + "step": 4739 + }, + { + "epoch": 0.38, + "learning_rate": 1.4365405480385129e-05, + "loss": 0.3076, + "step": 4740 + }, + { + "epoch": 0.38, + "learning_rate": 1.4363096717496738e-05, + "loss": 0.4307, + "step": 4741 + }, + { + "epoch": 0.38, + "learning_rate": 1.4360787667319423e-05, + "loss": 0.3215, + "step": 4742 + }, + { + "epoch": 0.38, + "learning_rate": 1.4358478330005222e-05, + "loss": 0.3399, + "step": 4743 + }, + { + "epoch": 0.38, + "learning_rate": 1.4356168705706195e-05, + "loss": 0.4439, + "step": 4744 + }, + { + "epoch": 0.38, + "learning_rate": 1.4353858794574418e-05, + "loss": 0.36, + "step": 4745 + }, + { + "epoch": 0.38, + "learning_rate": 1.435154859676199e-05, + "loss": 0.3076, + "step": 4746 + }, + { + "epoch": 0.38, + "learning_rate": 1.4349238112421025e-05, + "loss": 0.3578, + "step": 4747 + }, + { + "epoch": 0.38, + "learning_rate": 1.4346927341703659e-05, + "loss": 0.2969, + "step": 4748 + }, + { + "epoch": 0.38, + "learning_rate": 1.4344616284762038e-05, + "loss": 0.3796, + "step": 4749 + }, + { + "epoch": 0.38, + "learning_rate": 1.4342304941748347e-05, + "loss": 0.3761, + "step": 4750 + }, + { + "epoch": 0.38, + "learning_rate": 1.4339993312814765e-05, + "loss": 0.3424, + "step": 4751 + }, + { + "epoch": 0.38, + "learning_rate": 1.4337681398113508e-05, + "loss": 0.4495, + "step": 4752 + }, + { + "epoch": 0.38, + "learning_rate": 1.4335369197796803e-05, + "loss": 0.4033, + "step": 4753 + }, + { + "epoch": 0.38, + "learning_rate": 1.4333056712016893e-05, + "loss": 0.3739, + "step": 4754 + }, + { + "epoch": 0.38, + "learning_rate": 1.4330743940926052e-05, + "loss": 0.407, + "step": 4755 + }, + { + "epoch": 0.38, + "learning_rate": 1.4328430884676559e-05, + "loss": 0.3775, + "step": 4756 + }, + { + "epoch": 0.38, + "learning_rate": 1.432611754342072e-05, + "loss": 0.2658, + "step": 4757 + }, + { + "epoch": 0.38, + "learning_rate": 1.4323803917310857e-05, + "loss": 0.3781, + "step": 4758 + }, + { + "epoch": 0.38, + "learning_rate": 1.4321490006499309e-05, + "loss": 0.4022, + "step": 4759 + }, + { + "epoch": 0.38, + "learning_rate": 1.4319175811138439e-05, + "loss": 0.3892, + "step": 4760 + }, + { + "epoch": 0.38, + "learning_rate": 1.4316861331380624e-05, + "loss": 0.3139, + "step": 4761 + }, + { + "epoch": 0.38, + "learning_rate": 1.431454656737826e-05, + "loss": 0.3091, + "step": 4762 + }, + { + "epoch": 0.38, + "learning_rate": 1.4312231519283768e-05, + "loss": 0.4494, + "step": 4763 + }, + { + "epoch": 0.38, + "learning_rate": 1.4309916187249578e-05, + "loss": 0.4114, + "step": 4764 + }, + { + "epoch": 0.38, + "learning_rate": 1.4307600571428143e-05, + "loss": 0.3057, + "step": 4765 + }, + { + "epoch": 0.38, + "learning_rate": 1.4305284671971943e-05, + "loss": 0.3172, + "step": 4766 + }, + { + "epoch": 0.38, + "learning_rate": 1.4302968489033462e-05, + "loss": 0.3981, + "step": 4767 + }, + { + "epoch": 0.38, + "learning_rate": 1.4300652022765207e-05, + "loss": 0.2528, + "step": 4768 + }, + { + "epoch": 0.38, + "learning_rate": 1.429833527331971e-05, + "loss": 0.3059, + "step": 4769 + }, + { + "epoch": 0.38, + "learning_rate": 1.4296018240849518e-05, + "loss": 0.4361, + "step": 4770 + }, + { + "epoch": 0.38, + "learning_rate": 1.4293700925507199e-05, + "loss": 0.4316, + "step": 4771 + }, + { + "epoch": 0.38, + "learning_rate": 1.429138332744533e-05, + "loss": 0.3439, + "step": 4772 + }, + { + "epoch": 0.38, + "learning_rate": 1.428906544681652e-05, + "loss": 0.562, + "step": 4773 + }, + { + "epoch": 0.38, + "learning_rate": 1.4286747283773388e-05, + "loss": 0.3572, + "step": 4774 + }, + { + "epoch": 0.38, + "learning_rate": 1.4284428838468572e-05, + "loss": 0.4048, + "step": 4775 + }, + { + "epoch": 0.38, + "learning_rate": 1.4282110111054733e-05, + "loss": 0.4068, + "step": 4776 + }, + { + "epoch": 0.38, + "learning_rate": 1.4279791101684547e-05, + "loss": 0.4176, + "step": 4777 + }, + { + "epoch": 0.38, + "learning_rate": 1.427747181051071e-05, + "loss": 0.419, + "step": 4778 + }, + { + "epoch": 0.38, + "learning_rate": 1.4275152237685938e-05, + "loss": 0.4407, + "step": 4779 + }, + { + "epoch": 0.38, + "learning_rate": 1.4272832383362962e-05, + "loss": 0.2978, + "step": 4780 + }, + { + "epoch": 0.38, + "learning_rate": 1.427051224769453e-05, + "loss": 0.2626, + "step": 4781 + }, + { + "epoch": 0.38, + "learning_rate": 1.4268191830833417e-05, + "loss": 0.3443, + "step": 4782 + }, + { + "epoch": 0.38, + "learning_rate": 1.426587113293241e-05, + "loss": 0.349, + "step": 4783 + }, + { + "epoch": 0.38, + "learning_rate": 1.4263550154144313e-05, + "loss": 0.3452, + "step": 4784 + }, + { + "epoch": 0.38, + "learning_rate": 1.4261228894621955e-05, + "loss": 0.3484, + "step": 4785 + }, + { + "epoch": 0.38, + "learning_rate": 1.4258907354518177e-05, + "loss": 0.4289, + "step": 4786 + }, + { + "epoch": 0.38, + "learning_rate": 1.4256585533985842e-05, + "loss": 0.3767, + "step": 4787 + }, + { + "epoch": 0.38, + "learning_rate": 1.425426343317783e-05, + "loss": 0.3941, + "step": 4788 + }, + { + "epoch": 0.38, + "learning_rate": 1.4251941052247044e-05, + "loss": 0.3883, + "step": 4789 + }, + { + "epoch": 0.38, + "learning_rate": 1.4249618391346399e-05, + "loss": 0.2508, + "step": 4790 + }, + { + "epoch": 0.38, + "learning_rate": 1.4247295450628826e-05, + "loss": 0.443, + "step": 4791 + }, + { + "epoch": 0.38, + "learning_rate": 1.4244972230247287e-05, + "loss": 0.3267, + "step": 4792 + }, + { + "epoch": 0.38, + "learning_rate": 1.4242648730354756e-05, + "loss": 0.3978, + "step": 4793 + }, + { + "epoch": 0.38, + "learning_rate": 1.4240324951104213e-05, + "loss": 0.3622, + "step": 4794 + }, + { + "epoch": 0.38, + "learning_rate": 1.4238000892648682e-05, + "loss": 0.3969, + "step": 4795 + }, + { + "epoch": 0.38, + "learning_rate": 1.423567655514118e-05, + "loss": 0.3843, + "step": 4796 + }, + { + "epoch": 0.38, + "learning_rate": 1.4233351938734758e-05, + "loss": 0.4479, + "step": 4797 + }, + { + "epoch": 0.38, + "learning_rate": 1.4231027043582483e-05, + "loss": 0.3367, + "step": 4798 + }, + { + "epoch": 0.38, + "learning_rate": 1.4228701869837433e-05, + "loss": 0.2789, + "step": 4799 + }, + { + "epoch": 0.38, + "learning_rate": 1.4226376417652713e-05, + "loss": 0.2878, + "step": 4800 + }, + { + "epoch": 0.38, + "learning_rate": 1.4224050687181442e-05, + "loss": 0.4985, + "step": 4801 + }, + { + "epoch": 0.38, + "learning_rate": 1.4221724678576756e-05, + "loss": 0.3828, + "step": 4802 + }, + { + "epoch": 0.38, + "learning_rate": 1.421939839199182e-05, + "loss": 0.3858, + "step": 4803 + }, + { + "epoch": 0.38, + "learning_rate": 1.4217071827579796e-05, + "loss": 0.4332, + "step": 4804 + }, + { + "epoch": 0.38, + "learning_rate": 1.4214744985493884e-05, + "loss": 0.3719, + "step": 4805 + }, + { + "epoch": 0.38, + "learning_rate": 1.4212417865887299e-05, + "loss": 0.3039, + "step": 4806 + }, + { + "epoch": 0.38, + "learning_rate": 1.4210090468913263e-05, + "loss": 0.4563, + "step": 4807 + }, + { + "epoch": 0.38, + "learning_rate": 1.4207762794725026e-05, + "loss": 0.2729, + "step": 4808 + }, + { + "epoch": 0.38, + "learning_rate": 1.4205434843475859e-05, + "loss": 0.4953, + "step": 4809 + }, + { + "epoch": 0.38, + "learning_rate": 1.420310661531904e-05, + "loss": 0.3653, + "step": 4810 + }, + { + "epoch": 0.38, + "learning_rate": 1.4200778110407873e-05, + "loss": 0.3882, + "step": 4811 + }, + { + "epoch": 0.38, + "learning_rate": 1.4198449328895685e-05, + "loss": 0.3563, + "step": 4812 + }, + { + "epoch": 0.38, + "learning_rate": 1.4196120270935807e-05, + "loss": 0.4173, + "step": 4813 + }, + { + "epoch": 0.38, + "learning_rate": 1.4193790936681602e-05, + "loss": 0.5137, + "step": 4814 + }, + { + "epoch": 0.38, + "learning_rate": 1.4191461326286442e-05, + "loss": 0.3609, + "step": 4815 + }, + { + "epoch": 0.38, + "learning_rate": 1.4189131439903721e-05, + "loss": 0.4398, + "step": 4816 + }, + { + "epoch": 0.38, + "learning_rate": 1.4186801277686852e-05, + "loss": 0.4927, + "step": 4817 + }, + { + "epoch": 0.38, + "learning_rate": 1.4184470839789265e-05, + "loss": 0.2058, + "step": 4818 + }, + { + "epoch": 0.38, + "learning_rate": 1.4182140126364404e-05, + "loss": 0.3395, + "step": 4819 + }, + { + "epoch": 0.38, + "learning_rate": 1.4179809137565742e-05, + "loss": 0.3043, + "step": 4820 + }, + { + "epoch": 0.38, + "learning_rate": 1.417747787354676e-05, + "loss": 0.429, + "step": 4821 + }, + { + "epoch": 0.38, + "learning_rate": 1.4175146334460963e-05, + "loss": 0.3933, + "step": 4822 + }, + { + "epoch": 0.38, + "learning_rate": 1.4172814520461867e-05, + "loss": 0.3618, + "step": 4823 + }, + { + "epoch": 0.38, + "learning_rate": 1.4170482431703012e-05, + "loss": 0.403, + "step": 4824 + }, + { + "epoch": 0.38, + "learning_rate": 1.4168150068337958e-05, + "loss": 0.3883, + "step": 4825 + }, + { + "epoch": 0.38, + "learning_rate": 1.4165817430520276e-05, + "loss": 0.3408, + "step": 4826 + }, + { + "epoch": 0.38, + "learning_rate": 1.4163484518403561e-05, + "loss": 0.3568, + "step": 4827 + }, + { + "epoch": 0.38, + "learning_rate": 1.4161151332141426e-05, + "loss": 0.4812, + "step": 4828 + }, + { + "epoch": 0.38, + "learning_rate": 1.4158817871887497e-05, + "loss": 0.3804, + "step": 4829 + }, + { + "epoch": 0.38, + "learning_rate": 1.4156484137795424e-05, + "loss": 0.3191, + "step": 4830 + }, + { + "epoch": 0.38, + "learning_rate": 1.4154150130018867e-05, + "loss": 0.342, + "step": 4831 + }, + { + "epoch": 0.38, + "learning_rate": 1.4151815848711512e-05, + "loss": 0.4374, + "step": 4832 + }, + { + "epoch": 0.38, + "learning_rate": 1.4149481294027063e-05, + "loss": 0.4673, + "step": 4833 + }, + { + "epoch": 0.38, + "learning_rate": 1.4147146466119235e-05, + "loss": 0.3466, + "step": 4834 + }, + { + "epoch": 0.38, + "learning_rate": 1.4144811365141769e-05, + "loss": 0.2172, + "step": 4835 + }, + { + "epoch": 0.38, + "learning_rate": 1.4142475991248417e-05, + "loss": 0.4468, + "step": 4836 + }, + { + "epoch": 0.38, + "learning_rate": 1.4140140344592952e-05, + "loss": 0.4202, + "step": 4837 + }, + { + "epoch": 0.38, + "learning_rate": 1.413780442532917e-05, + "loss": 0.3815, + "step": 4838 + }, + { + "epoch": 0.38, + "learning_rate": 1.4135468233610872e-05, + "loss": 0.3264, + "step": 4839 + }, + { + "epoch": 0.38, + "learning_rate": 1.4133131769591893e-05, + "loss": 0.3251, + "step": 4840 + }, + { + "epoch": 0.38, + "learning_rate": 1.4130795033426073e-05, + "loss": 0.3642, + "step": 4841 + }, + { + "epoch": 0.38, + "learning_rate": 1.4128458025267276e-05, + "loss": 0.4268, + "step": 4842 + }, + { + "epoch": 0.38, + "learning_rate": 1.4126120745269382e-05, + "loss": 0.3838, + "step": 4843 + }, + { + "epoch": 0.38, + "learning_rate": 1.4123783193586294e-05, + "loss": 0.3349, + "step": 4844 + }, + { + "epoch": 0.38, + "learning_rate": 1.4121445370371922e-05, + "loss": 0.3798, + "step": 4845 + }, + { + "epoch": 0.38, + "learning_rate": 1.4119107275780203e-05, + "loss": 0.2733, + "step": 4846 + }, + { + "epoch": 0.38, + "learning_rate": 1.4116768909965092e-05, + "loss": 0.2832, + "step": 4847 + }, + { + "epoch": 0.38, + "learning_rate": 1.4114430273080558e-05, + "loss": 0.292, + "step": 4848 + }, + { + "epoch": 0.38, + "learning_rate": 1.4112091365280585e-05, + "loss": 0.4221, + "step": 4849 + }, + { + "epoch": 0.38, + "learning_rate": 1.4109752186719181e-05, + "loss": 0.3342, + "step": 4850 + }, + { + "epoch": 0.38, + "learning_rate": 1.4107412737550372e-05, + "loss": 0.3746, + "step": 4851 + }, + { + "epoch": 0.38, + "learning_rate": 1.4105073017928199e-05, + "loss": 0.3434, + "step": 4852 + }, + { + "epoch": 0.38, + "learning_rate": 1.4102733028006719e-05, + "loss": 0.4169, + "step": 4853 + }, + { + "epoch": 0.38, + "learning_rate": 1.410039276794001e-05, + "loss": 0.3443, + "step": 4854 + }, + { + "epoch": 0.38, + "learning_rate": 1.4098052237882168e-05, + "loss": 0.3227, + "step": 4855 + }, + { + "epoch": 0.38, + "learning_rate": 1.4095711437987303e-05, + "loss": 0.4471, + "step": 4856 + }, + { + "epoch": 0.38, + "learning_rate": 1.4093370368409546e-05, + "loss": 0.2279, + "step": 4857 + }, + { + "epoch": 0.38, + "learning_rate": 1.409102902930305e-05, + "loss": 0.3157, + "step": 4858 + }, + { + "epoch": 0.38, + "learning_rate": 1.4088687420821974e-05, + "loss": 0.4063, + "step": 4859 + }, + { + "epoch": 0.39, + "learning_rate": 1.4086345543120508e-05, + "loss": 0.3933, + "step": 4860 + }, + { + "epoch": 0.39, + "learning_rate": 1.4084003396352848e-05, + "loss": 0.3888, + "step": 4861 + }, + { + "epoch": 0.39, + "learning_rate": 1.4081660980673215e-05, + "loss": 0.3293, + "step": 4862 + }, + { + "epoch": 0.39, + "learning_rate": 1.4079318296235846e-05, + "loss": 0.3135, + "step": 4863 + }, + { + "epoch": 0.39, + "learning_rate": 1.4076975343194996e-05, + "loss": 0.3744, + "step": 4864 + }, + { + "epoch": 0.39, + "learning_rate": 1.4074632121704941e-05, + "loss": 0.4885, + "step": 4865 + }, + { + "epoch": 0.39, + "learning_rate": 1.4072288631919962e-05, + "loss": 0.3231, + "step": 4866 + }, + { + "epoch": 0.39, + "learning_rate": 1.406994487399437e-05, + "loss": 0.3369, + "step": 4867 + }, + { + "epoch": 0.39, + "learning_rate": 1.4067600848082496e-05, + "loss": 0.4217, + "step": 4868 + }, + { + "epoch": 0.39, + "learning_rate": 1.4065256554338675e-05, + "loss": 0.3122, + "step": 4869 + }, + { + "epoch": 0.39, + "learning_rate": 1.406291199291727e-05, + "loss": 0.366, + "step": 4870 + }, + { + "epoch": 0.39, + "learning_rate": 1.4060567163972663e-05, + "loss": 0.4753, + "step": 4871 + }, + { + "epoch": 0.39, + "learning_rate": 1.4058222067659244e-05, + "loss": 0.3872, + "step": 4872 + }, + { + "epoch": 0.39, + "learning_rate": 1.405587670413143e-05, + "loss": 0.3555, + "step": 4873 + }, + { + "epoch": 0.39, + "learning_rate": 1.405353107354365e-05, + "loss": 0.3411, + "step": 4874 + }, + { + "epoch": 0.39, + "learning_rate": 1.4051185176050353e-05, + "loss": 0.4795, + "step": 4875 + }, + { + "epoch": 0.39, + "learning_rate": 1.4048839011806006e-05, + "loss": 0.3932, + "step": 4876 + }, + { + "epoch": 0.39, + "learning_rate": 1.404649258096509e-05, + "loss": 0.5096, + "step": 4877 + }, + { + "epoch": 0.39, + "learning_rate": 1.4044145883682108e-05, + "loss": 0.3252, + "step": 4878 + }, + { + "epoch": 0.39, + "learning_rate": 1.4041798920111582e-05, + "loss": 0.3816, + "step": 4879 + }, + { + "epoch": 0.39, + "learning_rate": 1.4039451690408042e-05, + "loss": 0.3676, + "step": 4880 + }, + { + "epoch": 0.39, + "learning_rate": 1.4037104194726048e-05, + "loss": 0.2638, + "step": 4881 + }, + { + "epoch": 0.39, + "learning_rate": 1.4034756433220164e-05, + "loss": 0.3244, + "step": 4882 + }, + { + "epoch": 0.39, + "learning_rate": 1.4032408406044986e-05, + "loss": 0.3233, + "step": 4883 + }, + { + "epoch": 0.39, + "learning_rate": 1.4030060113355118e-05, + "loss": 0.3074, + "step": 4884 + }, + { + "epoch": 0.39, + "learning_rate": 1.402771155530518e-05, + "loss": 0.3389, + "step": 4885 + }, + { + "epoch": 0.39, + "learning_rate": 1.4025362732049816e-05, + "loss": 0.3622, + "step": 4886 + }, + { + "epoch": 0.39, + "learning_rate": 1.4023013643743688e-05, + "loss": 0.2771, + "step": 4887 + }, + { + "epoch": 0.39, + "learning_rate": 1.4020664290541465e-05, + "loss": 0.3592, + "step": 4888 + }, + { + "epoch": 0.39, + "learning_rate": 1.4018314672597848e-05, + "loss": 0.3071, + "step": 4889 + }, + { + "epoch": 0.39, + "learning_rate": 1.4015964790067545e-05, + "loss": 0.3409, + "step": 4890 + }, + { + "epoch": 0.39, + "learning_rate": 1.401361464310528e-05, + "loss": 0.2802, + "step": 4891 + }, + { + "epoch": 0.39, + "learning_rate": 1.4011264231865807e-05, + "loss": 0.519, + "step": 4892 + }, + { + "epoch": 0.39, + "learning_rate": 1.4008913556503885e-05, + "loss": 0.387, + "step": 4893 + }, + { + "epoch": 0.39, + "learning_rate": 1.4006562617174292e-05, + "loss": 0.3712, + "step": 4894 + }, + { + "epoch": 0.39, + "learning_rate": 1.4004211414031831e-05, + "loss": 0.2954, + "step": 4895 + }, + { + "epoch": 0.39, + "learning_rate": 1.4001859947231316e-05, + "loss": 0.2985, + "step": 4896 + }, + { + "epoch": 0.39, + "learning_rate": 1.3999508216927578e-05, + "loss": 0.3822, + "step": 4897 + }, + { + "epoch": 0.39, + "learning_rate": 1.399715622327547e-05, + "loss": 0.5309, + "step": 4898 + }, + { + "epoch": 0.39, + "learning_rate": 1.3994803966429854e-05, + "loss": 0.3368, + "step": 4899 + }, + { + "epoch": 0.39, + "learning_rate": 1.3992451446545624e-05, + "loss": 0.3672, + "step": 4900 + }, + { + "epoch": 0.39, + "learning_rate": 1.3990098663777674e-05, + "loss": 0.3474, + "step": 4901 + }, + { + "epoch": 0.39, + "learning_rate": 1.3987745618280925e-05, + "loss": 0.3062, + "step": 4902 + }, + { + "epoch": 0.39, + "learning_rate": 1.3985392310210318e-05, + "loss": 0.3868, + "step": 4903 + }, + { + "epoch": 0.39, + "learning_rate": 1.39830387397208e-05, + "loss": 0.3645, + "step": 4904 + }, + { + "epoch": 0.39, + "learning_rate": 1.3980684906967348e-05, + "loss": 0.4153, + "step": 4905 + }, + { + "epoch": 0.39, + "learning_rate": 1.3978330812104947e-05, + "loss": 0.4126, + "step": 4906 + }, + { + "epoch": 0.39, + "learning_rate": 1.3975976455288607e-05, + "loss": 0.456, + "step": 4907 + }, + { + "epoch": 0.39, + "learning_rate": 1.397362183667335e-05, + "loss": 0.389, + "step": 4908 + }, + { + "epoch": 0.39, + "learning_rate": 1.3971266956414211e-05, + "loss": 0.2898, + "step": 4909 + }, + { + "epoch": 0.39, + "learning_rate": 1.3968911814666252e-05, + "loss": 0.3899, + "step": 4910 + }, + { + "epoch": 0.39, + "learning_rate": 1.3966556411584548e-05, + "loss": 0.3585, + "step": 4911 + }, + { + "epoch": 0.39, + "learning_rate": 1.396420074732419e-05, + "loss": 0.3422, + "step": 4912 + }, + { + "epoch": 0.39, + "learning_rate": 1.396184482204029e-05, + "loss": 0.4052, + "step": 4913 + }, + { + "epoch": 0.39, + "learning_rate": 1.3959488635887967e-05, + "loss": 0.3724, + "step": 4914 + }, + { + "epoch": 0.39, + "learning_rate": 1.3957132189022373e-05, + "loss": 0.358, + "step": 4915 + }, + { + "epoch": 0.39, + "learning_rate": 1.3954775481598665e-05, + "loss": 0.4296, + "step": 4916 + }, + { + "epoch": 0.39, + "learning_rate": 1.3952418513772016e-05, + "loss": 0.4132, + "step": 4917 + }, + { + "epoch": 0.39, + "learning_rate": 1.3950061285697629e-05, + "loss": 0.3605, + "step": 4918 + }, + { + "epoch": 0.39, + "learning_rate": 1.3947703797530716e-05, + "loss": 0.3144, + "step": 4919 + }, + { + "epoch": 0.39, + "learning_rate": 1.3945346049426498e-05, + "loss": 0.3951, + "step": 4920 + }, + { + "epoch": 0.39, + "learning_rate": 1.3942988041540226e-05, + "loss": 0.3005, + "step": 4921 + }, + { + "epoch": 0.39, + "learning_rate": 1.394062977402717e-05, + "loss": 0.3077, + "step": 4922 + }, + { + "epoch": 0.39, + "learning_rate": 1.3938271247042601e-05, + "loss": 0.4049, + "step": 4923 + }, + { + "epoch": 0.39, + "learning_rate": 1.3935912460741818e-05, + "loss": 0.2997, + "step": 4924 + }, + { + "epoch": 0.39, + "learning_rate": 1.3933553415280142e-05, + "loss": 0.3556, + "step": 4925 + }, + { + "epoch": 0.39, + "learning_rate": 1.3931194110812896e-05, + "loss": 0.4325, + "step": 4926 + }, + { + "epoch": 0.39, + "learning_rate": 1.3928834547495438e-05, + "loss": 0.4335, + "step": 4927 + }, + { + "epoch": 0.39, + "learning_rate": 1.3926474725483125e-05, + "loss": 0.4212, + "step": 4928 + }, + { + "epoch": 0.39, + "learning_rate": 1.3924114644931346e-05, + "loss": 0.3052, + "step": 4929 + }, + { + "epoch": 0.39, + "learning_rate": 1.3921754305995501e-05, + "loss": 0.3391, + "step": 4930 + }, + { + "epoch": 0.39, + "learning_rate": 1.3919393708831004e-05, + "loss": 0.3893, + "step": 4931 + }, + { + "epoch": 0.39, + "learning_rate": 1.3917032853593289e-05, + "loss": 0.4793, + "step": 4932 + }, + { + "epoch": 0.39, + "learning_rate": 1.3914671740437811e-05, + "loss": 0.2303, + "step": 4933 + }, + { + "epoch": 0.39, + "learning_rate": 1.3912310369520032e-05, + "loss": 0.3922, + "step": 4934 + }, + { + "epoch": 0.39, + "learning_rate": 1.3909948740995442e-05, + "loss": 0.4836, + "step": 4935 + }, + { + "epoch": 0.39, + "learning_rate": 1.3907586855019538e-05, + "loss": 0.441, + "step": 4936 + }, + { + "epoch": 0.39, + "learning_rate": 1.3905224711747844e-05, + "loss": 0.3437, + "step": 4937 + }, + { + "epoch": 0.39, + "learning_rate": 1.3902862311335896e-05, + "loss": 0.3502, + "step": 4938 + }, + { + "epoch": 0.39, + "learning_rate": 1.390049965393924e-05, + "loss": 0.2964, + "step": 4939 + }, + { + "epoch": 0.39, + "learning_rate": 1.3898136739713451e-05, + "loss": 0.2979, + "step": 4940 + }, + { + "epoch": 0.39, + "learning_rate": 1.3895773568814118e-05, + "loss": 0.2975, + "step": 4941 + }, + { + "epoch": 0.39, + "learning_rate": 1.3893410141396835e-05, + "loss": 0.4251, + "step": 4942 + }, + { + "epoch": 0.39, + "learning_rate": 1.3891046457617233e-05, + "loss": 0.3857, + "step": 4943 + }, + { + "epoch": 0.39, + "learning_rate": 1.388868251763094e-05, + "loss": 0.2993, + "step": 4944 + }, + { + "epoch": 0.39, + "learning_rate": 1.3886318321593614e-05, + "loss": 0.3979, + "step": 4945 + }, + { + "epoch": 0.39, + "learning_rate": 1.388395386966093e-05, + "loss": 0.4575, + "step": 4946 + }, + { + "epoch": 0.39, + "learning_rate": 1.388158916198857e-05, + "loss": 0.4166, + "step": 4947 + }, + { + "epoch": 0.39, + "learning_rate": 1.3879224198732239e-05, + "loss": 0.3912, + "step": 4948 + }, + { + "epoch": 0.39, + "learning_rate": 1.3876858980047665e-05, + "loss": 0.3821, + "step": 4949 + }, + { + "epoch": 0.39, + "learning_rate": 1.3874493506090578e-05, + "loss": 0.2435, + "step": 4950 + }, + { + "epoch": 0.39, + "learning_rate": 1.3872127777016739e-05, + "loss": 0.3487, + "step": 4951 + }, + { + "epoch": 0.39, + "learning_rate": 1.3869761792981915e-05, + "loss": 0.3727, + "step": 4952 + }, + { + "epoch": 0.39, + "learning_rate": 1.3867395554141899e-05, + "loss": 0.4371, + "step": 4953 + }, + { + "epoch": 0.39, + "learning_rate": 1.3865029060652493e-05, + "loss": 0.3686, + "step": 4954 + }, + { + "epoch": 0.39, + "learning_rate": 1.3862662312669518e-05, + "loss": 0.2791, + "step": 4955 + }, + { + "epoch": 0.39, + "learning_rate": 1.386029531034882e-05, + "loss": 0.2741, + "step": 4956 + }, + { + "epoch": 0.39, + "learning_rate": 1.385792805384625e-05, + "loss": 0.3289, + "step": 4957 + }, + { + "epoch": 0.39, + "learning_rate": 1.3855560543317679e-05, + "loss": 0.4491, + "step": 4958 + }, + { + "epoch": 0.39, + "learning_rate": 1.3853192778919e-05, + "loss": 0.1701, + "step": 4959 + }, + { + "epoch": 0.39, + "learning_rate": 1.3850824760806115e-05, + "loss": 0.4637, + "step": 4960 + }, + { + "epoch": 0.39, + "learning_rate": 1.384845648913495e-05, + "loss": 0.4408, + "step": 4961 + }, + { + "epoch": 0.39, + "learning_rate": 1.3846087964061442e-05, + "loss": 0.3333, + "step": 4962 + }, + { + "epoch": 0.39, + "learning_rate": 1.3843719185741548e-05, + "loss": 0.4067, + "step": 4963 + }, + { + "epoch": 0.39, + "learning_rate": 1.3841350154331239e-05, + "loss": 0.402, + "step": 4964 + }, + { + "epoch": 0.39, + "learning_rate": 1.383898086998651e-05, + "loss": 0.3637, + "step": 4965 + }, + { + "epoch": 0.39, + "learning_rate": 1.3836611332863356e-05, + "loss": 0.3338, + "step": 4966 + }, + { + "epoch": 0.39, + "learning_rate": 1.383424154311781e-05, + "loss": 0.3259, + "step": 4967 + }, + { + "epoch": 0.39, + "learning_rate": 1.383187150090591e-05, + "loss": 0.4829, + "step": 4968 + }, + { + "epoch": 0.39, + "learning_rate": 1.3829501206383704e-05, + "loss": 0.354, + "step": 4969 + }, + { + "epoch": 0.39, + "learning_rate": 1.3827130659707275e-05, + "loss": 0.2942, + "step": 4970 + }, + { + "epoch": 0.39, + "learning_rate": 1.3824759861032704e-05, + "loss": 0.4705, + "step": 4971 + }, + { + "epoch": 0.39, + "learning_rate": 1.38223888105161e-05, + "loss": 0.4039, + "step": 4972 + }, + { + "epoch": 0.39, + "learning_rate": 1.3820017508313587e-05, + "loss": 0.2781, + "step": 4973 + }, + { + "epoch": 0.39, + "learning_rate": 1.3817645954581301e-05, + "loss": 0.3689, + "step": 4974 + }, + { + "epoch": 0.39, + "learning_rate": 1.3815274149475395e-05, + "loss": 0.3751, + "step": 4975 + }, + { + "epoch": 0.39, + "learning_rate": 1.3812902093152047e-05, + "loss": 0.3313, + "step": 4976 + }, + { + "epoch": 0.39, + "learning_rate": 1.3810529785767444e-05, + "loss": 0.31, + "step": 4977 + }, + { + "epoch": 0.39, + "learning_rate": 1.3808157227477788e-05, + "loss": 0.3504, + "step": 4978 + }, + { + "epoch": 0.39, + "learning_rate": 1.3805784418439303e-05, + "loss": 0.3868, + "step": 4979 + }, + { + "epoch": 0.39, + "learning_rate": 1.3803411358808222e-05, + "loss": 0.3944, + "step": 4980 + }, + { + "epoch": 0.39, + "learning_rate": 1.3801038048740811e-05, + "loss": 0.4445, + "step": 4981 + }, + { + "epoch": 0.39, + "learning_rate": 1.379866448839333e-05, + "loss": 0.3665, + "step": 4982 + }, + { + "epoch": 0.39, + "learning_rate": 1.379629067792207e-05, + "loss": 0.3793, + "step": 4983 + }, + { + "epoch": 0.39, + "learning_rate": 1.3793916617483338e-05, + "loss": 0.3809, + "step": 4984 + }, + { + "epoch": 0.39, + "learning_rate": 1.379154230723345e-05, + "loss": 0.4816, + "step": 4985 + }, + { + "epoch": 0.4, + "learning_rate": 1.3789167747328746e-05, + "loss": 0.3273, + "step": 4986 + }, + { + "epoch": 0.4, + "learning_rate": 1.3786792937925576e-05, + "loss": 0.3829, + "step": 4987 + }, + { + "epoch": 0.4, + "learning_rate": 1.3784417879180314e-05, + "loss": 0.4666, + "step": 4988 + }, + { + "epoch": 0.4, + "learning_rate": 1.3782042571249343e-05, + "loss": 0.2994, + "step": 4989 + }, + { + "epoch": 0.4, + "learning_rate": 1.3779667014289067e-05, + "loss": 0.3513, + "step": 4990 + }, + { + "epoch": 0.4, + "learning_rate": 1.3777291208455902e-05, + "loss": 0.4472, + "step": 4991 + }, + { + "epoch": 0.4, + "learning_rate": 1.3774915153906292e-05, + "loss": 0.4687, + "step": 4992 + }, + { + "epoch": 0.4, + "learning_rate": 1.377253885079668e-05, + "loss": 0.3542, + "step": 4993 + }, + { + "epoch": 0.4, + "learning_rate": 1.3770162299283535e-05, + "loss": 0.416, + "step": 4994 + }, + { + "epoch": 0.4, + "learning_rate": 1.3767785499523347e-05, + "loss": 0.3463, + "step": 4995 + }, + { + "epoch": 0.4, + "learning_rate": 1.376540845167261e-05, + "loss": 0.3892, + "step": 4996 + }, + { + "epoch": 0.4, + "learning_rate": 1.3763031155887847e-05, + "loss": 0.2524, + "step": 4997 + }, + { + "epoch": 0.4, + "learning_rate": 1.3760653612325588e-05, + "loss": 0.2552, + "step": 4998 + }, + { + "epoch": 0.4, + "learning_rate": 1.3758275821142382e-05, + "loss": 0.436, + "step": 4999 + }, + { + "epoch": 0.4, + "learning_rate": 1.3755897782494803e-05, + "loss": 0.3537, + "step": 5000 + }, + { + "epoch": 0.4, + "learning_rate": 1.375351949653942e-05, + "loss": 0.4893, + "step": 5001 + }, + { + "epoch": 0.4, + "learning_rate": 1.375114096343284e-05, + "loss": 0.3502, + "step": 5002 + }, + { + "epoch": 0.4, + "learning_rate": 1.3748762183331681e-05, + "loss": 0.2363, + "step": 5003 + }, + { + "epoch": 0.4, + "learning_rate": 1.3746383156392566e-05, + "loss": 0.4991, + "step": 5004 + }, + { + "epoch": 0.4, + "learning_rate": 1.374400388277215e-05, + "loss": 0.3733, + "step": 5005 + }, + { + "epoch": 0.4, + "learning_rate": 1.3741624362627091e-05, + "loss": 0.3166, + "step": 5006 + }, + { + "epoch": 0.4, + "learning_rate": 1.373924459611407e-05, + "loss": 0.4309, + "step": 5007 + }, + { + "epoch": 0.4, + "learning_rate": 1.3736864583389789e-05, + "loss": 0.3835, + "step": 5008 + }, + { + "epoch": 0.4, + "learning_rate": 1.373448432461095e-05, + "loss": 0.3979, + "step": 5009 + }, + { + "epoch": 0.4, + "learning_rate": 1.373210381993429e-05, + "loss": 0.2923, + "step": 5010 + }, + { + "epoch": 0.4, + "learning_rate": 1.3729723069516554e-05, + "loss": 0.3278, + "step": 5011 + }, + { + "epoch": 0.4, + "learning_rate": 1.3727342073514497e-05, + "loss": 0.2475, + "step": 5012 + }, + { + "epoch": 0.4, + "learning_rate": 1.3724960832084902e-05, + "loss": 0.453, + "step": 5013 + }, + { + "epoch": 0.4, + "learning_rate": 1.3722579345384558e-05, + "loss": 0.3302, + "step": 5014 + }, + { + "epoch": 0.4, + "learning_rate": 1.3720197613570272e-05, + "loss": 0.3889, + "step": 5015 + }, + { + "epoch": 0.4, + "learning_rate": 1.3717815636798879e-05, + "loss": 0.3183, + "step": 5016 + }, + { + "epoch": 0.4, + "learning_rate": 1.3715433415227212e-05, + "loss": 0.4003, + "step": 5017 + }, + { + "epoch": 0.4, + "learning_rate": 1.3713050949012134e-05, + "loss": 0.2989, + "step": 5018 + }, + { + "epoch": 0.4, + "learning_rate": 1.3710668238310519e-05, + "loss": 0.4197, + "step": 5019 + }, + { + "epoch": 0.4, + "learning_rate": 1.3708285283279252e-05, + "loss": 0.3685, + "step": 5020 + }, + { + "epoch": 0.4, + "learning_rate": 1.3705902084075244e-05, + "loss": 0.3367, + "step": 5021 + }, + { + "epoch": 0.4, + "learning_rate": 1.3703518640855414e-05, + "loss": 0.4162, + "step": 5022 + }, + { + "epoch": 0.4, + "learning_rate": 1.37011349537767e-05, + "loss": 0.3623, + "step": 5023 + }, + { + "epoch": 0.4, + "learning_rate": 1.3698751022996061e-05, + "loss": 0.3924, + "step": 5024 + }, + { + "epoch": 0.4, + "learning_rate": 1.3696366848670464e-05, + "loss": 0.3819, + "step": 5025 + }, + { + "epoch": 0.4, + "learning_rate": 1.3693982430956896e-05, + "loss": 0.3701, + "step": 5026 + }, + { + "epoch": 0.4, + "learning_rate": 1.369159777001236e-05, + "loss": 0.3106, + "step": 5027 + }, + { + "epoch": 0.4, + "learning_rate": 1.368921286599387e-05, + "loss": 0.3544, + "step": 5028 + }, + { + "epoch": 0.4, + "learning_rate": 1.368682771905847e-05, + "loss": 0.3792, + "step": 5029 + }, + { + "epoch": 0.4, + "learning_rate": 1.3684442329363199e-05, + "loss": 0.3696, + "step": 5030 + }, + { + "epoch": 0.4, + "learning_rate": 1.368205669706513e-05, + "loss": 0.3631, + "step": 5031 + }, + { + "epoch": 0.4, + "learning_rate": 1.3679670822321347e-05, + "loss": 0.432, + "step": 5032 + }, + { + "epoch": 0.4, + "learning_rate": 1.3677284705288943e-05, + "loss": 0.4116, + "step": 5033 + }, + { + "epoch": 0.4, + "learning_rate": 1.3674898346125036e-05, + "loss": 0.3618, + "step": 5034 + }, + { + "epoch": 0.4, + "learning_rate": 1.3672511744986756e-05, + "loss": 0.4526, + "step": 5035 + }, + { + "epoch": 0.4, + "learning_rate": 1.3670124902031248e-05, + "loss": 0.4178, + "step": 5036 + }, + { + "epoch": 0.4, + "learning_rate": 1.3667737817415679e-05, + "loss": 0.3231, + "step": 5037 + }, + { + "epoch": 0.4, + "learning_rate": 1.3665350491297215e-05, + "loss": 0.2485, + "step": 5038 + }, + { + "epoch": 0.4, + "learning_rate": 1.3662962923833063e-05, + "loss": 0.3247, + "step": 5039 + }, + { + "epoch": 0.4, + "learning_rate": 1.3660575115180427e-05, + "loss": 0.2924, + "step": 5040 + }, + { + "epoch": 0.4, + "learning_rate": 1.3658187065496533e-05, + "loss": 0.39, + "step": 5041 + }, + { + "epoch": 0.4, + "learning_rate": 1.365579877493862e-05, + "loss": 0.4123, + "step": 5042 + }, + { + "epoch": 0.4, + "learning_rate": 1.3653410243663953e-05, + "loss": 0.31, + "step": 5043 + }, + { + "epoch": 0.4, + "learning_rate": 1.3651021471829797e-05, + "loss": 0.4431, + "step": 5044 + }, + { + "epoch": 0.4, + "learning_rate": 1.3648632459593444e-05, + "loss": 0.3757, + "step": 5045 + }, + { + "epoch": 0.4, + "learning_rate": 1.3646243207112204e-05, + "loss": 0.3316, + "step": 5046 + }, + { + "epoch": 0.4, + "learning_rate": 1.3643853714543389e-05, + "loss": 0.3491, + "step": 5047 + }, + { + "epoch": 0.4, + "learning_rate": 1.3641463982044343e-05, + "loss": 0.3926, + "step": 5048 + }, + { + "epoch": 0.4, + "learning_rate": 1.3639074009772412e-05, + "loss": 0.3886, + "step": 5049 + }, + { + "epoch": 0.4, + "learning_rate": 1.3636683797884971e-05, + "loss": 0.3393, + "step": 5050 + }, + { + "epoch": 0.4, + "learning_rate": 1.36342933465394e-05, + "loss": 0.2992, + "step": 5051 + }, + { + "epoch": 0.4, + "learning_rate": 1.3631902655893096e-05, + "loss": 0.4335, + "step": 5052 + }, + { + "epoch": 0.4, + "learning_rate": 1.3629511726103482e-05, + "loss": 0.4656, + "step": 5053 + }, + { + "epoch": 0.4, + "learning_rate": 1.3627120557327982e-05, + "loss": 0.3663, + "step": 5054 + }, + { + "epoch": 0.4, + "learning_rate": 1.3624729149724047e-05, + "loss": 0.4343, + "step": 5055 + }, + { + "epoch": 0.4, + "learning_rate": 1.362233750344914e-05, + "loss": 0.3809, + "step": 5056 + }, + { + "epoch": 0.4, + "learning_rate": 1.3619945618660735e-05, + "loss": 0.2953, + "step": 5057 + }, + { + "epoch": 0.4, + "learning_rate": 1.3617553495516332e-05, + "loss": 0.3754, + "step": 5058 + }, + { + "epoch": 0.4, + "learning_rate": 1.3615161134173435e-05, + "loss": 0.2737, + "step": 5059 + }, + { + "epoch": 0.4, + "learning_rate": 1.3612768534789573e-05, + "loss": 0.3342, + "step": 5060 + }, + { + "epoch": 0.4, + "learning_rate": 1.3610375697522287e-05, + "loss": 0.2336, + "step": 5061 + }, + { + "epoch": 0.4, + "learning_rate": 1.3607982622529135e-05, + "loss": 0.4097, + "step": 5062 + }, + { + "epoch": 0.4, + "learning_rate": 1.3605589309967686e-05, + "loss": 0.2994, + "step": 5063 + }, + { + "epoch": 0.4, + "learning_rate": 1.3603195759995531e-05, + "loss": 0.2807, + "step": 5064 + }, + { + "epoch": 0.4, + "learning_rate": 1.3600801972770272e-05, + "loss": 0.393, + "step": 5065 + }, + { + "epoch": 0.4, + "learning_rate": 1.3598407948449528e-05, + "loss": 0.3034, + "step": 5066 + }, + { + "epoch": 0.4, + "learning_rate": 1.3596013687190936e-05, + "loss": 0.4292, + "step": 5067 + }, + { + "epoch": 0.4, + "learning_rate": 1.3593619189152146e-05, + "loss": 0.3157, + "step": 5068 + }, + { + "epoch": 0.4, + "learning_rate": 1.3591224454490824e-05, + "loss": 0.5418, + "step": 5069 + }, + { + "epoch": 0.4, + "learning_rate": 1.3588829483364652e-05, + "loss": 0.3623, + "step": 5070 + }, + { + "epoch": 0.4, + "learning_rate": 1.3586434275931324e-05, + "loss": 0.4133, + "step": 5071 + }, + { + "epoch": 0.4, + "learning_rate": 1.358403883234856e-05, + "loss": 0.3162, + "step": 5072 + }, + { + "epoch": 0.4, + "learning_rate": 1.358164315277408e-05, + "loss": 0.4519, + "step": 5073 + }, + { + "epoch": 0.4, + "learning_rate": 1.3579247237365634e-05, + "loss": 0.3324, + "step": 5074 + }, + { + "epoch": 0.4, + "learning_rate": 1.357685108628098e-05, + "loss": 0.3256, + "step": 5075 + }, + { + "epoch": 0.4, + "learning_rate": 1.3574454699677893e-05, + "loss": 0.3759, + "step": 5076 + }, + { + "epoch": 0.4, + "learning_rate": 1.357205807771416e-05, + "loss": 0.3879, + "step": 5077 + }, + { + "epoch": 0.4, + "learning_rate": 1.3569661220547596e-05, + "loss": 0.3205, + "step": 5078 + }, + { + "epoch": 0.4, + "learning_rate": 1.3567264128336013e-05, + "loss": 0.2917, + "step": 5079 + }, + { + "epoch": 0.4, + "learning_rate": 1.3564866801237254e-05, + "loss": 0.383, + "step": 5080 + }, + { + "epoch": 0.4, + "learning_rate": 1.3562469239409166e-05, + "loss": 0.2089, + "step": 5081 + }, + { + "epoch": 0.4, + "learning_rate": 1.3560071443009622e-05, + "loss": 0.3811, + "step": 5082 + }, + { + "epoch": 0.4, + "learning_rate": 1.3557673412196504e-05, + "loss": 0.4556, + "step": 5083 + }, + { + "epoch": 0.4, + "learning_rate": 1.3555275147127709e-05, + "loss": 0.3678, + "step": 5084 + }, + { + "epoch": 0.4, + "learning_rate": 1.3552876647961151e-05, + "loss": 0.3925, + "step": 5085 + }, + { + "epoch": 0.4, + "learning_rate": 1.3550477914854766e-05, + "loss": 0.442, + "step": 5086 + }, + { + "epoch": 0.4, + "learning_rate": 1.3548078947966487e-05, + "loss": 0.268, + "step": 5087 + }, + { + "epoch": 0.4, + "learning_rate": 1.3545679747454286e-05, + "loss": 0.2977, + "step": 5088 + }, + { + "epoch": 0.4, + "learning_rate": 1.3543280313476135e-05, + "loss": 0.3129, + "step": 5089 + }, + { + "epoch": 0.4, + "learning_rate": 1.3540880646190022e-05, + "loss": 0.346, + "step": 5090 + }, + { + "epoch": 0.4, + "learning_rate": 1.353848074575396e-05, + "loss": 0.4168, + "step": 5091 + }, + { + "epoch": 0.4, + "learning_rate": 1.3536080612325963e-05, + "loss": 0.3633, + "step": 5092 + }, + { + "epoch": 0.4, + "learning_rate": 1.3533680246064073e-05, + "loss": 0.4731, + "step": 5093 + }, + { + "epoch": 0.4, + "learning_rate": 1.3531279647126342e-05, + "loss": 0.3556, + "step": 5094 + }, + { + "epoch": 0.4, + "learning_rate": 1.352887881567084e-05, + "loss": 0.3649, + "step": 5095 + }, + { + "epoch": 0.4, + "learning_rate": 1.3526477751855645e-05, + "loss": 0.4077, + "step": 5096 + }, + { + "epoch": 0.4, + "learning_rate": 1.3524076455838859e-05, + "loss": 0.256, + "step": 5097 + }, + { + "epoch": 0.4, + "learning_rate": 1.3521674927778594e-05, + "loss": 0.3344, + "step": 5098 + }, + { + "epoch": 0.4, + "learning_rate": 1.3519273167832982e-05, + "loss": 0.4215, + "step": 5099 + }, + { + "epoch": 0.4, + "learning_rate": 1.3516871176160166e-05, + "loss": 0.402, + "step": 5100 + }, + { + "epoch": 0.4, + "learning_rate": 1.3514468952918303e-05, + "loss": 0.3407, + "step": 5101 + }, + { + "epoch": 0.4, + "learning_rate": 1.3512066498265572e-05, + "loss": 0.3815, + "step": 5102 + }, + { + "epoch": 0.4, + "learning_rate": 1.3509663812360161e-05, + "loss": 0.3408, + "step": 5103 + }, + { + "epoch": 0.4, + "learning_rate": 1.3507260895360274e-05, + "loss": 0.3832, + "step": 5104 + }, + { + "epoch": 0.4, + "learning_rate": 1.3504857747424133e-05, + "loss": 0.3679, + "step": 5105 + }, + { + "epoch": 0.4, + "learning_rate": 1.3502454368709973e-05, + "loss": 0.3091, + "step": 5106 + }, + { + "epoch": 0.4, + "learning_rate": 1.3500050759376052e-05, + "loss": 0.4196, + "step": 5107 + }, + { + "epoch": 0.4, + "learning_rate": 1.3497646919580623e-05, + "loss": 0.47, + "step": 5108 + }, + { + "epoch": 0.4, + "learning_rate": 1.3495242849481973e-05, + "loss": 0.3409, + "step": 5109 + }, + { + "epoch": 0.4, + "learning_rate": 1.3492838549238406e-05, + "loss": 0.3569, + "step": 5110 + }, + { + "epoch": 0.4, + "learning_rate": 1.349043401900822e-05, + "loss": 0.3869, + "step": 5111 + }, + { + "epoch": 0.4, + "learning_rate": 1.348802925894975e-05, + "loss": 0.3979, + "step": 5112 + }, + { + "epoch": 0.41, + "learning_rate": 1.348562426922134e-05, + "loss": 0.3447, + "step": 5113 + }, + { + "epoch": 0.41, + "learning_rate": 1.3483219049981343e-05, + "loss": 0.312, + "step": 5114 + }, + { + "epoch": 0.41, + "learning_rate": 1.348081360138813e-05, + "loss": 0.3813, + "step": 5115 + }, + { + "epoch": 0.41, + "learning_rate": 1.347840792360009e-05, + "loss": 0.2951, + "step": 5116 + }, + { + "epoch": 0.41, + "learning_rate": 1.3476002016775626e-05, + "loss": 0.3804, + "step": 5117 + }, + { + "epoch": 0.41, + "learning_rate": 1.3473595881073154e-05, + "loss": 0.3221, + "step": 5118 + }, + { + "epoch": 0.41, + "learning_rate": 1.3471189516651108e-05, + "loss": 0.3316, + "step": 5119 + }, + { + "epoch": 0.41, + "learning_rate": 1.3468782923667936e-05, + "loss": 0.283, + "step": 5120 + }, + { + "epoch": 0.41, + "learning_rate": 1.3466376102282098e-05, + "loss": 0.3349, + "step": 5121 + }, + { + "epoch": 0.41, + "learning_rate": 1.3463969052652073e-05, + "loss": 0.3842, + "step": 5122 + }, + { + "epoch": 0.41, + "learning_rate": 1.3461561774936352e-05, + "loss": 0.3214, + "step": 5123 + }, + { + "epoch": 0.41, + "learning_rate": 1.3459154269293443e-05, + "loss": 0.3654, + "step": 5124 + }, + { + "epoch": 0.41, + "learning_rate": 1.3456746535881872e-05, + "loss": 0.4484, + "step": 5125 + }, + { + "epoch": 0.41, + "learning_rate": 1.3454338574860175e-05, + "loss": 0.2819, + "step": 5126 + }, + { + "epoch": 0.41, + "learning_rate": 1.3451930386386902e-05, + "loss": 0.3465, + "step": 5127 + }, + { + "epoch": 0.41, + "learning_rate": 1.3449521970620624e-05, + "loss": 0.3072, + "step": 5128 + }, + { + "epoch": 0.41, + "learning_rate": 1.3447113327719923e-05, + "loss": 0.3414, + "step": 5129 + }, + { + "epoch": 0.41, + "learning_rate": 1.3444704457843393e-05, + "loss": 0.3416, + "step": 5130 + }, + { + "epoch": 0.41, + "learning_rate": 1.3442295361149651e-05, + "loss": 0.3675, + "step": 5131 + }, + { + "epoch": 0.41, + "learning_rate": 1.3439886037797326e-05, + "loss": 0.3338, + "step": 5132 + }, + { + "epoch": 0.41, + "learning_rate": 1.3437476487945051e-05, + "loss": 0.3553, + "step": 5133 + }, + { + "epoch": 0.41, + "learning_rate": 1.3435066711751494e-05, + "loss": 0.3714, + "step": 5134 + }, + { + "epoch": 0.41, + "learning_rate": 1.343265670937532e-05, + "loss": 0.3376, + "step": 5135 + }, + { + "epoch": 0.41, + "learning_rate": 1.3430246480975218e-05, + "loss": 0.3246, + "step": 5136 + }, + { + "epoch": 0.41, + "learning_rate": 1.3427836026709892e-05, + "loss": 0.4196, + "step": 5137 + }, + { + "epoch": 0.41, + "learning_rate": 1.3425425346738057e-05, + "loss": 0.3053, + "step": 5138 + }, + { + "epoch": 0.41, + "learning_rate": 1.3423014441218444e-05, + "loss": 0.3926, + "step": 5139 + }, + { + "epoch": 0.41, + "learning_rate": 1.3420603310309805e-05, + "loss": 0.2733, + "step": 5140 + }, + { + "epoch": 0.41, + "learning_rate": 1.3418191954170892e-05, + "loss": 0.2588, + "step": 5141 + }, + { + "epoch": 0.41, + "learning_rate": 1.341578037296049e-05, + "loss": 0.2329, + "step": 5142 + }, + { + "epoch": 0.41, + "learning_rate": 1.3413368566837384e-05, + "loss": 0.43, + "step": 5143 + }, + { + "epoch": 0.41, + "learning_rate": 1.341095653596038e-05, + "loss": 0.3449, + "step": 5144 + }, + { + "epoch": 0.41, + "learning_rate": 1.3408544280488305e-05, + "loss": 0.3874, + "step": 5145 + }, + { + "epoch": 0.41, + "learning_rate": 1.3406131800579985e-05, + "loss": 0.3314, + "step": 5146 + }, + { + "epoch": 0.41, + "learning_rate": 1.3403719096394276e-05, + "loss": 0.3499, + "step": 5147 + }, + { + "epoch": 0.41, + "learning_rate": 1.3401306168090047e-05, + "loss": 0.3197, + "step": 5148 + }, + { + "epoch": 0.41, + "learning_rate": 1.3398893015826166e-05, + "loss": 0.3974, + "step": 5149 + }, + { + "epoch": 0.41, + "learning_rate": 1.3396479639761541e-05, + "loss": 0.3676, + "step": 5150 + }, + { + "epoch": 0.41, + "learning_rate": 1.3394066040055071e-05, + "loss": 0.3875, + "step": 5151 + }, + { + "epoch": 0.41, + "learning_rate": 1.3391652216865682e-05, + "loss": 0.4386, + "step": 5152 + }, + { + "epoch": 0.41, + "learning_rate": 1.3389238170352318e-05, + "loss": 0.3634, + "step": 5153 + }, + { + "epoch": 0.41, + "learning_rate": 1.3386823900673926e-05, + "loss": 0.264, + "step": 5154 + }, + { + "epoch": 0.41, + "learning_rate": 1.3384409407989475e-05, + "loss": 0.3957, + "step": 5155 + }, + { + "epoch": 0.41, + "learning_rate": 1.3381994692457956e-05, + "loss": 0.3161, + "step": 5156 + }, + { + "epoch": 0.41, + "learning_rate": 1.3379579754238354e-05, + "loss": 0.3689, + "step": 5157 + }, + { + "epoch": 0.41, + "learning_rate": 1.3377164593489687e-05, + "loss": 0.3886, + "step": 5158 + }, + { + "epoch": 0.41, + "learning_rate": 1.3374749210370983e-05, + "loss": 0.3731, + "step": 5159 + }, + { + "epoch": 0.41, + "learning_rate": 1.3372333605041282e-05, + "loss": 0.3798, + "step": 5160 + }, + { + "epoch": 0.41, + "learning_rate": 1.3369917777659638e-05, + "loss": 0.4551, + "step": 5161 + }, + { + "epoch": 0.41, + "learning_rate": 1.3367501728385124e-05, + "loss": 0.2819, + "step": 5162 + }, + { + "epoch": 0.41, + "learning_rate": 1.3365085457376823e-05, + "loss": 0.3245, + "step": 5163 + }, + { + "epoch": 0.41, + "learning_rate": 1.336266896479384e-05, + "loss": 0.3311, + "step": 5164 + }, + { + "epoch": 0.41, + "learning_rate": 1.3360252250795282e-05, + "loss": 0.3493, + "step": 5165 + }, + { + "epoch": 0.41, + "learning_rate": 1.3357835315540281e-05, + "loss": 0.3402, + "step": 5166 + }, + { + "epoch": 0.41, + "learning_rate": 1.3355418159187988e-05, + "loss": 0.3362, + "step": 5167 + }, + { + "epoch": 0.41, + "learning_rate": 1.335300078189755e-05, + "loss": 0.4208, + "step": 5168 + }, + { + "epoch": 0.41, + "learning_rate": 1.3350583183828143e-05, + "loss": 0.28, + "step": 5169 + }, + { + "epoch": 0.41, + "learning_rate": 1.3348165365138956e-05, + "loss": 0.3419, + "step": 5170 + }, + { + "epoch": 0.41, + "learning_rate": 1.3345747325989188e-05, + "loss": 0.2931, + "step": 5171 + }, + { + "epoch": 0.41, + "learning_rate": 1.3343329066538064e-05, + "loss": 0.3547, + "step": 5172 + }, + { + "epoch": 0.41, + "learning_rate": 1.3340910586944805e-05, + "loss": 0.2756, + "step": 5173 + }, + { + "epoch": 0.41, + "learning_rate": 1.3338491887368656e-05, + "loss": 0.3734, + "step": 5174 + }, + { + "epoch": 0.41, + "learning_rate": 1.3336072967968882e-05, + "loss": 0.4773, + "step": 5175 + }, + { + "epoch": 0.41, + "learning_rate": 1.3333653828904755e-05, + "loss": 0.3503, + "step": 5176 + }, + { + "epoch": 0.41, + "learning_rate": 1.3331234470335566e-05, + "loss": 0.4078, + "step": 5177 + }, + { + "epoch": 0.41, + "learning_rate": 1.3328814892420613e-05, + "loss": 0.3166, + "step": 5178 + }, + { + "epoch": 0.41, + "learning_rate": 1.3326395095319218e-05, + "loss": 0.3823, + "step": 5179 + }, + { + "epoch": 0.41, + "learning_rate": 1.3323975079190713e-05, + "loss": 0.3007, + "step": 5180 + }, + { + "epoch": 0.41, + "learning_rate": 1.332155484419444e-05, + "loss": 0.4479, + "step": 5181 + }, + { + "epoch": 0.41, + "learning_rate": 1.3319134390489765e-05, + "loss": 0.4114, + "step": 5182 + }, + { + "epoch": 0.41, + "learning_rate": 1.3316713718236061e-05, + "loss": 0.4063, + "step": 5183 + }, + { + "epoch": 0.41, + "learning_rate": 1.3314292827592716e-05, + "loss": 0.3937, + "step": 5184 + }, + { + "epoch": 0.41, + "learning_rate": 1.3311871718719137e-05, + "loss": 0.3766, + "step": 5185 + }, + { + "epoch": 0.41, + "learning_rate": 1.330945039177474e-05, + "loss": 0.276, + "step": 5186 + }, + { + "epoch": 0.41, + "learning_rate": 1.3307028846918958e-05, + "loss": 0.3387, + "step": 5187 + }, + { + "epoch": 0.41, + "learning_rate": 1.3304607084311246e-05, + "loss": 0.3723, + "step": 5188 + }, + { + "epoch": 0.41, + "learning_rate": 1.3302185104111049e-05, + "loss": 0.3827, + "step": 5189 + }, + { + "epoch": 0.41, + "learning_rate": 1.3299762906477855e-05, + "loss": 0.4115, + "step": 5190 + }, + { + "epoch": 0.41, + "learning_rate": 1.3297340491571153e-05, + "loss": 0.3383, + "step": 5191 + }, + { + "epoch": 0.41, + "learning_rate": 1.3294917859550444e-05, + "loss": 0.4235, + "step": 5192 + }, + { + "epoch": 0.41, + "learning_rate": 1.3292495010575249e-05, + "loss": 0.2795, + "step": 5193 + }, + { + "epoch": 0.41, + "learning_rate": 1.3290071944805099e-05, + "loss": 0.302, + "step": 5194 + }, + { + "epoch": 0.41, + "learning_rate": 1.3287648662399544e-05, + "loss": 0.4427, + "step": 5195 + }, + { + "epoch": 0.41, + "learning_rate": 1.3285225163518141e-05, + "loss": 0.4431, + "step": 5196 + }, + { + "epoch": 0.41, + "learning_rate": 1.328280144832047e-05, + "loss": 0.436, + "step": 5197 + }, + { + "epoch": 0.41, + "learning_rate": 1.3280377516966118e-05, + "loss": 0.3819, + "step": 5198 + }, + { + "epoch": 0.41, + "learning_rate": 1.3277953369614696e-05, + "loss": 0.2755, + "step": 5199 + }, + { + "epoch": 0.41, + "learning_rate": 1.3275529006425808e-05, + "loss": 0.2902, + "step": 5200 + }, + { + "epoch": 0.41, + "learning_rate": 1.3273104427559102e-05, + "loss": 0.3079, + "step": 5201 + }, + { + "epoch": 0.41, + "learning_rate": 1.3270679633174219e-05, + "loss": 0.4273, + "step": 5202 + }, + { + "epoch": 0.41, + "learning_rate": 1.3268254623430817e-05, + "loss": 0.2498, + "step": 5203 + }, + { + "epoch": 0.41, + "learning_rate": 1.3265829398488576e-05, + "loss": 0.3444, + "step": 5204 + }, + { + "epoch": 0.41, + "learning_rate": 1.3263403958507181e-05, + "loss": 0.2573, + "step": 5205 + }, + { + "epoch": 0.41, + "learning_rate": 1.326097830364634e-05, + "loss": 0.4272, + "step": 5206 + }, + { + "epoch": 0.41, + "learning_rate": 1.3258552434065768e-05, + "loss": 0.4675, + "step": 5207 + }, + { + "epoch": 0.41, + "learning_rate": 1.3256126349925195e-05, + "loss": 0.3453, + "step": 5208 + }, + { + "epoch": 0.41, + "learning_rate": 1.3253700051384371e-05, + "loss": 0.4366, + "step": 5209 + }, + { + "epoch": 0.41, + "learning_rate": 1.3251273538603056e-05, + "loss": 0.3482, + "step": 5210 + }, + { + "epoch": 0.41, + "learning_rate": 1.3248846811741021e-05, + "loss": 0.4109, + "step": 5211 + }, + { + "epoch": 0.41, + "learning_rate": 1.3246419870958056e-05, + "loss": 0.3043, + "step": 5212 + }, + { + "epoch": 0.41, + "learning_rate": 1.3243992716413962e-05, + "loss": 0.4203, + "step": 5213 + }, + { + "epoch": 0.41, + "learning_rate": 1.324156534826856e-05, + "loss": 0.3634, + "step": 5214 + }, + { + "epoch": 0.41, + "learning_rate": 1.3239137766681675e-05, + "loss": 0.2449, + "step": 5215 + }, + { + "epoch": 0.41, + "learning_rate": 1.3236709971813153e-05, + "loss": 0.3647, + "step": 5216 + }, + { + "epoch": 0.41, + "learning_rate": 1.3234281963822856e-05, + "loss": 0.361, + "step": 5217 + }, + { + "epoch": 0.41, + "learning_rate": 1.3231853742870652e-05, + "loss": 0.3476, + "step": 5218 + }, + { + "epoch": 0.41, + "learning_rate": 1.322942530911643e-05, + "loss": 0.3543, + "step": 5219 + }, + { + "epoch": 0.41, + "learning_rate": 1.3226996662720094e-05, + "loss": 0.3812, + "step": 5220 + }, + { + "epoch": 0.41, + "learning_rate": 1.322456780384155e-05, + "loss": 0.4101, + "step": 5221 + }, + { + "epoch": 0.41, + "learning_rate": 1.3222138732640732e-05, + "loss": 0.2842, + "step": 5222 + }, + { + "epoch": 0.41, + "learning_rate": 1.3219709449277584e-05, + "loss": 0.3271, + "step": 5223 + }, + { + "epoch": 0.41, + "learning_rate": 1.3217279953912061e-05, + "loss": 0.4094, + "step": 5224 + }, + { + "epoch": 0.41, + "learning_rate": 1.3214850246704134e-05, + "loss": 0.3867, + "step": 5225 + }, + { + "epoch": 0.41, + "learning_rate": 1.3212420327813789e-05, + "loss": 0.3365, + "step": 5226 + }, + { + "epoch": 0.41, + "learning_rate": 1.3209990197401016e-05, + "loss": 0.3885, + "step": 5227 + }, + { + "epoch": 0.41, + "learning_rate": 1.3207559855625842e-05, + "loss": 0.3665, + "step": 5228 + }, + { + "epoch": 0.41, + "learning_rate": 1.3205129302648282e-05, + "loss": 0.3577, + "step": 5229 + }, + { + "epoch": 0.41, + "learning_rate": 1.3202698538628376e-05, + "loss": 0.3349, + "step": 5230 + }, + { + "epoch": 0.41, + "learning_rate": 1.3200267563726187e-05, + "loss": 0.4518, + "step": 5231 + }, + { + "epoch": 0.41, + "learning_rate": 1.3197836378101773e-05, + "loss": 0.4965, + "step": 5232 + }, + { + "epoch": 0.41, + "learning_rate": 1.3195404981915223e-05, + "loss": 0.3897, + "step": 5233 + }, + { + "epoch": 0.41, + "learning_rate": 1.3192973375326635e-05, + "loss": 0.4954, + "step": 5234 + }, + { + "epoch": 0.41, + "learning_rate": 1.3190541558496106e-05, + "loss": 0.3597, + "step": 5235 + }, + { + "epoch": 0.41, + "learning_rate": 1.318810953158377e-05, + "loss": 0.3572, + "step": 5236 + }, + { + "epoch": 0.41, + "learning_rate": 1.3185677294749763e-05, + "loss": 0.3596, + "step": 5237 + }, + { + "epoch": 0.41, + "learning_rate": 1.3183244848154232e-05, + "loss": 0.3843, + "step": 5238 + }, + { + "epoch": 0.42, + "learning_rate": 1.3180812191957346e-05, + "loss": 0.4429, + "step": 5239 + }, + { + "epoch": 0.42, + "learning_rate": 1.3178379326319284e-05, + "loss": 0.3929, + "step": 5240 + }, + { + "epoch": 0.42, + "learning_rate": 1.3175946251400234e-05, + "loss": 0.4192, + "step": 5241 + }, + { + "epoch": 0.42, + "learning_rate": 1.3173512967360406e-05, + "loss": 0.2738, + "step": 5242 + }, + { + "epoch": 0.42, + "learning_rate": 1.317107947436002e-05, + "loss": 0.4174, + "step": 5243 + }, + { + "epoch": 0.42, + "learning_rate": 1.3168645772559308e-05, + "loss": 0.3821, + "step": 5244 + }, + { + "epoch": 0.42, + "learning_rate": 1.3166211862118519e-05, + "loss": 0.2907, + "step": 5245 + }, + { + "epoch": 0.42, + "learning_rate": 1.3163777743197912e-05, + "loss": 0.2763, + "step": 5246 + }, + { + "epoch": 0.42, + "learning_rate": 1.3161343415957767e-05, + "loss": 0.3538, + "step": 5247 + }, + { + "epoch": 0.42, + "learning_rate": 1.3158908880558366e-05, + "loss": 0.2216, + "step": 5248 + }, + { + "epoch": 0.42, + "learning_rate": 1.3156474137160015e-05, + "loss": 0.3691, + "step": 5249 + }, + { + "epoch": 0.42, + "learning_rate": 1.3154039185923034e-05, + "loss": 0.421, + "step": 5250 + }, + { + "epoch": 0.42, + "learning_rate": 1.3151604027007744e-05, + "loss": 0.4256, + "step": 5251 + }, + { + "epoch": 0.42, + "learning_rate": 1.3149168660574495e-05, + "loss": 0.3696, + "step": 5252 + }, + { + "epoch": 0.42, + "learning_rate": 1.3146733086783646e-05, + "loss": 0.4181, + "step": 5253 + }, + { + "epoch": 0.42, + "learning_rate": 1.3144297305795559e-05, + "loss": 0.3301, + "step": 5254 + }, + { + "epoch": 0.42, + "learning_rate": 1.3141861317770628e-05, + "loss": 0.3021, + "step": 5255 + }, + { + "epoch": 0.42, + "learning_rate": 1.3139425122869244e-05, + "loss": 0.398, + "step": 5256 + }, + { + "epoch": 0.42, + "learning_rate": 1.3136988721251823e-05, + "loss": 0.4028, + "step": 5257 + }, + { + "epoch": 0.42, + "learning_rate": 1.3134552113078788e-05, + "loss": 0.4318, + "step": 5258 + }, + { + "epoch": 0.42, + "learning_rate": 1.3132115298510579e-05, + "loss": 0.4789, + "step": 5259 + }, + { + "epoch": 0.42, + "learning_rate": 1.312967827770765e-05, + "loss": 0.4304, + "step": 5260 + }, + { + "epoch": 0.42, + "learning_rate": 1.3127241050830463e-05, + "loss": 0.3595, + "step": 5261 + }, + { + "epoch": 0.42, + "learning_rate": 1.3124803618039501e-05, + "loss": 0.3274, + "step": 5262 + }, + { + "epoch": 0.42, + "learning_rate": 1.3122365979495259e-05, + "loss": 0.4052, + "step": 5263 + }, + { + "epoch": 0.42, + "learning_rate": 1.3119928135358238e-05, + "loss": 0.3875, + "step": 5264 + }, + { + "epoch": 0.42, + "learning_rate": 1.3117490085788963e-05, + "loss": 0.3756, + "step": 5265 + }, + { + "epoch": 0.42, + "learning_rate": 1.3115051830947966e-05, + "loss": 0.3906, + "step": 5266 + }, + { + "epoch": 0.42, + "learning_rate": 1.3112613370995792e-05, + "loss": 0.3168, + "step": 5267 + }, + { + "epoch": 0.42, + "learning_rate": 1.3110174706093007e-05, + "loss": 0.4175, + "step": 5268 + }, + { + "epoch": 0.42, + "learning_rate": 1.3107735836400184e-05, + "loss": 0.3586, + "step": 5269 + }, + { + "epoch": 0.42, + "learning_rate": 1.3105296762077906e-05, + "loss": 0.3186, + "step": 5270 + }, + { + "epoch": 0.42, + "learning_rate": 1.3102857483286781e-05, + "loss": 0.2678, + "step": 5271 + }, + { + "epoch": 0.42, + "learning_rate": 1.310041800018742e-05, + "loss": 0.3142, + "step": 5272 + }, + { + "epoch": 0.42, + "learning_rate": 1.3097978312940453e-05, + "loss": 0.4013, + "step": 5273 + }, + { + "epoch": 0.42, + "learning_rate": 1.309553842170652e-05, + "loss": 0.3973, + "step": 5274 + }, + { + "epoch": 0.42, + "learning_rate": 1.3093098326646277e-05, + "loss": 0.3381, + "step": 5275 + }, + { + "epoch": 0.42, + "learning_rate": 1.3090658027920391e-05, + "loss": 0.2881, + "step": 5276 + }, + { + "epoch": 0.42, + "learning_rate": 1.3088217525689546e-05, + "loss": 0.4984, + "step": 5277 + }, + { + "epoch": 0.42, + "learning_rate": 1.3085776820114435e-05, + "loss": 0.4206, + "step": 5278 + }, + { + "epoch": 0.42, + "learning_rate": 1.3083335911355768e-05, + "loss": 0.3932, + "step": 5279 + }, + { + "epoch": 0.42, + "learning_rate": 1.3080894799574271e-05, + "loss": 0.3715, + "step": 5280 + }, + { + "epoch": 0.42, + "learning_rate": 1.3078453484930674e-05, + "loss": 0.3689, + "step": 5281 + }, + { + "epoch": 0.42, + "learning_rate": 1.3076011967585727e-05, + "loss": 0.3178, + "step": 5282 + }, + { + "epoch": 0.42, + "learning_rate": 1.3073570247700192e-05, + "loss": 0.4263, + "step": 5283 + }, + { + "epoch": 0.42, + "learning_rate": 1.3071128325434845e-05, + "loss": 0.4102, + "step": 5284 + }, + { + "epoch": 0.42, + "learning_rate": 1.3068686200950475e-05, + "loss": 0.323, + "step": 5285 + }, + { + "epoch": 0.42, + "learning_rate": 1.3066243874407886e-05, + "loss": 0.3231, + "step": 5286 + }, + { + "epoch": 0.42, + "learning_rate": 1.306380134596789e-05, + "loss": 0.3132, + "step": 5287 + }, + { + "epoch": 0.42, + "learning_rate": 1.306135861579132e-05, + "loss": 0.379, + "step": 5288 + }, + { + "epoch": 0.42, + "learning_rate": 1.3058915684039013e-05, + "loss": 0.376, + "step": 5289 + }, + { + "epoch": 0.42, + "learning_rate": 1.3056472550871829e-05, + "loss": 0.2503, + "step": 5290 + }, + { + "epoch": 0.42, + "learning_rate": 1.3054029216450632e-05, + "loss": 0.4658, + "step": 5291 + }, + { + "epoch": 0.42, + "learning_rate": 1.3051585680936305e-05, + "loss": 0.4932, + "step": 5292 + }, + { + "epoch": 0.42, + "learning_rate": 1.304914194448975e-05, + "loss": 0.3252, + "step": 5293 + }, + { + "epoch": 0.42, + "learning_rate": 1.3046698007271864e-05, + "loss": 0.3698, + "step": 5294 + }, + { + "epoch": 0.42, + "learning_rate": 1.3044253869443575e-05, + "loss": 0.3003, + "step": 5295 + }, + { + "epoch": 0.42, + "learning_rate": 1.3041809531165819e-05, + "loss": 0.2754, + "step": 5296 + }, + { + "epoch": 0.42, + "learning_rate": 1.3039364992599538e-05, + "loss": 0.4447, + "step": 5297 + }, + { + "epoch": 0.42, + "learning_rate": 1.30369202539057e-05, + "loss": 0.4115, + "step": 5298 + }, + { + "epoch": 0.42, + "learning_rate": 1.3034475315245273e-05, + "loss": 0.354, + "step": 5299 + }, + { + "epoch": 0.42, + "learning_rate": 1.303203017677925e-05, + "loss": 0.3021, + "step": 5300 + }, + { + "epoch": 0.42, + "learning_rate": 1.302958483866863e-05, + "loss": 0.4179, + "step": 5301 + }, + { + "epoch": 0.42, + "learning_rate": 1.3027139301074423e-05, + "loss": 0.4454, + "step": 5302 + }, + { + "epoch": 0.42, + "learning_rate": 1.3024693564157658e-05, + "loss": 0.3512, + "step": 5303 + }, + { + "epoch": 0.42, + "learning_rate": 1.3022247628079381e-05, + "loss": 0.4157, + "step": 5304 + }, + { + "epoch": 0.42, + "learning_rate": 1.3019801493000634e-05, + "loss": 0.376, + "step": 5305 + }, + { + "epoch": 0.42, + "learning_rate": 1.3017355159082495e-05, + "loss": 0.3913, + "step": 5306 + }, + { + "epoch": 0.42, + "learning_rate": 1.3014908626486032e-05, + "loss": 0.3676, + "step": 5307 + }, + { + "epoch": 0.42, + "learning_rate": 1.3012461895372343e-05, + "loss": 0.2352, + "step": 5308 + }, + { + "epoch": 0.42, + "learning_rate": 1.3010014965902535e-05, + "loss": 0.315, + "step": 5309 + }, + { + "epoch": 0.42, + "learning_rate": 1.3007567838237725e-05, + "loss": 0.3674, + "step": 5310 + }, + { + "epoch": 0.42, + "learning_rate": 1.3005120512539042e-05, + "loss": 0.4, + "step": 5311 + }, + { + "epoch": 0.42, + "learning_rate": 1.300267298896764e-05, + "loss": 0.394, + "step": 5312 + }, + { + "epoch": 0.42, + "learning_rate": 1.3000225267684663e-05, + "loss": 0.4545, + "step": 5313 + }, + { + "epoch": 0.42, + "learning_rate": 1.2997777348851288e-05, + "loss": 0.3956, + "step": 5314 + }, + { + "epoch": 0.42, + "learning_rate": 1.2995329232628702e-05, + "loss": 0.3353, + "step": 5315 + }, + { + "epoch": 0.42, + "learning_rate": 1.2992880919178097e-05, + "loss": 0.369, + "step": 5316 + }, + { + "epoch": 0.42, + "learning_rate": 1.2990432408660682e-05, + "loss": 0.2961, + "step": 5317 + }, + { + "epoch": 0.42, + "learning_rate": 1.2987983701237688e-05, + "loss": 0.4089, + "step": 5318 + }, + { + "epoch": 0.42, + "learning_rate": 1.298553479707034e-05, + "loss": 0.4283, + "step": 5319 + }, + { + "epoch": 0.42, + "learning_rate": 1.2983085696319892e-05, + "loss": 0.3955, + "step": 5320 + }, + { + "epoch": 0.42, + "learning_rate": 1.2980636399147606e-05, + "loss": 0.3531, + "step": 5321 + }, + { + "epoch": 0.42, + "learning_rate": 1.2978186905714752e-05, + "loss": 0.3677, + "step": 5322 + }, + { + "epoch": 0.42, + "learning_rate": 1.2975737216182625e-05, + "loss": 0.4386, + "step": 5323 + }, + { + "epoch": 0.42, + "learning_rate": 1.2973287330712516e-05, + "loss": 0.3441, + "step": 5324 + }, + { + "epoch": 0.42, + "learning_rate": 1.2970837249465746e-05, + "loss": 0.3392, + "step": 5325 + }, + { + "epoch": 0.42, + "learning_rate": 1.2968386972603635e-05, + "loss": 0.5178, + "step": 5326 + }, + { + "epoch": 0.42, + "learning_rate": 1.2965936500287526e-05, + "loss": 0.2961, + "step": 5327 + }, + { + "epoch": 0.42, + "learning_rate": 1.2963485832678772e-05, + "loss": 0.2352, + "step": 5328 + }, + { + "epoch": 0.42, + "learning_rate": 1.2961034969938732e-05, + "loss": 0.2472, + "step": 5329 + }, + { + "epoch": 0.42, + "learning_rate": 1.2958583912228785e-05, + "loss": 0.4243, + "step": 5330 + }, + { + "epoch": 0.42, + "learning_rate": 1.295613265971033e-05, + "loss": 0.297, + "step": 5331 + }, + { + "epoch": 0.42, + "learning_rate": 1.2953681212544757e-05, + "loss": 0.4237, + "step": 5332 + }, + { + "epoch": 0.42, + "learning_rate": 1.2951229570893493e-05, + "loss": 0.3313, + "step": 5333 + }, + { + "epoch": 0.42, + "learning_rate": 1.2948777734917961e-05, + "loss": 0.3711, + "step": 5334 + }, + { + "epoch": 0.42, + "learning_rate": 1.2946325704779602e-05, + "loss": 0.4003, + "step": 5335 + }, + { + "epoch": 0.42, + "learning_rate": 1.2943873480639875e-05, + "loss": 0.3898, + "step": 5336 + }, + { + "epoch": 0.42, + "learning_rate": 1.294142106266024e-05, + "loss": 0.4002, + "step": 5337 + }, + { + "epoch": 0.42, + "learning_rate": 1.2938968451002183e-05, + "loss": 0.4224, + "step": 5338 + }, + { + "epoch": 0.42, + "learning_rate": 1.2936515645827198e-05, + "loss": 0.4207, + "step": 5339 + }, + { + "epoch": 0.42, + "learning_rate": 1.2934062647296783e-05, + "loss": 0.3584, + "step": 5340 + }, + { + "epoch": 0.42, + "learning_rate": 1.2931609455572462e-05, + "loss": 0.3527, + "step": 5341 + }, + { + "epoch": 0.42, + "learning_rate": 1.2929156070815765e-05, + "loss": 0.2631, + "step": 5342 + }, + { + "epoch": 0.42, + "learning_rate": 1.2926702493188235e-05, + "loss": 0.4247, + "step": 5343 + }, + { + "epoch": 0.42, + "learning_rate": 1.292424872285143e-05, + "loss": 0.2773, + "step": 5344 + }, + { + "epoch": 0.42, + "learning_rate": 1.2921794759966913e-05, + "loss": 0.3802, + "step": 5345 + }, + { + "epoch": 0.42, + "learning_rate": 1.2919340604696272e-05, + "loss": 0.381, + "step": 5346 + }, + { + "epoch": 0.42, + "learning_rate": 1.29168862572011e-05, + "loss": 0.4436, + "step": 5347 + }, + { + "epoch": 0.42, + "learning_rate": 1.2914431717643e-05, + "loss": 0.3065, + "step": 5348 + }, + { + "epoch": 0.42, + "learning_rate": 1.2911976986183598e-05, + "loss": 0.3583, + "step": 5349 + }, + { + "epoch": 0.42, + "learning_rate": 1.2909522062984524e-05, + "loss": 0.4104, + "step": 5350 + }, + { + "epoch": 0.42, + "learning_rate": 1.290706694820742e-05, + "loss": 0.3587, + "step": 5351 + }, + { + "epoch": 0.42, + "learning_rate": 1.2904611642013945e-05, + "loss": 0.3286, + "step": 5352 + }, + { + "epoch": 0.42, + "learning_rate": 1.2902156144565769e-05, + "loss": 0.3404, + "step": 5353 + }, + { + "epoch": 0.42, + "learning_rate": 1.2899700456024576e-05, + "loss": 0.3095, + "step": 5354 + }, + { + "epoch": 0.42, + "learning_rate": 1.2897244576552062e-05, + "loss": 0.3611, + "step": 5355 + }, + { + "epoch": 0.42, + "learning_rate": 1.289478850630993e-05, + "loss": 0.4431, + "step": 5356 + }, + { + "epoch": 0.42, + "learning_rate": 1.2892332245459904e-05, + "loss": 0.3473, + "step": 5357 + }, + { + "epoch": 0.42, + "learning_rate": 1.288987579416372e-05, + "loss": 0.3306, + "step": 5358 + }, + { + "epoch": 0.42, + "learning_rate": 1.2887419152583117e-05, + "loss": 0.2653, + "step": 5359 + }, + { + "epoch": 0.42, + "learning_rate": 1.2884962320879857e-05, + "loss": 0.4562, + "step": 5360 + }, + { + "epoch": 0.42, + "learning_rate": 1.2882505299215711e-05, + "loss": 0.4973, + "step": 5361 + }, + { + "epoch": 0.42, + "learning_rate": 1.288004808775246e-05, + "loss": 0.4, + "step": 5362 + }, + { + "epoch": 0.42, + "learning_rate": 1.28775906866519e-05, + "loss": 0.2134, + "step": 5363 + }, + { + "epoch": 0.42, + "learning_rate": 1.2875133096075839e-05, + "loss": 0.3946, + "step": 5364 + }, + { + "epoch": 0.43, + "learning_rate": 1.2872675316186096e-05, + "loss": 0.3794, + "step": 5365 + }, + { + "epoch": 0.43, + "learning_rate": 1.2870217347144511e-05, + "loss": 0.4004, + "step": 5366 + }, + { + "epoch": 0.43, + "learning_rate": 1.2867759189112921e-05, + "loss": 0.3621, + "step": 5367 + }, + { + "epoch": 0.43, + "learning_rate": 1.2865300842253188e-05, + "loss": 0.2139, + "step": 5368 + }, + { + "epoch": 0.43, + "learning_rate": 1.2862842306727181e-05, + "loss": 0.2876, + "step": 5369 + }, + { + "epoch": 0.43, + "learning_rate": 1.2860383582696783e-05, + "loss": 0.3578, + "step": 5370 + }, + { + "epoch": 0.43, + "learning_rate": 1.2857924670323892e-05, + "loss": 0.3658, + "step": 5371 + }, + { + "epoch": 0.43, + "learning_rate": 1.2855465569770407e-05, + "loss": 0.2953, + "step": 5372 + }, + { + "epoch": 0.43, + "learning_rate": 1.2853006281198257e-05, + "loss": 0.3372, + "step": 5373 + }, + { + "epoch": 0.43, + "learning_rate": 1.2850546804769372e-05, + "loss": 0.4334, + "step": 5374 + }, + { + "epoch": 0.43, + "learning_rate": 1.2848087140645695e-05, + "loss": 0.4221, + "step": 5375 + }, + { + "epoch": 0.43, + "learning_rate": 1.2845627288989186e-05, + "loss": 0.2837, + "step": 5376 + }, + { + "epoch": 0.43, + "learning_rate": 1.284316724996181e-05, + "loss": 0.3907, + "step": 5377 + }, + { + "epoch": 0.43, + "learning_rate": 1.2840707023725552e-05, + "loss": 0.457, + "step": 5378 + }, + { + "epoch": 0.43, + "learning_rate": 1.2838246610442406e-05, + "loss": 0.2965, + "step": 5379 + }, + { + "epoch": 0.43, + "learning_rate": 1.2835786010274376e-05, + "loss": 0.3025, + "step": 5380 + }, + { + "epoch": 0.43, + "learning_rate": 1.283332522338348e-05, + "loss": 0.2684, + "step": 5381 + }, + { + "epoch": 0.43, + "learning_rate": 1.2830864249931756e-05, + "loss": 0.3933, + "step": 5382 + }, + { + "epoch": 0.43, + "learning_rate": 1.2828403090081238e-05, + "loss": 0.3838, + "step": 5383 + }, + { + "epoch": 0.43, + "learning_rate": 1.282594174399399e-05, + "loss": 0.3944, + "step": 5384 + }, + { + "epoch": 0.43, + "learning_rate": 1.2823480211832073e-05, + "loss": 0.2757, + "step": 5385 + }, + { + "epoch": 0.43, + "learning_rate": 1.2821018493757569e-05, + "loss": 0.3086, + "step": 5386 + }, + { + "epoch": 0.43, + "learning_rate": 1.2818556589932575e-05, + "loss": 0.4134, + "step": 5387 + }, + { + "epoch": 0.43, + "learning_rate": 1.2816094500519188e-05, + "loss": 0.3948, + "step": 5388 + }, + { + "epoch": 0.43, + "learning_rate": 1.2813632225679528e-05, + "loss": 0.3508, + "step": 5389 + }, + { + "epoch": 0.43, + "learning_rate": 1.281116976557573e-05, + "loss": 0.3566, + "step": 5390 + }, + { + "epoch": 0.43, + "learning_rate": 1.2808707120369923e-05, + "loss": 0.3488, + "step": 5391 + }, + { + "epoch": 0.43, + "learning_rate": 1.280624429022427e-05, + "loss": 0.3425, + "step": 5392 + }, + { + "epoch": 0.43, + "learning_rate": 1.2803781275300933e-05, + "loss": 0.3714, + "step": 5393 + }, + { + "epoch": 0.43, + "learning_rate": 1.2801318075762088e-05, + "loss": 0.3638, + "step": 5394 + }, + { + "epoch": 0.43, + "learning_rate": 1.2798854691769927e-05, + "loss": 0.3249, + "step": 5395 + }, + { + "epoch": 0.43, + "learning_rate": 1.2796391123486654e-05, + "loss": 0.2984, + "step": 5396 + }, + { + "epoch": 0.43, + "learning_rate": 1.2793927371074477e-05, + "loss": 0.358, + "step": 5397 + }, + { + "epoch": 0.43, + "learning_rate": 1.279146343469563e-05, + "loss": 0.2948, + "step": 5398 + }, + { + "epoch": 0.43, + "learning_rate": 1.2788999314512347e-05, + "loss": 0.3053, + "step": 5399 + }, + { + "epoch": 0.43, + "learning_rate": 1.2786535010686879e-05, + "loss": 0.2545, + "step": 5400 + }, + { + "epoch": 0.43, + "learning_rate": 1.2784070523381487e-05, + "loss": 0.3147, + "step": 5401 + }, + { + "epoch": 0.43, + "learning_rate": 1.2781605852758448e-05, + "loss": 0.2404, + "step": 5402 + }, + { + "epoch": 0.43, + "learning_rate": 1.2779140998980048e-05, + "loss": 0.355, + "step": 5403 + }, + { + "epoch": 0.43, + "learning_rate": 1.2776675962208585e-05, + "loss": 0.3971, + "step": 5404 + }, + { + "epoch": 0.43, + "learning_rate": 1.2774210742606368e-05, + "loss": 0.3243, + "step": 5405 + }, + { + "epoch": 0.43, + "learning_rate": 1.2771745340335726e-05, + "loss": 0.4171, + "step": 5406 + }, + { + "epoch": 0.43, + "learning_rate": 1.276927975555899e-05, + "loss": 0.3057, + "step": 5407 + }, + { + "epoch": 0.43, + "learning_rate": 1.2766813988438505e-05, + "loss": 0.3955, + "step": 5408 + }, + { + "epoch": 0.43, + "learning_rate": 1.2764348039136634e-05, + "loss": 0.3615, + "step": 5409 + }, + { + "epoch": 0.43, + "learning_rate": 1.2761881907815744e-05, + "loss": 0.4471, + "step": 5410 + }, + { + "epoch": 0.43, + "learning_rate": 1.275941559463822e-05, + "loss": 0.361, + "step": 5411 + }, + { + "epoch": 0.43, + "learning_rate": 1.2756949099766458e-05, + "loss": 0.3648, + "step": 5412 + }, + { + "epoch": 0.43, + "learning_rate": 1.2754482423362861e-05, + "loss": 0.2874, + "step": 5413 + }, + { + "epoch": 0.43, + "learning_rate": 1.2752015565589852e-05, + "loss": 0.3625, + "step": 5414 + }, + { + "epoch": 0.43, + "learning_rate": 1.2749548526609858e-05, + "loss": 0.3875, + "step": 5415 + }, + { + "epoch": 0.43, + "learning_rate": 1.2747081306585325e-05, + "loss": 0.4194, + "step": 5416 + }, + { + "epoch": 0.43, + "learning_rate": 1.2744613905678707e-05, + "loss": 0.4238, + "step": 5417 + }, + { + "epoch": 0.43, + "learning_rate": 1.2742146324052466e-05, + "loss": 0.3241, + "step": 5418 + }, + { + "epoch": 0.43, + "learning_rate": 1.273967856186909e-05, + "loss": 0.3855, + "step": 5419 + }, + { + "epoch": 0.43, + "learning_rate": 1.2737210619291058e-05, + "loss": 0.3483, + "step": 5420 + }, + { + "epoch": 0.43, + "learning_rate": 1.2734742496480878e-05, + "loss": 0.4058, + "step": 5421 + }, + { + "epoch": 0.43, + "learning_rate": 1.2732274193601066e-05, + "loss": 0.5001, + "step": 5422 + }, + { + "epoch": 0.43, + "learning_rate": 1.2729805710814142e-05, + "loss": 0.337, + "step": 5423 + }, + { + "epoch": 0.43, + "learning_rate": 1.2727337048282649e-05, + "loss": 0.4653, + "step": 5424 + }, + { + "epoch": 0.43, + "learning_rate": 1.2724868206169134e-05, + "loss": 0.3336, + "step": 5425 + }, + { + "epoch": 0.43, + "learning_rate": 1.2722399184636158e-05, + "loss": 0.4364, + "step": 5426 + }, + { + "epoch": 0.43, + "learning_rate": 1.2719929983846298e-05, + "loss": 0.3127, + "step": 5427 + }, + { + "epoch": 0.43, + "learning_rate": 1.2717460603962132e-05, + "loss": 0.3992, + "step": 5428 + }, + { + "epoch": 0.43, + "learning_rate": 1.2714991045146265e-05, + "loss": 0.4503, + "step": 5429 + }, + { + "epoch": 0.43, + "learning_rate": 1.2712521307561298e-05, + "loss": 0.3589, + "step": 5430 + }, + { + "epoch": 0.43, + "learning_rate": 1.2710051391369857e-05, + "loss": 0.3118, + "step": 5431 + }, + { + "epoch": 0.43, + "learning_rate": 1.270758129673457e-05, + "loss": 0.3584, + "step": 5432 + }, + { + "epoch": 0.43, + "learning_rate": 1.2705111023818083e-05, + "loss": 0.375, + "step": 5433 + }, + { + "epoch": 0.43, + "learning_rate": 1.2702640572783051e-05, + "loss": 0.2881, + "step": 5434 + }, + { + "epoch": 0.43, + "learning_rate": 1.2700169943792143e-05, + "loss": 0.4272, + "step": 5435 + }, + { + "epoch": 0.43, + "learning_rate": 1.2697699137008038e-05, + "loss": 0.2536, + "step": 5436 + }, + { + "epoch": 0.43, + "learning_rate": 1.2695228152593419e-05, + "loss": 0.3671, + "step": 5437 + }, + { + "epoch": 0.43, + "learning_rate": 1.2692756990710998e-05, + "loss": 0.4139, + "step": 5438 + }, + { + "epoch": 0.43, + "learning_rate": 1.269028565152349e-05, + "loss": 0.3324, + "step": 5439 + }, + { + "epoch": 0.43, + "learning_rate": 1.2687814135193613e-05, + "loss": 0.2832, + "step": 5440 + }, + { + "epoch": 0.43, + "learning_rate": 1.2685342441884107e-05, + "loss": 0.3699, + "step": 5441 + }, + { + "epoch": 0.43, + "learning_rate": 1.2682870571757724e-05, + "loss": 0.5151, + "step": 5442 + }, + { + "epoch": 0.43, + "learning_rate": 1.2680398524977222e-05, + "loss": 0.4251, + "step": 5443 + }, + { + "epoch": 0.43, + "learning_rate": 1.2677926301705376e-05, + "loss": 0.4011, + "step": 5444 + }, + { + "epoch": 0.43, + "learning_rate": 1.2675453902104967e-05, + "loss": 0.4112, + "step": 5445 + }, + { + "epoch": 0.43, + "learning_rate": 1.2672981326338793e-05, + "loss": 0.3314, + "step": 5446 + }, + { + "epoch": 0.43, + "learning_rate": 1.267050857456966e-05, + "loss": 0.4001, + "step": 5447 + }, + { + "epoch": 0.43, + "learning_rate": 1.2668035646960384e-05, + "loss": 0.3733, + "step": 5448 + }, + { + "epoch": 0.43, + "learning_rate": 1.2665562543673803e-05, + "loss": 0.3591, + "step": 5449 + }, + { + "epoch": 0.43, + "learning_rate": 1.2663089264872751e-05, + "loss": 0.2957, + "step": 5450 + }, + { + "epoch": 0.43, + "learning_rate": 1.2660615810720087e-05, + "loss": 0.3155, + "step": 5451 + }, + { + "epoch": 0.43, + "learning_rate": 1.2658142181378675e-05, + "loss": 0.3059, + "step": 5452 + }, + { + "epoch": 0.43, + "learning_rate": 1.2655668377011387e-05, + "loss": 0.384, + "step": 5453 + }, + { + "epoch": 0.43, + "learning_rate": 1.2653194397781117e-05, + "loss": 0.4159, + "step": 5454 + }, + { + "epoch": 0.43, + "learning_rate": 1.2650720243850762e-05, + "loss": 0.4287, + "step": 5455 + }, + { + "epoch": 0.43, + "learning_rate": 1.2648245915383233e-05, + "loss": 0.4761, + "step": 5456 + }, + { + "epoch": 0.43, + "learning_rate": 1.2645771412541455e-05, + "loss": 0.3686, + "step": 5457 + }, + { + "epoch": 0.43, + "learning_rate": 1.2643296735488355e-05, + "loss": 0.3459, + "step": 5458 + }, + { + "epoch": 0.43, + "learning_rate": 1.2640821884386887e-05, + "loss": 0.4036, + "step": 5459 + }, + { + "epoch": 0.43, + "learning_rate": 1.2638346859400006e-05, + "loss": 0.4454, + "step": 5460 + }, + { + "epoch": 0.43, + "learning_rate": 1.2635871660690677e-05, + "loss": 0.3897, + "step": 5461 + }, + { + "epoch": 0.43, + "learning_rate": 1.2633396288421884e-05, + "loss": 0.4526, + "step": 5462 + }, + { + "epoch": 0.43, + "learning_rate": 1.2630920742756616e-05, + "loss": 0.2968, + "step": 5463 + }, + { + "epoch": 0.43, + "learning_rate": 1.2628445023857875e-05, + "loss": 0.4422, + "step": 5464 + }, + { + "epoch": 0.43, + "learning_rate": 1.2625969131888677e-05, + "loss": 0.3906, + "step": 5465 + }, + { + "epoch": 0.43, + "learning_rate": 1.2623493067012047e-05, + "loss": 0.3354, + "step": 5466 + }, + { + "epoch": 0.43, + "learning_rate": 1.2621016829391022e-05, + "loss": 0.195, + "step": 5467 + }, + { + "epoch": 0.43, + "learning_rate": 1.2618540419188654e-05, + "loss": 0.3906, + "step": 5468 + }, + { + "epoch": 0.43, + "learning_rate": 1.2616063836567994e-05, + "loss": 0.333, + "step": 5469 + }, + { + "epoch": 0.43, + "learning_rate": 1.2613587081692118e-05, + "loss": 0.3751, + "step": 5470 + }, + { + "epoch": 0.43, + "learning_rate": 1.2611110154724113e-05, + "loss": 0.5078, + "step": 5471 + }, + { + "epoch": 0.43, + "learning_rate": 1.2608633055827064e-05, + "loss": 0.4314, + "step": 5472 + }, + { + "epoch": 0.43, + "learning_rate": 1.260615578516408e-05, + "loss": 0.3141, + "step": 5473 + }, + { + "epoch": 0.43, + "learning_rate": 1.260367834289828e-05, + "loss": 0.4017, + "step": 5474 + }, + { + "epoch": 0.43, + "learning_rate": 1.2601200729192789e-05, + "loss": 0.4112, + "step": 5475 + }, + { + "epoch": 0.43, + "learning_rate": 1.2598722944210746e-05, + "loss": 0.3825, + "step": 5476 + }, + { + "epoch": 0.43, + "learning_rate": 1.25962449881153e-05, + "loss": 0.4936, + "step": 5477 + }, + { + "epoch": 0.43, + "learning_rate": 1.2593766861069615e-05, + "loss": 0.3892, + "step": 5478 + }, + { + "epoch": 0.43, + "learning_rate": 1.2591288563236864e-05, + "loss": 0.4561, + "step": 5479 + }, + { + "epoch": 0.43, + "learning_rate": 1.2588810094780227e-05, + "loss": 0.434, + "step": 5480 + }, + { + "epoch": 0.43, + "learning_rate": 1.2586331455862902e-05, + "loss": 0.3707, + "step": 5481 + }, + { + "epoch": 0.43, + "learning_rate": 1.2583852646648097e-05, + "loss": 0.3801, + "step": 5482 + }, + { + "epoch": 0.43, + "learning_rate": 1.2581373667299026e-05, + "loss": 0.3955, + "step": 5483 + }, + { + "epoch": 0.43, + "learning_rate": 1.257889451797892e-05, + "loss": 0.3381, + "step": 5484 + }, + { + "epoch": 0.43, + "learning_rate": 1.257641519885102e-05, + "loss": 0.3299, + "step": 5485 + }, + { + "epoch": 0.43, + "learning_rate": 1.2573935710078576e-05, + "loss": 0.3563, + "step": 5486 + }, + { + "epoch": 0.43, + "learning_rate": 1.2571456051824851e-05, + "loss": 0.3904, + "step": 5487 + }, + { + "epoch": 0.43, + "learning_rate": 1.2568976224253115e-05, + "loss": 0.2701, + "step": 5488 + }, + { + "epoch": 0.43, + "learning_rate": 1.256649622752666e-05, + "loss": 0.3697, + "step": 5489 + }, + { + "epoch": 0.43, + "learning_rate": 1.2564016061808774e-05, + "loss": 0.3199, + "step": 5490 + }, + { + "epoch": 0.44, + "learning_rate": 1.2561535727262769e-05, + "loss": 0.4109, + "step": 5491 + }, + { + "epoch": 0.44, + "learning_rate": 1.2559055224051963e-05, + "loss": 0.3729, + "step": 5492 + }, + { + "epoch": 0.44, + "learning_rate": 1.2556574552339682e-05, + "loss": 0.4298, + "step": 5493 + }, + { + "epoch": 0.44, + "learning_rate": 1.2554093712289267e-05, + "loss": 0.6414, + "step": 5494 + }, + { + "epoch": 0.44, + "learning_rate": 1.2551612704064074e-05, + "loss": 0.416, + "step": 5495 + }, + { + "epoch": 0.44, + "learning_rate": 1.2549131527827458e-05, + "loss": 0.3917, + "step": 5496 + }, + { + "epoch": 0.44, + "learning_rate": 1.2546650183742801e-05, + "loss": 0.3433, + "step": 5497 + }, + { + "epoch": 0.44, + "learning_rate": 1.254416867197348e-05, + "loss": 0.3756, + "step": 5498 + }, + { + "epoch": 0.44, + "learning_rate": 1.2541686992682896e-05, + "loss": 0.5008, + "step": 5499 + }, + { + "epoch": 0.44, + "learning_rate": 1.2539205146034452e-05, + "loss": 0.3377, + "step": 5500 + }, + { + "epoch": 0.44, + "learning_rate": 1.2536723132191566e-05, + "loss": 0.4052, + "step": 5501 + }, + { + "epoch": 0.44, + "learning_rate": 1.2534240951317669e-05, + "loss": 0.451, + "step": 5502 + }, + { + "epoch": 0.44, + "learning_rate": 1.25317586035762e-05, + "loss": 0.3645, + "step": 5503 + }, + { + "epoch": 0.44, + "learning_rate": 1.2529276089130607e-05, + "loss": 0.4054, + "step": 5504 + }, + { + "epoch": 0.44, + "learning_rate": 1.2526793408144355e-05, + "loss": 0.2882, + "step": 5505 + }, + { + "epoch": 0.44, + "learning_rate": 1.2524310560780914e-05, + "loss": 0.4327, + "step": 5506 + }, + { + "epoch": 0.44, + "learning_rate": 1.2521827547203773e-05, + "loss": 0.2672, + "step": 5507 + }, + { + "epoch": 0.44, + "learning_rate": 1.2519344367576418e-05, + "loss": 0.3035, + "step": 5508 + }, + { + "epoch": 0.44, + "learning_rate": 1.2516861022062361e-05, + "loss": 0.4183, + "step": 5509 + }, + { + "epoch": 0.44, + "learning_rate": 1.2514377510825113e-05, + "loss": 0.3573, + "step": 5510 + }, + { + "epoch": 0.44, + "learning_rate": 1.2511893834028209e-05, + "loss": 0.48, + "step": 5511 + }, + { + "epoch": 0.44, + "learning_rate": 1.2509409991835178e-05, + "loss": 0.3699, + "step": 5512 + }, + { + "epoch": 0.44, + "learning_rate": 1.2506925984409574e-05, + "loss": 0.4098, + "step": 5513 + }, + { + "epoch": 0.44, + "learning_rate": 1.250444181191496e-05, + "loss": 0.3579, + "step": 5514 + }, + { + "epoch": 0.44, + "learning_rate": 1.2501957474514898e-05, + "loss": 0.3325, + "step": 5515 + }, + { + "epoch": 0.44, + "learning_rate": 1.249947297237298e-05, + "loss": 0.3578, + "step": 5516 + }, + { + "epoch": 0.44, + "learning_rate": 1.249698830565279e-05, + "loss": 0.448, + "step": 5517 + }, + { + "epoch": 0.44, + "learning_rate": 1.2494503474517935e-05, + "loss": 0.2674, + "step": 5518 + }, + { + "epoch": 0.44, + "learning_rate": 1.2492018479132033e-05, + "loss": 0.276, + "step": 5519 + }, + { + "epoch": 0.44, + "learning_rate": 1.2489533319658703e-05, + "loss": 0.3776, + "step": 5520 + }, + { + "epoch": 0.44, + "learning_rate": 1.2487047996261578e-05, + "loss": 0.502, + "step": 5521 + }, + { + "epoch": 0.44, + "learning_rate": 1.2484562509104316e-05, + "loss": 0.445, + "step": 5522 + }, + { + "epoch": 0.44, + "learning_rate": 1.2482076858350564e-05, + "loss": 0.3403, + "step": 5523 + }, + { + "epoch": 0.44, + "learning_rate": 1.2479591044163997e-05, + "loss": 0.4892, + "step": 5524 + }, + { + "epoch": 0.44, + "learning_rate": 1.2477105066708286e-05, + "loss": 0.4507, + "step": 5525 + }, + { + "epoch": 0.44, + "learning_rate": 1.2474618926147129e-05, + "loss": 0.4032, + "step": 5526 + }, + { + "epoch": 0.44, + "learning_rate": 1.2472132622644222e-05, + "loss": 0.269, + "step": 5527 + }, + { + "epoch": 0.44, + "learning_rate": 1.2469646156363276e-05, + "loss": 0.4668, + "step": 5528 + }, + { + "epoch": 0.44, + "learning_rate": 1.2467159527468014e-05, + "loss": 0.4489, + "step": 5529 + }, + { + "epoch": 0.44, + "learning_rate": 1.246467273612217e-05, + "loss": 0.383, + "step": 5530 + }, + { + "epoch": 0.44, + "learning_rate": 1.2462185782489484e-05, + "loss": 0.4048, + "step": 5531 + }, + { + "epoch": 0.44, + "learning_rate": 1.2459698666733712e-05, + "loss": 0.3971, + "step": 5532 + }, + { + "epoch": 0.44, + "learning_rate": 1.2457211389018619e-05, + "loss": 0.4031, + "step": 5533 + }, + { + "epoch": 0.44, + "learning_rate": 1.2454723949507978e-05, + "loss": 0.397, + "step": 5534 + }, + { + "epoch": 0.44, + "learning_rate": 1.2452236348365579e-05, + "loss": 0.3294, + "step": 5535 + }, + { + "epoch": 0.44, + "learning_rate": 1.244974858575521e-05, + "loss": 0.3242, + "step": 5536 + }, + { + "epoch": 0.44, + "learning_rate": 1.2447260661840688e-05, + "loss": 0.4226, + "step": 5537 + }, + { + "epoch": 0.44, + "learning_rate": 1.2444772576785828e-05, + "loss": 0.4337, + "step": 5538 + }, + { + "epoch": 0.44, + "learning_rate": 1.2442284330754456e-05, + "loss": 0.4002, + "step": 5539 + }, + { + "epoch": 0.44, + "learning_rate": 1.2439795923910413e-05, + "loss": 0.3608, + "step": 5540 + }, + { + "epoch": 0.44, + "learning_rate": 1.2437307356417547e-05, + "loss": 0.4232, + "step": 5541 + }, + { + "epoch": 0.44, + "learning_rate": 1.2434818628439718e-05, + "loss": 0.3318, + "step": 5542 + }, + { + "epoch": 0.44, + "learning_rate": 1.24323297401408e-05, + "loss": 0.3963, + "step": 5543 + }, + { + "epoch": 0.44, + "learning_rate": 1.2429840691684672e-05, + "loss": 0.4844, + "step": 5544 + }, + { + "epoch": 0.44, + "learning_rate": 1.2427351483235224e-05, + "loss": 0.2929, + "step": 5545 + }, + { + "epoch": 0.44, + "learning_rate": 1.2424862114956367e-05, + "loss": 0.426, + "step": 5546 + }, + { + "epoch": 0.44, + "learning_rate": 1.2422372587012001e-05, + "loss": 0.4607, + "step": 5547 + }, + { + "epoch": 0.44, + "learning_rate": 1.2419882899566056e-05, + "loss": 0.3518, + "step": 5548 + }, + { + "epoch": 0.44, + "learning_rate": 1.241739305278247e-05, + "loss": 0.5226, + "step": 5549 + }, + { + "epoch": 0.44, + "learning_rate": 1.2414903046825178e-05, + "loss": 0.3716, + "step": 5550 + }, + { + "epoch": 0.44, + "learning_rate": 1.2412412881858142e-05, + "loss": 0.3663, + "step": 5551 + }, + { + "epoch": 0.44, + "learning_rate": 1.240992255804533e-05, + "loss": 0.2664, + "step": 5552 + }, + { + "epoch": 0.44, + "learning_rate": 1.2407432075550707e-05, + "loss": 0.3841, + "step": 5553 + }, + { + "epoch": 0.44, + "learning_rate": 1.2404941434538269e-05, + "loss": 0.3098, + "step": 5554 + }, + { + "epoch": 0.44, + "learning_rate": 1.2402450635172008e-05, + "loss": 0.5265, + "step": 5555 + }, + { + "epoch": 0.44, + "learning_rate": 1.2399959677615932e-05, + "loss": 0.2851, + "step": 5556 + }, + { + "epoch": 0.44, + "learning_rate": 1.239746856203406e-05, + "loss": 0.4619, + "step": 5557 + }, + { + "epoch": 0.44, + "learning_rate": 1.239497728859042e-05, + "loss": 0.4402, + "step": 5558 + }, + { + "epoch": 0.44, + "learning_rate": 1.2392485857449048e-05, + "loss": 0.4192, + "step": 5559 + }, + { + "epoch": 0.44, + "learning_rate": 1.2389994268773995e-05, + "loss": 0.3851, + "step": 5560 + }, + { + "epoch": 0.44, + "learning_rate": 1.238750252272932e-05, + "loss": 0.4208, + "step": 5561 + }, + { + "epoch": 0.44, + "learning_rate": 1.2385010619479093e-05, + "loss": 0.3893, + "step": 5562 + }, + { + "epoch": 0.44, + "learning_rate": 1.2382518559187389e-05, + "loss": 0.4184, + "step": 5563 + }, + { + "epoch": 0.44, + "learning_rate": 1.23800263420183e-05, + "loss": 0.3334, + "step": 5564 + }, + { + "epoch": 0.44, + "learning_rate": 1.2377533968135934e-05, + "loss": 0.419, + "step": 5565 + }, + { + "epoch": 0.44, + "learning_rate": 1.2375041437704394e-05, + "loss": 0.3938, + "step": 5566 + }, + { + "epoch": 0.44, + "learning_rate": 1.2372548750887805e-05, + "loss": 0.3714, + "step": 5567 + }, + { + "epoch": 0.44, + "learning_rate": 1.2370055907850293e-05, + "loss": 0.3404, + "step": 5568 + }, + { + "epoch": 0.44, + "learning_rate": 1.2367562908756005e-05, + "loss": 0.3726, + "step": 5569 + }, + { + "epoch": 0.44, + "learning_rate": 1.2365069753769092e-05, + "loss": 0.255, + "step": 5570 + }, + { + "epoch": 0.44, + "learning_rate": 1.2362576443053716e-05, + "loss": 0.3534, + "step": 5571 + }, + { + "epoch": 0.44, + "learning_rate": 1.2360082976774049e-05, + "loss": 0.4525, + "step": 5572 + }, + { + "epoch": 0.44, + "learning_rate": 1.2357589355094275e-05, + "loss": 0.2638, + "step": 5573 + }, + { + "epoch": 0.44, + "learning_rate": 1.2355095578178582e-05, + "loss": 0.3924, + "step": 5574 + }, + { + "epoch": 0.44, + "learning_rate": 1.2352601646191182e-05, + "loss": 0.3456, + "step": 5575 + }, + { + "epoch": 0.44, + "learning_rate": 1.235010755929628e-05, + "loss": 0.3017, + "step": 5576 + }, + { + "epoch": 0.44, + "learning_rate": 1.2347613317658105e-05, + "loss": 0.3475, + "step": 5577 + }, + { + "epoch": 0.44, + "learning_rate": 1.234511892144089e-05, + "loss": 0.4928, + "step": 5578 + }, + { + "epoch": 0.44, + "learning_rate": 1.2342624370808876e-05, + "loss": 0.3778, + "step": 5579 + }, + { + "epoch": 0.44, + "learning_rate": 1.2340129665926319e-05, + "loss": 0.2709, + "step": 5580 + }, + { + "epoch": 0.44, + "learning_rate": 1.2337634806957486e-05, + "loss": 0.3431, + "step": 5581 + }, + { + "epoch": 0.44, + "learning_rate": 1.2335139794066645e-05, + "loss": 0.3615, + "step": 5582 + }, + { + "epoch": 0.44, + "learning_rate": 1.2332644627418088e-05, + "loss": 0.3258, + "step": 5583 + }, + { + "epoch": 0.44, + "learning_rate": 1.2330149307176105e-05, + "loss": 0.3851, + "step": 5584 + }, + { + "epoch": 0.44, + "learning_rate": 1.2327653833505005e-05, + "loss": 0.323, + "step": 5585 + }, + { + "epoch": 0.44, + "learning_rate": 1.2325158206569095e-05, + "loss": 0.5329, + "step": 5586 + }, + { + "epoch": 0.44, + "learning_rate": 1.232266242653271e-05, + "loss": 0.3604, + "step": 5587 + }, + { + "epoch": 0.44, + "learning_rate": 1.2320166493560176e-05, + "loss": 0.417, + "step": 5588 + }, + { + "epoch": 0.44, + "learning_rate": 1.2317670407815844e-05, + "loss": 0.4215, + "step": 5589 + }, + { + "epoch": 0.44, + "learning_rate": 1.2315174169464068e-05, + "loss": 0.3232, + "step": 5590 + }, + { + "epoch": 0.44, + "learning_rate": 1.2312677778669211e-05, + "loss": 0.3444, + "step": 5591 + }, + { + "epoch": 0.44, + "learning_rate": 1.2310181235595652e-05, + "loss": 0.3915, + "step": 5592 + }, + { + "epoch": 0.44, + "learning_rate": 1.2307684540407775e-05, + "loss": 0.3538, + "step": 5593 + }, + { + "epoch": 0.44, + "learning_rate": 1.230518769326997e-05, + "loss": 0.3138, + "step": 5594 + }, + { + "epoch": 0.44, + "learning_rate": 1.2302690694346654e-05, + "loss": 0.2096, + "step": 5595 + }, + { + "epoch": 0.44, + "learning_rate": 1.230019354380223e-05, + "loss": 0.3122, + "step": 5596 + }, + { + "epoch": 0.44, + "learning_rate": 1.2297696241801133e-05, + "loss": 0.3021, + "step": 5597 + }, + { + "epoch": 0.44, + "learning_rate": 1.2295198788507794e-05, + "loss": 0.3452, + "step": 5598 + }, + { + "epoch": 0.44, + "learning_rate": 1.2292701184086656e-05, + "loss": 0.3758, + "step": 5599 + }, + { + "epoch": 0.44, + "learning_rate": 1.2290203428702178e-05, + "loss": 0.4003, + "step": 5600 + }, + { + "epoch": 0.44, + "learning_rate": 1.2287705522518824e-05, + "loss": 0.2911, + "step": 5601 + }, + { + "epoch": 0.44, + "learning_rate": 1.228520746570107e-05, + "loss": 0.3235, + "step": 5602 + }, + { + "epoch": 0.44, + "learning_rate": 1.22827092584134e-05, + "loss": 0.5061, + "step": 5603 + }, + { + "epoch": 0.44, + "learning_rate": 1.2280210900820309e-05, + "loss": 0.3749, + "step": 5604 + }, + { + "epoch": 0.44, + "learning_rate": 1.22777123930863e-05, + "loss": 0.3171, + "step": 5605 + }, + { + "epoch": 0.44, + "learning_rate": 1.227521373537589e-05, + "loss": 0.2968, + "step": 5606 + }, + { + "epoch": 0.44, + "learning_rate": 1.2272714927853604e-05, + "loss": 0.3497, + "step": 5607 + }, + { + "epoch": 0.44, + "learning_rate": 1.2270215970683977e-05, + "loss": 0.3511, + "step": 5608 + }, + { + "epoch": 0.44, + "learning_rate": 1.226771686403155e-05, + "loss": 0.4094, + "step": 5609 + }, + { + "epoch": 0.44, + "learning_rate": 1.2265217608060879e-05, + "loss": 0.333, + "step": 5610 + }, + { + "epoch": 0.44, + "learning_rate": 1.226271820293653e-05, + "loss": 0.3787, + "step": 5611 + }, + { + "epoch": 0.44, + "learning_rate": 1.2260218648823073e-05, + "loss": 0.3252, + "step": 5612 + }, + { + "epoch": 0.44, + "learning_rate": 1.2257718945885096e-05, + "loss": 0.3477, + "step": 5613 + }, + { + "epoch": 0.44, + "learning_rate": 1.2255219094287186e-05, + "loss": 0.4533, + "step": 5614 + }, + { + "epoch": 0.44, + "learning_rate": 1.225271909419395e-05, + "loss": 0.3295, + "step": 5615 + }, + { + "epoch": 0.44, + "learning_rate": 1.2250218945770005e-05, + "loss": 0.3028, + "step": 5616 + }, + { + "epoch": 0.44, + "learning_rate": 1.2247718649179966e-05, + "loss": 0.3657, + "step": 5617 + }, + { + "epoch": 0.45, + "learning_rate": 1.2245218204588474e-05, + "loss": 0.3551, + "step": 5618 + }, + { + "epoch": 0.45, + "learning_rate": 1.2242717612160163e-05, + "loss": 0.4386, + "step": 5619 + }, + { + "epoch": 0.45, + "learning_rate": 1.2240216872059687e-05, + "loss": 0.4251, + "step": 5620 + }, + { + "epoch": 0.45, + "learning_rate": 1.2237715984451713e-05, + "loss": 0.3309, + "step": 5621 + }, + { + "epoch": 0.45, + "learning_rate": 1.2235214949500906e-05, + "loss": 0.2828, + "step": 5622 + }, + { + "epoch": 0.45, + "learning_rate": 1.223271376737195e-05, + "loss": 0.3783, + "step": 5623 + }, + { + "epoch": 0.45, + "learning_rate": 1.2230212438229539e-05, + "loss": 0.3998, + "step": 5624 + }, + { + "epoch": 0.45, + "learning_rate": 1.2227710962238367e-05, + "loss": 0.3958, + "step": 5625 + }, + { + "epoch": 0.45, + "learning_rate": 1.2225209339563144e-05, + "loss": 0.4092, + "step": 5626 + }, + { + "epoch": 0.45, + "learning_rate": 1.22227075703686e-05, + "loss": 0.3437, + "step": 5627 + }, + { + "epoch": 0.45, + "learning_rate": 1.2220205654819453e-05, + "loss": 0.3143, + "step": 5628 + }, + { + "epoch": 0.45, + "learning_rate": 1.2217703593080445e-05, + "loss": 0.4502, + "step": 5629 + }, + { + "epoch": 0.45, + "learning_rate": 1.221520138531633e-05, + "loss": 0.3906, + "step": 5630 + }, + { + "epoch": 0.45, + "learning_rate": 1.2212699031691861e-05, + "loss": 0.2508, + "step": 5631 + }, + { + "epoch": 0.45, + "learning_rate": 1.221019653237181e-05, + "loss": 0.4246, + "step": 5632 + }, + { + "epoch": 0.45, + "learning_rate": 1.2207693887520949e-05, + "loss": 0.4111, + "step": 5633 + }, + { + "epoch": 0.45, + "learning_rate": 1.2205191097304067e-05, + "loss": 0.2757, + "step": 5634 + }, + { + "epoch": 0.45, + "learning_rate": 1.2202688161885967e-05, + "loss": 0.3613, + "step": 5635 + }, + { + "epoch": 0.45, + "learning_rate": 1.2200185081431446e-05, + "loss": 0.5181, + "step": 5636 + }, + { + "epoch": 0.45, + "learning_rate": 1.2197681856105326e-05, + "loss": 0.3646, + "step": 5637 + }, + { + "epoch": 0.45, + "learning_rate": 1.219517848607243e-05, + "loss": 0.4334, + "step": 5638 + }, + { + "epoch": 0.45, + "learning_rate": 1.2192674971497593e-05, + "loss": 0.334, + "step": 5639 + }, + { + "epoch": 0.45, + "learning_rate": 1.219017131254566e-05, + "loss": 0.3065, + "step": 5640 + }, + { + "epoch": 0.45, + "learning_rate": 1.2187667509381484e-05, + "loss": 0.3049, + "step": 5641 + }, + { + "epoch": 0.45, + "learning_rate": 1.2185163562169928e-05, + "loss": 0.2775, + "step": 5642 + }, + { + "epoch": 0.45, + "learning_rate": 1.2182659471075868e-05, + "loss": 0.3332, + "step": 5643 + }, + { + "epoch": 0.45, + "learning_rate": 1.2180155236264182e-05, + "loss": 0.2871, + "step": 5644 + }, + { + "epoch": 0.45, + "learning_rate": 1.2177650857899767e-05, + "loss": 0.3522, + "step": 5645 + }, + { + "epoch": 0.45, + "learning_rate": 1.217514633614752e-05, + "loss": 0.3951, + "step": 5646 + }, + { + "epoch": 0.45, + "learning_rate": 1.217264167117235e-05, + "loss": 0.3478, + "step": 5647 + }, + { + "epoch": 0.45, + "learning_rate": 1.2170136863139183e-05, + "loss": 0.4503, + "step": 5648 + }, + { + "epoch": 0.45, + "learning_rate": 1.2167631912212942e-05, + "loss": 0.5019, + "step": 5649 + }, + { + "epoch": 0.45, + "learning_rate": 1.2165126818558572e-05, + "loss": 0.2467, + "step": 5650 + }, + { + "epoch": 0.45, + "learning_rate": 1.2162621582341021e-05, + "loss": 0.3725, + "step": 5651 + }, + { + "epoch": 0.45, + "learning_rate": 1.2160116203725243e-05, + "loss": 0.3162, + "step": 5652 + }, + { + "epoch": 0.45, + "learning_rate": 1.2157610682876206e-05, + "loss": 0.3573, + "step": 5653 + }, + { + "epoch": 0.45, + "learning_rate": 1.2155105019958888e-05, + "loss": 0.2426, + "step": 5654 + }, + { + "epoch": 0.45, + "learning_rate": 1.2152599215138274e-05, + "loss": 0.3721, + "step": 5655 + }, + { + "epoch": 0.45, + "learning_rate": 1.215009326857936e-05, + "loss": 0.3645, + "step": 5656 + }, + { + "epoch": 0.45, + "learning_rate": 1.2147587180447149e-05, + "loss": 0.4197, + "step": 5657 + }, + { + "epoch": 0.45, + "learning_rate": 1.2145080950906656e-05, + "loss": 0.3068, + "step": 5658 + }, + { + "epoch": 0.45, + "learning_rate": 1.2142574580122903e-05, + "loss": 0.3792, + "step": 5659 + }, + { + "epoch": 0.45, + "learning_rate": 1.2140068068260923e-05, + "loss": 0.3809, + "step": 5660 + }, + { + "epoch": 0.45, + "learning_rate": 1.2137561415485761e-05, + "loss": 0.3664, + "step": 5661 + }, + { + "epoch": 0.45, + "learning_rate": 1.2135054621962464e-05, + "loss": 0.3696, + "step": 5662 + }, + { + "epoch": 0.45, + "learning_rate": 1.2132547687856093e-05, + "loss": 0.4266, + "step": 5663 + }, + { + "epoch": 0.45, + "learning_rate": 1.2130040613331717e-05, + "loss": 0.4078, + "step": 5664 + }, + { + "epoch": 0.45, + "learning_rate": 1.2127533398554417e-05, + "loss": 0.2492, + "step": 5665 + }, + { + "epoch": 0.45, + "learning_rate": 1.2125026043689278e-05, + "loss": 0.2655, + "step": 5666 + }, + { + "epoch": 0.45, + "learning_rate": 1.2122518548901401e-05, + "loss": 0.273, + "step": 5667 + }, + { + "epoch": 0.45, + "learning_rate": 1.2120010914355888e-05, + "loss": 0.424, + "step": 5668 + }, + { + "epoch": 0.45, + "learning_rate": 1.2117503140217858e-05, + "loss": 0.4382, + "step": 5669 + }, + { + "epoch": 0.45, + "learning_rate": 1.2114995226652437e-05, + "loss": 0.2138, + "step": 5670 + }, + { + "epoch": 0.45, + "learning_rate": 1.2112487173824755e-05, + "loss": 0.3565, + "step": 5671 + }, + { + "epoch": 0.45, + "learning_rate": 1.2109978981899956e-05, + "loss": 0.3466, + "step": 5672 + }, + { + "epoch": 0.45, + "learning_rate": 1.2107470651043198e-05, + "loss": 0.384, + "step": 5673 + }, + { + "epoch": 0.45, + "learning_rate": 1.2104962181419635e-05, + "loss": 0.48, + "step": 5674 + }, + { + "epoch": 0.45, + "learning_rate": 1.2102453573194442e-05, + "loss": 0.4515, + "step": 5675 + }, + { + "epoch": 0.45, + "learning_rate": 1.2099944826532796e-05, + "loss": 0.3057, + "step": 5676 + }, + { + "epoch": 0.45, + "learning_rate": 1.2097435941599886e-05, + "loss": 0.3002, + "step": 5677 + }, + { + "epoch": 0.45, + "learning_rate": 1.2094926918560917e-05, + "loss": 0.3972, + "step": 5678 + }, + { + "epoch": 0.45, + "learning_rate": 1.2092417757581085e-05, + "loss": 0.5161, + "step": 5679 + }, + { + "epoch": 0.45, + "learning_rate": 1.2089908458825614e-05, + "loss": 0.3298, + "step": 5680 + }, + { + "epoch": 0.45, + "learning_rate": 1.2087399022459729e-05, + "loss": 0.273, + "step": 5681 + }, + { + "epoch": 0.45, + "learning_rate": 1.208488944864866e-05, + "loss": 0.2247, + "step": 5682 + }, + { + "epoch": 0.45, + "learning_rate": 1.2082379737557655e-05, + "loss": 0.4293, + "step": 5683 + }, + { + "epoch": 0.45, + "learning_rate": 1.2079869889351961e-05, + "loss": 0.3721, + "step": 5684 + }, + { + "epoch": 0.45, + "learning_rate": 1.2077359904196841e-05, + "loss": 0.3712, + "step": 5685 + }, + { + "epoch": 0.45, + "learning_rate": 1.2074849782257572e-05, + "loss": 0.2925, + "step": 5686 + }, + { + "epoch": 0.45, + "learning_rate": 1.2072339523699426e-05, + "loss": 0.4053, + "step": 5687 + }, + { + "epoch": 0.45, + "learning_rate": 1.2069829128687693e-05, + "loss": 0.4258, + "step": 5688 + }, + { + "epoch": 0.45, + "learning_rate": 1.2067318597387672e-05, + "loss": 0.4224, + "step": 5689 + }, + { + "epoch": 0.45, + "learning_rate": 1.2064807929964668e-05, + "loss": 0.3947, + "step": 5690 + }, + { + "epoch": 0.45, + "learning_rate": 1.2062297126584e-05, + "loss": 0.2718, + "step": 5691 + }, + { + "epoch": 0.45, + "learning_rate": 1.2059786187410984e-05, + "loss": 0.3866, + "step": 5692 + }, + { + "epoch": 0.45, + "learning_rate": 1.2057275112610962e-05, + "loss": 0.309, + "step": 5693 + }, + { + "epoch": 0.45, + "learning_rate": 1.2054763902349273e-05, + "loss": 0.414, + "step": 5694 + }, + { + "epoch": 0.45, + "learning_rate": 1.2052252556791267e-05, + "loss": 0.4445, + "step": 5695 + }, + { + "epoch": 0.45, + "learning_rate": 1.2049741076102307e-05, + "loss": 0.3982, + "step": 5696 + }, + { + "epoch": 0.45, + "learning_rate": 1.2047229460447759e-05, + "loss": 0.3906, + "step": 5697 + }, + { + "epoch": 0.45, + "learning_rate": 1.2044717709993e-05, + "loss": 0.4323, + "step": 5698 + }, + { + "epoch": 0.45, + "learning_rate": 1.2042205824903419e-05, + "loss": 0.3424, + "step": 5699 + }, + { + "epoch": 0.45, + "learning_rate": 1.203969380534441e-05, + "loss": 0.3294, + "step": 5700 + }, + { + "epoch": 0.45, + "learning_rate": 1.2037181651481378e-05, + "loss": 0.2892, + "step": 5701 + }, + { + "epoch": 0.45, + "learning_rate": 1.2034669363479741e-05, + "loss": 0.2521, + "step": 5702 + }, + { + "epoch": 0.45, + "learning_rate": 1.2032156941504913e-05, + "loss": 0.4058, + "step": 5703 + }, + { + "epoch": 0.45, + "learning_rate": 1.2029644385722327e-05, + "loss": 0.4624, + "step": 5704 + }, + { + "epoch": 0.45, + "learning_rate": 1.2027131696297429e-05, + "loss": 0.3677, + "step": 5705 + }, + { + "epoch": 0.45, + "learning_rate": 1.202461887339566e-05, + "loss": 0.3915, + "step": 5706 + }, + { + "epoch": 0.45, + "learning_rate": 1.2022105917182478e-05, + "loss": 0.2922, + "step": 5707 + }, + { + "epoch": 0.45, + "learning_rate": 1.2019592827823354e-05, + "loss": 0.3048, + "step": 5708 + }, + { + "epoch": 0.45, + "learning_rate": 1.2017079605483758e-05, + "loss": 0.3323, + "step": 5709 + }, + { + "epoch": 0.45, + "learning_rate": 1.201456625032918e-05, + "loss": 0.2587, + "step": 5710 + }, + { + "epoch": 0.45, + "learning_rate": 1.2012052762525104e-05, + "loss": 0.4465, + "step": 5711 + }, + { + "epoch": 0.45, + "learning_rate": 1.2009539142237034e-05, + "loss": 0.3604, + "step": 5712 + }, + { + "epoch": 0.45, + "learning_rate": 1.2007025389630484e-05, + "loss": 0.4273, + "step": 5713 + }, + { + "epoch": 0.45, + "learning_rate": 1.2004511504870966e-05, + "loss": 0.3903, + "step": 5714 + }, + { + "epoch": 0.45, + "learning_rate": 1.2001997488124011e-05, + "loss": 0.3082, + "step": 5715 + }, + { + "epoch": 0.45, + "learning_rate": 1.1999483339555159e-05, + "loss": 0.3729, + "step": 5716 + }, + { + "epoch": 0.45, + "learning_rate": 1.1996969059329944e-05, + "loss": 0.3588, + "step": 5717 + }, + { + "epoch": 0.45, + "learning_rate": 1.1994454647613928e-05, + "loss": 0.3765, + "step": 5718 + }, + { + "epoch": 0.45, + "learning_rate": 1.199194010457267e-05, + "loss": 0.3711, + "step": 5719 + }, + { + "epoch": 0.45, + "learning_rate": 1.1989425430371739e-05, + "loss": 0.4567, + "step": 5720 + }, + { + "epoch": 0.45, + "learning_rate": 1.198691062517672e-05, + "loss": 0.4672, + "step": 5721 + }, + { + "epoch": 0.45, + "learning_rate": 1.1984395689153195e-05, + "loss": 0.2544, + "step": 5722 + }, + { + "epoch": 0.45, + "learning_rate": 1.1981880622466759e-05, + "loss": 0.2973, + "step": 5723 + }, + { + "epoch": 0.45, + "learning_rate": 1.1979365425283022e-05, + "loss": 0.4272, + "step": 5724 + }, + { + "epoch": 0.45, + "learning_rate": 1.1976850097767598e-05, + "loss": 0.421, + "step": 5725 + }, + { + "epoch": 0.45, + "learning_rate": 1.1974334640086104e-05, + "loss": 0.3879, + "step": 5726 + }, + { + "epoch": 0.45, + "learning_rate": 1.1971819052404177e-05, + "loss": 0.3314, + "step": 5727 + }, + { + "epoch": 0.45, + "learning_rate": 1.196930333488745e-05, + "loss": 0.3107, + "step": 5728 + }, + { + "epoch": 0.45, + "learning_rate": 1.1966787487701577e-05, + "loss": 0.3482, + "step": 5729 + }, + { + "epoch": 0.45, + "learning_rate": 1.1964271511012208e-05, + "loss": 0.3868, + "step": 5730 + }, + { + "epoch": 0.45, + "learning_rate": 1.1961755404985015e-05, + "loss": 0.4838, + "step": 5731 + }, + { + "epoch": 0.45, + "learning_rate": 1.1959239169785668e-05, + "loss": 0.4282, + "step": 5732 + }, + { + "epoch": 0.45, + "learning_rate": 1.1956722805579846e-05, + "loss": 0.2598, + "step": 5733 + }, + { + "epoch": 0.45, + "learning_rate": 1.1954206312533246e-05, + "loss": 0.2904, + "step": 5734 + }, + { + "epoch": 0.45, + "learning_rate": 1.1951689690811558e-05, + "loss": 0.4289, + "step": 5735 + }, + { + "epoch": 0.45, + "learning_rate": 1.1949172940580498e-05, + "loss": 0.4463, + "step": 5736 + }, + { + "epoch": 0.45, + "learning_rate": 1.1946656062005781e-05, + "loss": 0.3725, + "step": 5737 + }, + { + "epoch": 0.45, + "learning_rate": 1.1944139055253126e-05, + "loss": 0.4712, + "step": 5738 + }, + { + "epoch": 0.45, + "learning_rate": 1.1941621920488271e-05, + "loss": 0.4489, + "step": 5739 + }, + { + "epoch": 0.45, + "learning_rate": 1.1939104657876953e-05, + "loss": 0.4843, + "step": 5740 + }, + { + "epoch": 0.45, + "learning_rate": 1.1936587267584924e-05, + "loss": 0.3524, + "step": 5741 + }, + { + "epoch": 0.45, + "learning_rate": 1.193406974977794e-05, + "loss": 0.3591, + "step": 5742 + }, + { + "epoch": 0.45, + "learning_rate": 1.1931552104621776e-05, + "loss": 0.3706, + "step": 5743 + }, + { + "epoch": 0.46, + "learning_rate": 1.1929034332282192e-05, + "loss": 0.3305, + "step": 5744 + }, + { + "epoch": 0.46, + "learning_rate": 1.1926516432924984e-05, + "loss": 0.3921, + "step": 5745 + }, + { + "epoch": 0.46, + "learning_rate": 1.1923998406715937e-05, + "loss": 0.277, + "step": 5746 + }, + { + "epoch": 0.46, + "learning_rate": 1.1921480253820852e-05, + "loss": 0.3575, + "step": 5747 + }, + { + "epoch": 0.46, + "learning_rate": 1.1918961974405539e-05, + "loss": 0.3328, + "step": 5748 + }, + { + "epoch": 0.46, + "learning_rate": 1.1916443568635812e-05, + "loss": 0.2261, + "step": 5749 + }, + { + "epoch": 0.46, + "learning_rate": 1.1913925036677497e-05, + "loss": 0.3996, + "step": 5750 + }, + { + "epoch": 0.46, + "learning_rate": 1.191140637869643e-05, + "loss": 0.3383, + "step": 5751 + }, + { + "epoch": 0.46, + "learning_rate": 1.1908887594858447e-05, + "loss": 0.406, + "step": 5752 + }, + { + "epoch": 0.46, + "learning_rate": 1.1906368685329403e-05, + "loss": 0.4104, + "step": 5753 + }, + { + "epoch": 0.46, + "learning_rate": 1.1903849650275154e-05, + "loss": 0.3154, + "step": 5754 + }, + { + "epoch": 0.46, + "learning_rate": 1.1901330489861564e-05, + "loss": 0.4317, + "step": 5755 + }, + { + "epoch": 0.46, + "learning_rate": 1.1898811204254515e-05, + "loss": 0.4127, + "step": 5756 + }, + { + "epoch": 0.46, + "learning_rate": 1.189629179361988e-05, + "loss": 0.2542, + "step": 5757 + }, + { + "epoch": 0.46, + "learning_rate": 1.1893772258123554e-05, + "loss": 0.2998, + "step": 5758 + }, + { + "epoch": 0.46, + "learning_rate": 1.1891252597931441e-05, + "loss": 0.2479, + "step": 5759 + }, + { + "epoch": 0.46, + "learning_rate": 1.1888732813209442e-05, + "loss": 0.4307, + "step": 5760 + }, + { + "epoch": 0.46, + "learning_rate": 1.1886212904123477e-05, + "loss": 0.3399, + "step": 5761 + }, + { + "epoch": 0.46, + "learning_rate": 1.1883692870839466e-05, + "loss": 0.328, + "step": 5762 + }, + { + "epoch": 0.46, + "learning_rate": 1.1881172713523346e-05, + "loss": 0.3344, + "step": 5763 + }, + { + "epoch": 0.46, + "learning_rate": 1.1878652432341053e-05, + "loss": 0.4404, + "step": 5764 + }, + { + "epoch": 0.46, + "learning_rate": 1.1876132027458535e-05, + "loss": 0.4289, + "step": 5765 + }, + { + "epoch": 0.46, + "learning_rate": 1.1873611499041752e-05, + "loss": 0.3477, + "step": 5766 + }, + { + "epoch": 0.46, + "learning_rate": 1.1871090847256667e-05, + "loss": 0.3965, + "step": 5767 + }, + { + "epoch": 0.46, + "learning_rate": 1.1868570072269252e-05, + "loss": 0.3366, + "step": 5768 + }, + { + "epoch": 0.46, + "learning_rate": 1.186604917424549e-05, + "loss": 0.3745, + "step": 5769 + }, + { + "epoch": 0.46, + "learning_rate": 1.1863528153351369e-05, + "loss": 0.3541, + "step": 5770 + }, + { + "epoch": 0.46, + "learning_rate": 1.1861007009752884e-05, + "loss": 0.4605, + "step": 5771 + }, + { + "epoch": 0.46, + "learning_rate": 1.1858485743616044e-05, + "loss": 0.3892, + "step": 5772 + }, + { + "epoch": 0.46, + "learning_rate": 1.185596435510686e-05, + "loss": 0.2823, + "step": 5773 + }, + { + "epoch": 0.46, + "learning_rate": 1.1853442844391354e-05, + "loss": 0.3494, + "step": 5774 + }, + { + "epoch": 0.46, + "learning_rate": 1.1850921211635554e-05, + "loss": 0.3728, + "step": 5775 + }, + { + "epoch": 0.46, + "learning_rate": 1.1848399457005496e-05, + "loss": 0.3583, + "step": 5776 + }, + { + "epoch": 0.46, + "learning_rate": 1.1845877580667232e-05, + "loss": 0.3036, + "step": 5777 + }, + { + "epoch": 0.46, + "learning_rate": 1.1843355582786806e-05, + "loss": 0.3479, + "step": 5778 + }, + { + "epoch": 0.46, + "learning_rate": 1.1840833463530289e-05, + "loss": 0.4601, + "step": 5779 + }, + { + "epoch": 0.46, + "learning_rate": 1.1838311223063745e-05, + "loss": 0.3906, + "step": 5780 + }, + { + "epoch": 0.46, + "learning_rate": 1.1835788861553252e-05, + "loss": 0.4824, + "step": 5781 + }, + { + "epoch": 0.46, + "learning_rate": 1.1833266379164894e-05, + "loss": 0.328, + "step": 5782 + }, + { + "epoch": 0.46, + "learning_rate": 1.183074377606477e-05, + "loss": 0.2902, + "step": 5783 + }, + { + "epoch": 0.46, + "learning_rate": 1.1828221052418973e-05, + "loss": 0.3592, + "step": 5784 + }, + { + "epoch": 0.46, + "learning_rate": 1.182569820839362e-05, + "loss": 0.3746, + "step": 5785 + }, + { + "epoch": 0.46, + "learning_rate": 1.1823175244154823e-05, + "loss": 0.4296, + "step": 5786 + }, + { + "epoch": 0.46, + "learning_rate": 1.1820652159868706e-05, + "loss": 0.306, + "step": 5787 + }, + { + "epoch": 0.46, + "learning_rate": 1.1818128955701409e-05, + "loss": 0.2761, + "step": 5788 + }, + { + "epoch": 0.46, + "learning_rate": 1.1815605631819066e-05, + "loss": 0.3252, + "step": 5789 + }, + { + "epoch": 0.46, + "learning_rate": 1.181308218838783e-05, + "loss": 0.469, + "step": 5790 + }, + { + "epoch": 0.46, + "learning_rate": 1.1810558625573856e-05, + "loss": 0.3145, + "step": 5791 + }, + { + "epoch": 0.46, + "learning_rate": 1.1808034943543308e-05, + "loss": 0.3994, + "step": 5792 + }, + { + "epoch": 0.46, + "learning_rate": 1.1805511142462355e-05, + "loss": 0.3284, + "step": 5793 + }, + { + "epoch": 0.46, + "learning_rate": 1.1802987222497186e-05, + "loss": 0.2692, + "step": 5794 + }, + { + "epoch": 0.46, + "learning_rate": 1.1800463183813982e-05, + "loss": 0.4558, + "step": 5795 + }, + { + "epoch": 0.46, + "learning_rate": 1.1797939026578941e-05, + "loss": 0.4075, + "step": 5796 + }, + { + "epoch": 0.46, + "learning_rate": 1.1795414750958265e-05, + "loss": 0.4049, + "step": 5797 + }, + { + "epoch": 0.46, + "learning_rate": 1.1792890357118165e-05, + "loss": 0.4415, + "step": 5798 + }, + { + "epoch": 0.46, + "learning_rate": 1.1790365845224866e-05, + "loss": 0.3889, + "step": 5799 + }, + { + "epoch": 0.46, + "learning_rate": 1.1787841215444588e-05, + "loss": 0.4423, + "step": 5800 + }, + { + "epoch": 0.46, + "learning_rate": 1.1785316467943568e-05, + "loss": 0.3406, + "step": 5801 + }, + { + "epoch": 0.46, + "learning_rate": 1.1782791602888052e-05, + "loss": 0.4192, + "step": 5802 + }, + { + "epoch": 0.46, + "learning_rate": 1.1780266620444285e-05, + "loss": 0.2746, + "step": 5803 + }, + { + "epoch": 0.46, + "learning_rate": 1.1777741520778529e-05, + "loss": 0.3337, + "step": 5804 + }, + { + "epoch": 0.46, + "learning_rate": 1.1775216304057046e-05, + "loss": 0.4311, + "step": 5805 + }, + { + "epoch": 0.46, + "learning_rate": 1.1772690970446113e-05, + "loss": 0.3243, + "step": 5806 + }, + { + "epoch": 0.46, + "learning_rate": 1.177016552011201e-05, + "loss": 0.3326, + "step": 5807 + }, + { + "epoch": 0.46, + "learning_rate": 1.176763995322102e-05, + "loss": 0.2245, + "step": 5808 + }, + { + "epoch": 0.46, + "learning_rate": 1.1765114269939448e-05, + "loss": 0.3235, + "step": 5809 + }, + { + "epoch": 0.46, + "learning_rate": 1.1762588470433593e-05, + "loss": 0.3737, + "step": 5810 + }, + { + "epoch": 0.46, + "learning_rate": 1.176006255486977e-05, + "loss": 0.502, + "step": 5811 + }, + { + "epoch": 0.46, + "learning_rate": 1.1757536523414297e-05, + "loss": 0.3326, + "step": 5812 + }, + { + "epoch": 0.46, + "learning_rate": 1.1755010376233498e-05, + "loss": 0.4617, + "step": 5813 + }, + { + "epoch": 0.46, + "learning_rate": 1.175248411349371e-05, + "loss": 0.323, + "step": 5814 + }, + { + "epoch": 0.46, + "learning_rate": 1.1749957735361279e-05, + "loss": 0.4149, + "step": 5815 + }, + { + "epoch": 0.46, + "learning_rate": 1.174743124200255e-05, + "loss": 0.4073, + "step": 5816 + }, + { + "epoch": 0.46, + "learning_rate": 1.1744904633583883e-05, + "loss": 0.3038, + "step": 5817 + }, + { + "epoch": 0.46, + "learning_rate": 1.1742377910271638e-05, + "loss": 0.3544, + "step": 5818 + }, + { + "epoch": 0.46, + "learning_rate": 1.1739851072232195e-05, + "loss": 0.2898, + "step": 5819 + }, + { + "epoch": 0.46, + "learning_rate": 1.1737324119631927e-05, + "loss": 0.2871, + "step": 5820 + }, + { + "epoch": 0.46, + "learning_rate": 1.173479705263723e-05, + "loss": 0.416, + "step": 5821 + }, + { + "epoch": 0.46, + "learning_rate": 1.1732269871414492e-05, + "loss": 0.257, + "step": 5822 + }, + { + "epoch": 0.46, + "learning_rate": 1.1729742576130119e-05, + "loss": 0.4041, + "step": 5823 + }, + { + "epoch": 0.46, + "learning_rate": 1.1727215166950519e-05, + "loss": 0.3686, + "step": 5824 + }, + { + "epoch": 0.46, + "learning_rate": 1.172468764404211e-05, + "loss": 0.2834, + "step": 5825 + }, + { + "epoch": 0.46, + "learning_rate": 1.172216000757132e-05, + "loss": 0.3427, + "step": 5826 + }, + { + "epoch": 0.46, + "learning_rate": 1.1719632257704581e-05, + "loss": 0.2961, + "step": 5827 + }, + { + "epoch": 0.46, + "learning_rate": 1.171710439460833e-05, + "loss": 0.3286, + "step": 5828 + }, + { + "epoch": 0.46, + "learning_rate": 1.1714576418449017e-05, + "loss": 0.2613, + "step": 5829 + }, + { + "epoch": 0.46, + "learning_rate": 1.1712048329393097e-05, + "loss": 0.4251, + "step": 5830 + }, + { + "epoch": 0.46, + "learning_rate": 1.1709520127607035e-05, + "loss": 0.321, + "step": 5831 + }, + { + "epoch": 0.46, + "learning_rate": 1.1706991813257295e-05, + "loss": 0.2906, + "step": 5832 + }, + { + "epoch": 0.46, + "learning_rate": 1.1704463386510358e-05, + "loss": 0.3202, + "step": 5833 + }, + { + "epoch": 0.46, + "learning_rate": 1.170193484753271e-05, + "loss": 0.2212, + "step": 5834 + }, + { + "epoch": 0.46, + "learning_rate": 1.169940619649084e-05, + "loss": 0.406, + "step": 5835 + }, + { + "epoch": 0.46, + "learning_rate": 1.1696877433551248e-05, + "loss": 0.3583, + "step": 5836 + }, + { + "epoch": 0.46, + "learning_rate": 1.1694348558880447e-05, + "loss": 0.3048, + "step": 5837 + }, + { + "epoch": 0.46, + "learning_rate": 1.1691819572644941e-05, + "loss": 0.3965, + "step": 5838 + }, + { + "epoch": 0.46, + "learning_rate": 1.1689290475011258e-05, + "loss": 0.4148, + "step": 5839 + }, + { + "epoch": 0.46, + "learning_rate": 1.1686761266145926e-05, + "loss": 0.406, + "step": 5840 + }, + { + "epoch": 0.46, + "learning_rate": 1.1684231946215478e-05, + "loss": 0.2982, + "step": 5841 + }, + { + "epoch": 0.46, + "learning_rate": 1.1681702515386466e-05, + "loss": 0.4447, + "step": 5842 + }, + { + "epoch": 0.46, + "learning_rate": 1.167917297382543e-05, + "loss": 0.3023, + "step": 5843 + }, + { + "epoch": 0.46, + "learning_rate": 1.1676643321698934e-05, + "loss": 0.3534, + "step": 5844 + }, + { + "epoch": 0.46, + "learning_rate": 1.1674113559173548e-05, + "loss": 0.4657, + "step": 5845 + }, + { + "epoch": 0.46, + "learning_rate": 1.1671583686415833e-05, + "loss": 0.396, + "step": 5846 + }, + { + "epoch": 0.46, + "learning_rate": 1.1669053703592381e-05, + "loss": 0.3841, + "step": 5847 + }, + { + "epoch": 0.46, + "learning_rate": 1.1666523610869769e-05, + "loss": 0.4248, + "step": 5848 + }, + { + "epoch": 0.46, + "learning_rate": 1.1663993408414597e-05, + "loss": 0.358, + "step": 5849 + }, + { + "epoch": 0.46, + "learning_rate": 1.1661463096393468e-05, + "loss": 0.2983, + "step": 5850 + }, + { + "epoch": 0.46, + "learning_rate": 1.1658932674972985e-05, + "loss": 0.3636, + "step": 5851 + }, + { + "epoch": 0.46, + "learning_rate": 1.1656402144319772e-05, + "loss": 0.3123, + "step": 5852 + }, + { + "epoch": 0.46, + "learning_rate": 1.1653871504600445e-05, + "loss": 0.3208, + "step": 5853 + }, + { + "epoch": 0.46, + "learning_rate": 1.1651340755981634e-05, + "loss": 0.377, + "step": 5854 + }, + { + "epoch": 0.46, + "learning_rate": 1.1648809898629987e-05, + "loss": 0.3386, + "step": 5855 + }, + { + "epoch": 0.46, + "learning_rate": 1.1646278932712138e-05, + "loss": 0.3632, + "step": 5856 + }, + { + "epoch": 0.46, + "learning_rate": 1.1643747858394743e-05, + "loss": 0.3596, + "step": 5857 + }, + { + "epoch": 0.46, + "learning_rate": 1.1641216675844461e-05, + "loss": 0.3353, + "step": 5858 + }, + { + "epoch": 0.46, + "learning_rate": 1.1638685385227958e-05, + "loss": 0.3475, + "step": 5859 + }, + { + "epoch": 0.46, + "learning_rate": 1.1636153986711906e-05, + "loss": 0.4358, + "step": 5860 + }, + { + "epoch": 0.46, + "learning_rate": 1.163362248046299e-05, + "loss": 0.3068, + "step": 5861 + }, + { + "epoch": 0.46, + "learning_rate": 1.1631090866647891e-05, + "loss": 0.3529, + "step": 5862 + }, + { + "epoch": 0.46, + "learning_rate": 1.1628559145433308e-05, + "loss": 0.2837, + "step": 5863 + }, + { + "epoch": 0.46, + "learning_rate": 1.1626027316985942e-05, + "loss": 0.3371, + "step": 5864 + }, + { + "epoch": 0.46, + "learning_rate": 1.1623495381472499e-05, + "loss": 0.3887, + "step": 5865 + }, + { + "epoch": 0.46, + "learning_rate": 1.16209633390597e-05, + "loss": 0.2737, + "step": 5866 + }, + { + "epoch": 0.46, + "learning_rate": 1.161843118991426e-05, + "loss": 0.2311, + "step": 5867 + }, + { + "epoch": 0.46, + "learning_rate": 1.1615898934202917e-05, + "loss": 0.3283, + "step": 5868 + }, + { + "epoch": 0.46, + "learning_rate": 1.1613366572092404e-05, + "loss": 0.4271, + "step": 5869 + }, + { + "epoch": 0.47, + "learning_rate": 1.1610834103749465e-05, + "loss": 0.3591, + "step": 5870 + }, + { + "epoch": 0.47, + "learning_rate": 1.1608301529340848e-05, + "loss": 0.4016, + "step": 5871 + }, + { + "epoch": 0.47, + "learning_rate": 1.1605768849033318e-05, + "loss": 0.3216, + "step": 5872 + }, + { + "epoch": 0.47, + "learning_rate": 1.1603236062993635e-05, + "loss": 0.317, + "step": 5873 + }, + { + "epoch": 0.47, + "learning_rate": 1.1600703171388572e-05, + "loss": 0.452, + "step": 5874 + }, + { + "epoch": 0.47, + "learning_rate": 1.1598170174384907e-05, + "loss": 0.3232, + "step": 5875 + }, + { + "epoch": 0.47, + "learning_rate": 1.1595637072149424e-05, + "loss": 0.4459, + "step": 5876 + }, + { + "epoch": 0.47, + "learning_rate": 1.159310386484892e-05, + "loss": 0.3425, + "step": 5877 + }, + { + "epoch": 0.47, + "learning_rate": 1.159057055265019e-05, + "loss": 0.2788, + "step": 5878 + }, + { + "epoch": 0.47, + "learning_rate": 1.1588037135720043e-05, + "loss": 0.4464, + "step": 5879 + }, + { + "epoch": 0.47, + "learning_rate": 1.1585503614225292e-05, + "loss": 0.3051, + "step": 5880 + }, + { + "epoch": 0.47, + "learning_rate": 1.1582969988332757e-05, + "loss": 0.3578, + "step": 5881 + }, + { + "epoch": 0.47, + "learning_rate": 1.1580436258209266e-05, + "loss": 0.4095, + "step": 5882 + }, + { + "epoch": 0.47, + "learning_rate": 1.1577902424021653e-05, + "loss": 0.3379, + "step": 5883 + }, + { + "epoch": 0.47, + "learning_rate": 1.1575368485936752e-05, + "loss": 0.3825, + "step": 5884 + }, + { + "epoch": 0.47, + "learning_rate": 1.1572834444121424e-05, + "loss": 0.3939, + "step": 5885 + }, + { + "epoch": 0.47, + "learning_rate": 1.157030029874251e-05, + "loss": 0.4125, + "step": 5886 + }, + { + "epoch": 0.47, + "learning_rate": 1.1567766049966882e-05, + "loss": 0.4751, + "step": 5887 + }, + { + "epoch": 0.47, + "learning_rate": 1.1565231697961398e-05, + "loss": 0.3971, + "step": 5888 + }, + { + "epoch": 0.47, + "learning_rate": 1.1562697242892939e-05, + "loss": 0.2704, + "step": 5889 + }, + { + "epoch": 0.47, + "learning_rate": 1.156016268492839e-05, + "loss": 0.3314, + "step": 5890 + }, + { + "epoch": 0.47, + "learning_rate": 1.155762802423463e-05, + "loss": 0.3381, + "step": 5891 + }, + { + "epoch": 0.47, + "learning_rate": 1.1555093260978562e-05, + "loss": 0.2675, + "step": 5892 + }, + { + "epoch": 0.47, + "learning_rate": 1.1552558395327087e-05, + "loss": 0.2866, + "step": 5893 + }, + { + "epoch": 0.47, + "learning_rate": 1.155002342744711e-05, + "loss": 0.2396, + "step": 5894 + }, + { + "epoch": 0.47, + "learning_rate": 1.1547488357505549e-05, + "loss": 0.4434, + "step": 5895 + }, + { + "epoch": 0.47, + "learning_rate": 1.1544953185669327e-05, + "loss": 0.3305, + "step": 5896 + }, + { + "epoch": 0.47, + "learning_rate": 1.154241791210537e-05, + "loss": 0.37, + "step": 5897 + }, + { + "epoch": 0.47, + "learning_rate": 1.1539882536980616e-05, + "loss": 0.2642, + "step": 5898 + }, + { + "epoch": 0.47, + "learning_rate": 1.1537347060462007e-05, + "loss": 0.3714, + "step": 5899 + }, + { + "epoch": 0.47, + "learning_rate": 1.1534811482716487e-05, + "loss": 0.4119, + "step": 5900 + }, + { + "epoch": 0.47, + "learning_rate": 1.1532275803911021e-05, + "loss": 0.3376, + "step": 5901 + }, + { + "epoch": 0.47, + "learning_rate": 1.1529740024212566e-05, + "loss": 0.4139, + "step": 5902 + }, + { + "epoch": 0.47, + "learning_rate": 1.1527204143788086e-05, + "loss": 0.3959, + "step": 5903 + }, + { + "epoch": 0.47, + "learning_rate": 1.1524668162804566e-05, + "loss": 0.3052, + "step": 5904 + }, + { + "epoch": 0.47, + "learning_rate": 1.1522132081428982e-05, + "loss": 0.4127, + "step": 5905 + }, + { + "epoch": 0.47, + "learning_rate": 1.1519595899828325e-05, + "loss": 0.4811, + "step": 5906 + }, + { + "epoch": 0.47, + "learning_rate": 1.151705961816959e-05, + "loss": 0.4097, + "step": 5907 + }, + { + "epoch": 0.47, + "learning_rate": 1.151452323661978e-05, + "loss": 0.4494, + "step": 5908 + }, + { + "epoch": 0.47, + "learning_rate": 1.15119867553459e-05, + "loss": 0.3655, + "step": 5909 + }, + { + "epoch": 0.47, + "learning_rate": 1.150945017451497e-05, + "loss": 0.3538, + "step": 5910 + }, + { + "epoch": 0.47, + "learning_rate": 1.1506913494294005e-05, + "loss": 0.3186, + "step": 5911 + }, + { + "epoch": 0.47, + "learning_rate": 1.1504376714850041e-05, + "loss": 0.4169, + "step": 5912 + }, + { + "epoch": 0.47, + "learning_rate": 1.1501839836350106e-05, + "loss": 0.4157, + "step": 5913 + }, + { + "epoch": 0.47, + "learning_rate": 1.1499302858961245e-05, + "loss": 0.438, + "step": 5914 + }, + { + "epoch": 0.47, + "learning_rate": 1.1496765782850507e-05, + "loss": 0.2773, + "step": 5915 + }, + { + "epoch": 0.47, + "learning_rate": 1.149422860818494e-05, + "loss": 0.4751, + "step": 5916 + }, + { + "epoch": 0.47, + "learning_rate": 1.1491691335131614e-05, + "loss": 0.4796, + "step": 5917 + }, + { + "epoch": 0.47, + "learning_rate": 1.148915396385759e-05, + "loss": 0.307, + "step": 5918 + }, + { + "epoch": 0.47, + "learning_rate": 1.1486616494529939e-05, + "loss": 0.383, + "step": 5919 + }, + { + "epoch": 0.47, + "learning_rate": 1.1484078927315749e-05, + "loss": 0.3418, + "step": 5920 + }, + { + "epoch": 0.47, + "learning_rate": 1.1481541262382102e-05, + "loss": 0.2968, + "step": 5921 + }, + { + "epoch": 0.47, + "learning_rate": 1.1479003499896089e-05, + "loss": 0.3126, + "step": 5922 + }, + { + "epoch": 0.47, + "learning_rate": 1.1476465640024814e-05, + "loss": 0.2743, + "step": 5923 + }, + { + "epoch": 0.47, + "learning_rate": 1.147392768293538e-05, + "loss": 0.3234, + "step": 5924 + }, + { + "epoch": 0.47, + "learning_rate": 1.1471389628794902e-05, + "loss": 0.4107, + "step": 5925 + }, + { + "epoch": 0.47, + "learning_rate": 1.1468851477770495e-05, + "loss": 0.4101, + "step": 5926 + }, + { + "epoch": 0.47, + "learning_rate": 1.1466313230029284e-05, + "loss": 0.4347, + "step": 5927 + }, + { + "epoch": 0.47, + "learning_rate": 1.1463774885738408e-05, + "loss": 0.4425, + "step": 5928 + }, + { + "epoch": 0.47, + "learning_rate": 1.1461236445064993e-05, + "loss": 0.3312, + "step": 5929 + }, + { + "epoch": 0.47, + "learning_rate": 1.1458697908176194e-05, + "loss": 0.3839, + "step": 5930 + }, + { + "epoch": 0.47, + "learning_rate": 1.1456159275239153e-05, + "loss": 0.3881, + "step": 5931 + }, + { + "epoch": 0.47, + "learning_rate": 1.1453620546421032e-05, + "loss": 0.3307, + "step": 5932 + }, + { + "epoch": 0.47, + "learning_rate": 1.1451081721888992e-05, + "loss": 0.4268, + "step": 5933 + }, + { + "epoch": 0.47, + "learning_rate": 1.1448542801810203e-05, + "loss": 0.4241, + "step": 5934 + }, + { + "epoch": 0.47, + "learning_rate": 1.144600378635184e-05, + "loss": 0.4257, + "step": 5935 + }, + { + "epoch": 0.47, + "learning_rate": 1.1443464675681089e-05, + "loss": 0.348, + "step": 5936 + }, + { + "epoch": 0.47, + "learning_rate": 1.1440925469965129e-05, + "loss": 0.3204, + "step": 5937 + }, + { + "epoch": 0.47, + "learning_rate": 1.1438386169371164e-05, + "loss": 0.4182, + "step": 5938 + }, + { + "epoch": 0.47, + "learning_rate": 1.143584677406639e-05, + "loss": 0.5538, + "step": 5939 + }, + { + "epoch": 0.47, + "learning_rate": 1.1433307284218014e-05, + "loss": 0.3655, + "step": 5940 + }, + { + "epoch": 0.47, + "learning_rate": 1.1430767699993247e-05, + "loss": 0.2698, + "step": 5941 + }, + { + "epoch": 0.47, + "learning_rate": 1.1428228021559316e-05, + "loss": 0.3294, + "step": 5942 + }, + { + "epoch": 0.47, + "learning_rate": 1.142568824908344e-05, + "loss": 0.3075, + "step": 5943 + }, + { + "epoch": 0.47, + "learning_rate": 1.1423148382732854e-05, + "loss": 0.3035, + "step": 5944 + }, + { + "epoch": 0.47, + "learning_rate": 1.1420608422674793e-05, + "loss": 0.3218, + "step": 5945 + }, + { + "epoch": 0.47, + "learning_rate": 1.1418068369076503e-05, + "loss": 0.2432, + "step": 5946 + }, + { + "epoch": 0.47, + "learning_rate": 1.1415528222105237e-05, + "loss": 0.2999, + "step": 5947 + }, + { + "epoch": 0.47, + "learning_rate": 1.1412987981928245e-05, + "loss": 0.3284, + "step": 5948 + }, + { + "epoch": 0.47, + "learning_rate": 1.1410447648712795e-05, + "loss": 0.4114, + "step": 5949 + }, + { + "epoch": 0.47, + "learning_rate": 1.1407907222626156e-05, + "loss": 0.3195, + "step": 5950 + }, + { + "epoch": 0.47, + "learning_rate": 1.1405366703835596e-05, + "loss": 0.378, + "step": 5951 + }, + { + "epoch": 0.47, + "learning_rate": 1.1402826092508405e-05, + "loss": 0.3517, + "step": 5952 + }, + { + "epoch": 0.47, + "learning_rate": 1.1400285388811862e-05, + "loss": 0.295, + "step": 5953 + }, + { + "epoch": 0.47, + "learning_rate": 1.1397744592913268e-05, + "loss": 0.4747, + "step": 5954 + }, + { + "epoch": 0.47, + "learning_rate": 1.1395203704979915e-05, + "loss": 0.2862, + "step": 5955 + }, + { + "epoch": 0.47, + "learning_rate": 1.1392662725179114e-05, + "loss": 0.3014, + "step": 5956 + }, + { + "epoch": 0.47, + "learning_rate": 1.139012165367817e-05, + "loss": 0.3333, + "step": 5957 + }, + { + "epoch": 0.47, + "learning_rate": 1.1387580490644408e-05, + "loss": 0.2847, + "step": 5958 + }, + { + "epoch": 0.47, + "learning_rate": 1.1385039236245143e-05, + "loss": 0.3847, + "step": 5959 + }, + { + "epoch": 0.47, + "learning_rate": 1.1382497890647712e-05, + "loss": 0.4294, + "step": 5960 + }, + { + "epoch": 0.47, + "learning_rate": 1.1379956454019445e-05, + "loss": 0.3169, + "step": 5961 + }, + { + "epoch": 0.47, + "learning_rate": 1.1377414926527688e-05, + "loss": 0.3185, + "step": 5962 + }, + { + "epoch": 0.47, + "learning_rate": 1.1374873308339784e-05, + "loss": 0.3985, + "step": 5963 + }, + { + "epoch": 0.47, + "learning_rate": 1.1372331599623088e-05, + "loss": 0.3477, + "step": 5964 + }, + { + "epoch": 0.47, + "learning_rate": 1.136978980054496e-05, + "loss": 0.4618, + "step": 5965 + }, + { + "epoch": 0.47, + "learning_rate": 1.1367247911272765e-05, + "loss": 0.3965, + "step": 5966 + }, + { + "epoch": 0.47, + "learning_rate": 1.1364705931973872e-05, + "loss": 0.4161, + "step": 5967 + }, + { + "epoch": 0.47, + "learning_rate": 1.1362163862815663e-05, + "loss": 0.3331, + "step": 5968 + }, + { + "epoch": 0.47, + "learning_rate": 1.1359621703965516e-05, + "loss": 0.3779, + "step": 5969 + }, + { + "epoch": 0.47, + "learning_rate": 1.135707945559082e-05, + "loss": 0.3939, + "step": 5970 + }, + { + "epoch": 0.47, + "learning_rate": 1.1354537117858975e-05, + "loss": 0.4436, + "step": 5971 + }, + { + "epoch": 0.47, + "learning_rate": 1.1351994690937377e-05, + "loss": 0.3277, + "step": 5972 + }, + { + "epoch": 0.47, + "learning_rate": 1.1349452174993437e-05, + "loss": 0.439, + "step": 5973 + }, + { + "epoch": 0.47, + "learning_rate": 1.1346909570194558e-05, + "loss": 0.338, + "step": 5974 + }, + { + "epoch": 0.47, + "learning_rate": 1.134436687670817e-05, + "loss": 0.3312, + "step": 5975 + }, + { + "epoch": 0.47, + "learning_rate": 1.134182409470169e-05, + "loss": 0.3865, + "step": 5976 + }, + { + "epoch": 0.47, + "learning_rate": 1.133928122434255e-05, + "loss": 0.3123, + "step": 5977 + }, + { + "epoch": 0.47, + "learning_rate": 1.1336738265798187e-05, + "loss": 0.3428, + "step": 5978 + }, + { + "epoch": 0.47, + "learning_rate": 1.1334195219236039e-05, + "loss": 0.3109, + "step": 5979 + }, + { + "epoch": 0.47, + "learning_rate": 1.1331652084823554e-05, + "loss": 0.337, + "step": 5980 + }, + { + "epoch": 0.47, + "learning_rate": 1.1329108862728192e-05, + "loss": 0.3629, + "step": 5981 + }, + { + "epoch": 0.47, + "learning_rate": 1.1326565553117404e-05, + "loss": 0.3481, + "step": 5982 + }, + { + "epoch": 0.47, + "learning_rate": 1.1324022156158654e-05, + "loss": 0.2929, + "step": 5983 + }, + { + "epoch": 0.47, + "learning_rate": 1.132147867201942e-05, + "loss": 0.2722, + "step": 5984 + }, + { + "epoch": 0.47, + "learning_rate": 1.1318935100867172e-05, + "loss": 0.3098, + "step": 5985 + }, + { + "epoch": 0.47, + "learning_rate": 1.1316391442869394e-05, + "loss": 0.363, + "step": 5986 + }, + { + "epoch": 0.47, + "learning_rate": 1.1313847698193577e-05, + "loss": 0.4601, + "step": 5987 + }, + { + "epoch": 0.47, + "learning_rate": 1.1311303867007207e-05, + "loss": 0.3566, + "step": 5988 + }, + { + "epoch": 0.47, + "learning_rate": 1.1308759949477786e-05, + "loss": 0.3622, + "step": 5989 + }, + { + "epoch": 0.47, + "learning_rate": 1.1306215945772823e-05, + "loss": 0.3689, + "step": 5990 + }, + { + "epoch": 0.47, + "learning_rate": 1.1303671856059824e-05, + "loss": 0.2792, + "step": 5991 + }, + { + "epoch": 0.47, + "learning_rate": 1.1301127680506305e-05, + "loss": 0.3251, + "step": 5992 + }, + { + "epoch": 0.47, + "learning_rate": 1.1298583419279792e-05, + "loss": 0.4571, + "step": 5993 + }, + { + "epoch": 0.47, + "learning_rate": 1.1296039072547804e-05, + "loss": 0.3296, + "step": 5994 + }, + { + "epoch": 0.47, + "learning_rate": 1.1293494640477885e-05, + "loss": 0.3324, + "step": 5995 + }, + { + "epoch": 0.48, + "learning_rate": 1.1290950123237564e-05, + "loss": 0.2863, + "step": 5996 + }, + { + "epoch": 0.48, + "learning_rate": 1.128840552099439e-05, + "loss": 0.4909, + "step": 5997 + }, + { + "epoch": 0.48, + "learning_rate": 1.1285860833915914e-05, + "loss": 0.2063, + "step": 5998 + }, + { + "epoch": 0.48, + "learning_rate": 1.1283316062169685e-05, + "loss": 0.2743, + "step": 5999 + }, + { + "epoch": 0.48, + "learning_rate": 1.1280771205923269e-05, + "loss": 0.3626, + "step": 6000 + }, + { + "epoch": 0.48, + "learning_rate": 1.1278226265344234e-05, + "loss": 0.3528, + "step": 6001 + }, + { + "epoch": 0.48, + "learning_rate": 1.127568124060015e-05, + "loss": 0.382, + "step": 6002 + }, + { + "epoch": 0.48, + "learning_rate": 1.1273136131858595e-05, + "loss": 0.4033, + "step": 6003 + }, + { + "epoch": 0.48, + "learning_rate": 1.1270590939287149e-05, + "loss": 0.412, + "step": 6004 + }, + { + "epoch": 0.48, + "learning_rate": 1.1268045663053404e-05, + "loss": 0.4667, + "step": 6005 + }, + { + "epoch": 0.48, + "learning_rate": 1.1265500303324954e-05, + "loss": 0.1684, + "step": 6006 + }, + { + "epoch": 0.48, + "learning_rate": 1.12629548602694e-05, + "loss": 0.3592, + "step": 6007 + }, + { + "epoch": 0.48, + "learning_rate": 1.1260409334054342e-05, + "loss": 0.46, + "step": 6008 + }, + { + "epoch": 0.48, + "learning_rate": 1.1257863724847398e-05, + "loss": 0.3145, + "step": 6009 + }, + { + "epoch": 0.48, + "learning_rate": 1.1255318032816175e-05, + "loss": 0.3628, + "step": 6010 + }, + { + "epoch": 0.48, + "learning_rate": 1.1252772258128303e-05, + "loss": 0.3364, + "step": 6011 + }, + { + "epoch": 0.48, + "learning_rate": 1.1250226400951408e-05, + "loss": 0.2894, + "step": 6012 + }, + { + "epoch": 0.48, + "learning_rate": 1.1247680461453114e-05, + "loss": 0.2981, + "step": 6013 + }, + { + "epoch": 0.48, + "learning_rate": 1.1245134439801073e-05, + "loss": 0.3266, + "step": 6014 + }, + { + "epoch": 0.48, + "learning_rate": 1.1242588336162916e-05, + "loss": 0.3461, + "step": 6015 + }, + { + "epoch": 0.48, + "learning_rate": 1.1240042150706296e-05, + "loss": 0.4388, + "step": 6016 + }, + { + "epoch": 0.48, + "learning_rate": 1.1237495883598868e-05, + "loss": 0.3975, + "step": 6017 + }, + { + "epoch": 0.48, + "learning_rate": 1.1234949535008289e-05, + "loss": 0.4227, + "step": 6018 + }, + { + "epoch": 0.48, + "learning_rate": 1.1232403105102226e-05, + "loss": 0.3629, + "step": 6019 + }, + { + "epoch": 0.48, + "learning_rate": 1.122985659404835e-05, + "loss": 0.3681, + "step": 6020 + }, + { + "epoch": 0.48, + "learning_rate": 1.1227310002014332e-05, + "loss": 0.2271, + "step": 6021 + }, + { + "epoch": 0.48, + "learning_rate": 1.1224763329167859e-05, + "loss": 0.3914, + "step": 6022 + }, + { + "epoch": 0.48, + "learning_rate": 1.122221657567661e-05, + "loss": 0.3622, + "step": 6023 + }, + { + "epoch": 0.48, + "learning_rate": 1.1219669741708282e-05, + "loss": 0.299, + "step": 6024 + }, + { + "epoch": 0.48, + "learning_rate": 1.121712282743057e-05, + "loss": 0.3294, + "step": 6025 + }, + { + "epoch": 0.48, + "learning_rate": 1.1214575833011178e-05, + "loss": 0.4289, + "step": 6026 + }, + { + "epoch": 0.48, + "learning_rate": 1.121202875861781e-05, + "loss": 0.4819, + "step": 6027 + }, + { + "epoch": 0.48, + "learning_rate": 1.1209481604418182e-05, + "loss": 0.3802, + "step": 6028 + }, + { + "epoch": 0.48, + "learning_rate": 1.1206934370580009e-05, + "loss": 0.3078, + "step": 6029 + }, + { + "epoch": 0.48, + "learning_rate": 1.1204387057271016e-05, + "loss": 0.4232, + "step": 6030 + }, + { + "epoch": 0.48, + "learning_rate": 1.1201839664658929e-05, + "loss": 0.3518, + "step": 6031 + }, + { + "epoch": 0.48, + "learning_rate": 1.1199292192911482e-05, + "loss": 0.4117, + "step": 6032 + }, + { + "epoch": 0.48, + "learning_rate": 1.1196744642196417e-05, + "loss": 0.4102, + "step": 6033 + }, + { + "epoch": 0.48, + "learning_rate": 1.1194197012681473e-05, + "loss": 0.2985, + "step": 6034 + }, + { + "epoch": 0.48, + "learning_rate": 1.1191649304534405e-05, + "loss": 0.3648, + "step": 6035 + }, + { + "epoch": 0.48, + "learning_rate": 1.1189101517922961e-05, + "loss": 0.3776, + "step": 6036 + }, + { + "epoch": 0.48, + "learning_rate": 1.1186553653014906e-05, + "loss": 0.2762, + "step": 6037 + }, + { + "epoch": 0.48, + "learning_rate": 1.1184005709978002e-05, + "loss": 0.3327, + "step": 6038 + }, + { + "epoch": 0.48, + "learning_rate": 1.118145768898002e-05, + "loss": 0.2241, + "step": 6039 + }, + { + "epoch": 0.48, + "learning_rate": 1.1178909590188731e-05, + "loss": 0.4193, + "step": 6040 + }, + { + "epoch": 0.48, + "learning_rate": 1.117636141377192e-05, + "loss": 0.3885, + "step": 6041 + }, + { + "epoch": 0.48, + "learning_rate": 1.117381315989737e-05, + "loss": 0.3209, + "step": 6042 + }, + { + "epoch": 0.48, + "learning_rate": 1.117126482873287e-05, + "loss": 0.3697, + "step": 6043 + }, + { + "epoch": 0.48, + "learning_rate": 1.1168716420446219e-05, + "loss": 0.3822, + "step": 6044 + }, + { + "epoch": 0.48, + "learning_rate": 1.1166167935205214e-05, + "loss": 0.3273, + "step": 6045 + }, + { + "epoch": 0.48, + "learning_rate": 1.1163619373177663e-05, + "loss": 0.3748, + "step": 6046 + }, + { + "epoch": 0.48, + "learning_rate": 1.1161070734531375e-05, + "loss": 0.4059, + "step": 6047 + }, + { + "epoch": 0.48, + "learning_rate": 1.1158522019434163e-05, + "loss": 0.4148, + "step": 6048 + }, + { + "epoch": 0.48, + "learning_rate": 1.1155973228053854e-05, + "loss": 0.4565, + "step": 6049 + }, + { + "epoch": 0.48, + "learning_rate": 1.1153424360558268e-05, + "loss": 0.4746, + "step": 6050 + }, + { + "epoch": 0.48, + "learning_rate": 1.115087541711524e-05, + "loss": 0.3542, + "step": 6051 + }, + { + "epoch": 0.48, + "learning_rate": 1.1148326397892601e-05, + "loss": 0.2958, + "step": 6052 + }, + { + "epoch": 0.48, + "learning_rate": 1.1145777303058197e-05, + "loss": 0.3119, + "step": 6053 + }, + { + "epoch": 0.48, + "learning_rate": 1.1143228132779867e-05, + "loss": 0.2537, + "step": 6054 + }, + { + "epoch": 0.48, + "learning_rate": 1.1140678887225468e-05, + "loss": 0.3814, + "step": 6055 + }, + { + "epoch": 0.48, + "learning_rate": 1.1138129566562853e-05, + "loss": 0.4016, + "step": 6056 + }, + { + "epoch": 0.48, + "learning_rate": 1.1135580170959881e-05, + "loss": 0.3141, + "step": 6057 + }, + { + "epoch": 0.48, + "learning_rate": 1.1133030700584419e-05, + "loss": 0.3413, + "step": 6058 + }, + { + "epoch": 0.48, + "learning_rate": 1.1130481155604336e-05, + "loss": 0.3944, + "step": 6059 + }, + { + "epoch": 0.48, + "learning_rate": 1.1127931536187511e-05, + "loss": 0.3713, + "step": 6060 + }, + { + "epoch": 0.48, + "learning_rate": 1.1125381842501819e-05, + "loss": 0.4027, + "step": 6061 + }, + { + "epoch": 0.48, + "learning_rate": 1.1122832074715149e-05, + "loss": 0.3553, + "step": 6062 + }, + { + "epoch": 0.48, + "learning_rate": 1.1120282232995389e-05, + "loss": 0.3981, + "step": 6063 + }, + { + "epoch": 0.48, + "learning_rate": 1.1117732317510437e-05, + "loss": 0.4849, + "step": 6064 + }, + { + "epoch": 0.48, + "learning_rate": 1.111518232842819e-05, + "loss": 0.2873, + "step": 6065 + }, + { + "epoch": 0.48, + "learning_rate": 1.1112632265916548e-05, + "loss": 0.483, + "step": 6066 + }, + { + "epoch": 0.48, + "learning_rate": 1.1110082130143427e-05, + "loss": 0.3349, + "step": 6067 + }, + { + "epoch": 0.48, + "learning_rate": 1.1107531921276742e-05, + "loss": 0.3166, + "step": 6068 + }, + { + "epoch": 0.48, + "learning_rate": 1.1104981639484404e-05, + "loss": 0.277, + "step": 6069 + }, + { + "epoch": 0.48, + "learning_rate": 1.1102431284934345e-05, + "loss": 0.3473, + "step": 6070 + }, + { + "epoch": 0.48, + "learning_rate": 1.1099880857794491e-05, + "loss": 0.5149, + "step": 6071 + }, + { + "epoch": 0.48, + "learning_rate": 1.1097330358232775e-05, + "loss": 0.4565, + "step": 6072 + }, + { + "epoch": 0.48, + "learning_rate": 1.1094779786417133e-05, + "loss": 0.2361, + "step": 6073 + }, + { + "epoch": 0.48, + "learning_rate": 1.1092229142515512e-05, + "loss": 0.365, + "step": 6074 + }, + { + "epoch": 0.48, + "learning_rate": 1.1089678426695854e-05, + "loss": 0.399, + "step": 6075 + }, + { + "epoch": 0.48, + "learning_rate": 1.1087127639126118e-05, + "loss": 0.3179, + "step": 6076 + }, + { + "epoch": 0.48, + "learning_rate": 1.1084576779974257e-05, + "loss": 0.3113, + "step": 6077 + }, + { + "epoch": 0.48, + "learning_rate": 1.1082025849408231e-05, + "loss": 0.2938, + "step": 6078 + }, + { + "epoch": 0.48, + "learning_rate": 1.1079474847596014e-05, + "loss": 0.3589, + "step": 6079 + }, + { + "epoch": 0.48, + "learning_rate": 1.1076923774705568e-05, + "loss": 0.3365, + "step": 6080 + }, + { + "epoch": 0.48, + "learning_rate": 1.1074372630904878e-05, + "loss": 0.3383, + "step": 6081 + }, + { + "epoch": 0.48, + "learning_rate": 1.1071821416361917e-05, + "loss": 0.3016, + "step": 6082 + }, + { + "epoch": 0.48, + "learning_rate": 1.106927013124467e-05, + "loss": 0.2696, + "step": 6083 + }, + { + "epoch": 0.48, + "learning_rate": 1.1066718775721135e-05, + "loss": 0.2511, + "step": 6084 + }, + { + "epoch": 0.48, + "learning_rate": 1.1064167349959299e-05, + "loss": 0.297, + "step": 6085 + }, + { + "epoch": 0.48, + "learning_rate": 1.1061615854127165e-05, + "loss": 0.3461, + "step": 6086 + }, + { + "epoch": 0.48, + "learning_rate": 1.1059064288392733e-05, + "loss": 0.37, + "step": 6087 + }, + { + "epoch": 0.48, + "learning_rate": 1.1056512652924014e-05, + "loss": 0.2515, + "step": 6088 + }, + { + "epoch": 0.48, + "learning_rate": 1.1053960947889021e-05, + "loss": 0.3336, + "step": 6089 + }, + { + "epoch": 0.48, + "learning_rate": 1.1051409173455771e-05, + "loss": 0.2995, + "step": 6090 + }, + { + "epoch": 0.48, + "learning_rate": 1.1048857329792284e-05, + "loss": 0.242, + "step": 6091 + }, + { + "epoch": 0.48, + "learning_rate": 1.1046305417066594e-05, + "loss": 0.4302, + "step": 6092 + }, + { + "epoch": 0.48, + "learning_rate": 1.1043753435446722e-05, + "loss": 0.4064, + "step": 6093 + }, + { + "epoch": 0.48, + "learning_rate": 1.104120138510071e-05, + "loss": 0.338, + "step": 6094 + }, + { + "epoch": 0.48, + "learning_rate": 1.1038649266196597e-05, + "loss": 0.3641, + "step": 6095 + }, + { + "epoch": 0.48, + "learning_rate": 1.1036097078902428e-05, + "loss": 0.3148, + "step": 6096 + }, + { + "epoch": 0.48, + "learning_rate": 1.1033544823386248e-05, + "loss": 0.4983, + "step": 6097 + }, + { + "epoch": 0.48, + "learning_rate": 1.103099249981612e-05, + "loss": 0.2941, + "step": 6098 + }, + { + "epoch": 0.48, + "learning_rate": 1.1028440108360092e-05, + "loss": 0.3158, + "step": 6099 + }, + { + "epoch": 0.48, + "learning_rate": 1.1025887649186236e-05, + "loss": 0.3321, + "step": 6100 + }, + { + "epoch": 0.48, + "learning_rate": 1.1023335122462611e-05, + "loss": 0.3945, + "step": 6101 + }, + { + "epoch": 0.48, + "learning_rate": 1.102078252835729e-05, + "loss": 0.3354, + "step": 6102 + }, + { + "epoch": 0.48, + "learning_rate": 1.1018229867038358e-05, + "loss": 0.3857, + "step": 6103 + }, + { + "epoch": 0.48, + "learning_rate": 1.1015677138673882e-05, + "loss": 0.3422, + "step": 6104 + }, + { + "epoch": 0.48, + "learning_rate": 1.1013124343431955e-05, + "loss": 0.3931, + "step": 6105 + }, + { + "epoch": 0.48, + "learning_rate": 1.1010571481480668e-05, + "loss": 0.3766, + "step": 6106 + }, + { + "epoch": 0.48, + "learning_rate": 1.1008018552988109e-05, + "loss": 0.2647, + "step": 6107 + }, + { + "epoch": 0.48, + "learning_rate": 1.1005465558122382e-05, + "loss": 0.3251, + "step": 6108 + }, + { + "epoch": 0.48, + "learning_rate": 1.1002912497051582e-05, + "loss": 0.276, + "step": 6109 + }, + { + "epoch": 0.48, + "learning_rate": 1.1000359369943818e-05, + "loss": 0.3216, + "step": 6110 + }, + { + "epoch": 0.48, + "learning_rate": 1.099780617696721e-05, + "loss": 0.4347, + "step": 6111 + }, + { + "epoch": 0.48, + "learning_rate": 1.099525291828986e-05, + "loss": 0.2998, + "step": 6112 + }, + { + "epoch": 0.48, + "learning_rate": 1.0992699594079896e-05, + "loss": 0.4389, + "step": 6113 + }, + { + "epoch": 0.48, + "learning_rate": 1.0990146204505444e-05, + "loss": 0.3824, + "step": 6114 + }, + { + "epoch": 0.48, + "learning_rate": 1.0987592749734624e-05, + "loss": 0.3972, + "step": 6115 + }, + { + "epoch": 0.48, + "learning_rate": 1.0985039229935575e-05, + "loss": 0.5073, + "step": 6116 + }, + { + "epoch": 0.48, + "learning_rate": 1.098248564527643e-05, + "loss": 0.2787, + "step": 6117 + }, + { + "epoch": 0.48, + "learning_rate": 1.0979931995925335e-05, + "loss": 0.33, + "step": 6118 + }, + { + "epoch": 0.48, + "learning_rate": 1.0977378282050436e-05, + "loss": 0.3681, + "step": 6119 + }, + { + "epoch": 0.48, + "learning_rate": 1.0974824503819877e-05, + "loss": 0.2552, + "step": 6120 + }, + { + "epoch": 0.48, + "learning_rate": 1.0972270661401812e-05, + "loss": 0.3814, + "step": 6121 + }, + { + "epoch": 0.49, + "learning_rate": 1.0969716754964408e-05, + "loss": 0.395, + "step": 6122 + }, + { + "epoch": 0.49, + "learning_rate": 1.0967162784675818e-05, + "loss": 0.4038, + "step": 6123 + }, + { + "epoch": 0.49, + "learning_rate": 1.0964608750704215e-05, + "loss": 0.3146, + "step": 6124 + }, + { + "epoch": 0.49, + "learning_rate": 1.0962054653217764e-05, + "loss": 0.2915, + "step": 6125 + }, + { + "epoch": 0.49, + "learning_rate": 1.0959500492384646e-05, + "loss": 0.3689, + "step": 6126 + }, + { + "epoch": 0.49, + "learning_rate": 1.0956946268373034e-05, + "loss": 0.2841, + "step": 6127 + }, + { + "epoch": 0.49, + "learning_rate": 1.0954391981351117e-05, + "loss": 0.4168, + "step": 6128 + }, + { + "epoch": 0.49, + "learning_rate": 1.0951837631487081e-05, + "loss": 0.2991, + "step": 6129 + }, + { + "epoch": 0.49, + "learning_rate": 1.0949283218949117e-05, + "loss": 0.4915, + "step": 6130 + }, + { + "epoch": 0.49, + "learning_rate": 1.094672874390542e-05, + "loss": 0.4031, + "step": 6131 + }, + { + "epoch": 0.49, + "learning_rate": 1.094417420652419e-05, + "loss": 0.3877, + "step": 6132 + }, + { + "epoch": 0.49, + "learning_rate": 1.0941619606973633e-05, + "loss": 0.3234, + "step": 6133 + }, + { + "epoch": 0.49, + "learning_rate": 1.0939064945421953e-05, + "loss": 0.3525, + "step": 6134 + }, + { + "epoch": 0.49, + "learning_rate": 1.0936510222037368e-05, + "loss": 0.3538, + "step": 6135 + }, + { + "epoch": 0.49, + "learning_rate": 1.0933955436988088e-05, + "loss": 0.3046, + "step": 6136 + }, + { + "epoch": 0.49, + "learning_rate": 1.0931400590442337e-05, + "loss": 0.3727, + "step": 6137 + }, + { + "epoch": 0.49, + "learning_rate": 1.0928845682568344e-05, + "loss": 0.4228, + "step": 6138 + }, + { + "epoch": 0.49, + "learning_rate": 1.0926290713534324e-05, + "loss": 0.4246, + "step": 6139 + }, + { + "epoch": 0.49, + "learning_rate": 1.0923735683508521e-05, + "loss": 0.3437, + "step": 6140 + }, + { + "epoch": 0.49, + "learning_rate": 1.092118059265917e-05, + "loss": 0.4174, + "step": 6141 + }, + { + "epoch": 0.49, + "learning_rate": 1.0918625441154508e-05, + "loss": 0.333, + "step": 6142 + }, + { + "epoch": 0.49, + "learning_rate": 1.091607022916278e-05, + "loss": 0.4404, + "step": 6143 + }, + { + "epoch": 0.49, + "learning_rate": 1.0913514956852236e-05, + "loss": 0.2352, + "step": 6144 + }, + { + "epoch": 0.49, + "learning_rate": 1.0910959624391127e-05, + "loss": 0.3619, + "step": 6145 + }, + { + "epoch": 0.49, + "learning_rate": 1.090840423194771e-05, + "loss": 0.4185, + "step": 6146 + }, + { + "epoch": 0.49, + "learning_rate": 1.0905848779690246e-05, + "loss": 0.3826, + "step": 6147 + }, + { + "epoch": 0.49, + "learning_rate": 1.0903293267786998e-05, + "loss": 0.276, + "step": 6148 + }, + { + "epoch": 0.49, + "learning_rate": 1.0900737696406235e-05, + "loss": 0.2457, + "step": 6149 + }, + { + "epoch": 0.49, + "learning_rate": 1.0898182065716227e-05, + "loss": 0.2925, + "step": 6150 + }, + { + "epoch": 0.49, + "learning_rate": 1.0895626375885255e-05, + "loss": 0.2746, + "step": 6151 + }, + { + "epoch": 0.49, + "learning_rate": 1.0893070627081595e-05, + "loss": 0.3234, + "step": 6152 + }, + { + "epoch": 0.49, + "learning_rate": 1.089051481947353e-05, + "loss": 0.4237, + "step": 6153 + }, + { + "epoch": 0.49, + "learning_rate": 1.0887958953229349e-05, + "loss": 0.3755, + "step": 6154 + }, + { + "epoch": 0.49, + "learning_rate": 1.0885403028517345e-05, + "loss": 0.3077, + "step": 6155 + }, + { + "epoch": 0.49, + "learning_rate": 1.0882847045505809e-05, + "loss": 0.489, + "step": 6156 + }, + { + "epoch": 0.49, + "learning_rate": 1.0880291004363047e-05, + "loss": 0.3201, + "step": 6157 + }, + { + "epoch": 0.49, + "learning_rate": 1.0877734905257354e-05, + "loss": 0.2975, + "step": 6158 + }, + { + "epoch": 0.49, + "learning_rate": 1.0875178748357045e-05, + "loss": 0.2685, + "step": 6159 + }, + { + "epoch": 0.49, + "learning_rate": 1.0872622533830423e-05, + "loss": 0.3445, + "step": 6160 + }, + { + "epoch": 0.49, + "learning_rate": 1.0870066261845807e-05, + "loss": 0.3824, + "step": 6161 + }, + { + "epoch": 0.49, + "learning_rate": 1.0867509932571517e-05, + "loss": 0.2702, + "step": 6162 + }, + { + "epoch": 0.49, + "learning_rate": 1.0864953546175867e-05, + "loss": 0.3455, + "step": 6163 + }, + { + "epoch": 0.49, + "learning_rate": 1.0862397102827189e-05, + "loss": 0.3949, + "step": 6164 + }, + { + "epoch": 0.49, + "learning_rate": 1.0859840602693813e-05, + "loss": 0.3949, + "step": 6165 + }, + { + "epoch": 0.49, + "learning_rate": 1.0857284045944071e-05, + "loss": 0.3458, + "step": 6166 + }, + { + "epoch": 0.49, + "learning_rate": 1.0854727432746302e-05, + "loss": 0.32, + "step": 6167 + }, + { + "epoch": 0.49, + "learning_rate": 1.0852170763268838e-05, + "loss": 0.2848, + "step": 6168 + }, + { + "epoch": 0.49, + "learning_rate": 1.0849614037680032e-05, + "loss": 0.4398, + "step": 6169 + }, + { + "epoch": 0.49, + "learning_rate": 1.0847057256148234e-05, + "loss": 0.3237, + "step": 6170 + }, + { + "epoch": 0.49, + "learning_rate": 1.0844500418841788e-05, + "loss": 0.2792, + "step": 6171 + }, + { + "epoch": 0.49, + "learning_rate": 1.0841943525929053e-05, + "loss": 0.4598, + "step": 6172 + }, + { + "epoch": 0.49, + "learning_rate": 1.0839386577578389e-05, + "loss": 0.3927, + "step": 6173 + }, + { + "epoch": 0.49, + "learning_rate": 1.0836829573958155e-05, + "loss": 0.314, + "step": 6174 + }, + { + "epoch": 0.49, + "learning_rate": 1.083427251523672e-05, + "loss": 0.3395, + "step": 6175 + }, + { + "epoch": 0.49, + "learning_rate": 1.0831715401582458e-05, + "loss": 0.2957, + "step": 6176 + }, + { + "epoch": 0.49, + "learning_rate": 1.0829158233163737e-05, + "loss": 0.2367, + "step": 6177 + }, + { + "epoch": 0.49, + "learning_rate": 1.0826601010148935e-05, + "loss": 0.5682, + "step": 6178 + }, + { + "epoch": 0.49, + "learning_rate": 1.0824043732706435e-05, + "loss": 0.3671, + "step": 6179 + }, + { + "epoch": 0.49, + "learning_rate": 1.0821486401004618e-05, + "loss": 0.3275, + "step": 6180 + }, + { + "epoch": 0.49, + "learning_rate": 1.0818929015211877e-05, + "loss": 0.3033, + "step": 6181 + }, + { + "epoch": 0.49, + "learning_rate": 1.0816371575496598e-05, + "loss": 0.3134, + "step": 6182 + }, + { + "epoch": 0.49, + "learning_rate": 1.081381408202718e-05, + "loss": 0.3225, + "step": 6183 + }, + { + "epoch": 0.49, + "learning_rate": 1.0811256534972024e-05, + "loss": 0.4829, + "step": 6184 + }, + { + "epoch": 0.49, + "learning_rate": 1.0808698934499524e-05, + "loss": 0.3313, + "step": 6185 + }, + { + "epoch": 0.49, + "learning_rate": 1.0806141280778093e-05, + "loss": 0.3529, + "step": 6186 + }, + { + "epoch": 0.49, + "learning_rate": 1.0803583573976137e-05, + "loss": 0.3874, + "step": 6187 + }, + { + "epoch": 0.49, + "learning_rate": 1.0801025814262068e-05, + "loss": 0.2688, + "step": 6188 + }, + { + "epoch": 0.49, + "learning_rate": 1.0798468001804305e-05, + "loss": 0.3562, + "step": 6189 + }, + { + "epoch": 0.49, + "learning_rate": 1.0795910136771266e-05, + "loss": 0.3813, + "step": 6190 + }, + { + "epoch": 0.49, + "learning_rate": 1.0793352219331371e-05, + "loss": 0.3579, + "step": 6191 + }, + { + "epoch": 0.49, + "learning_rate": 1.0790794249653056e-05, + "loss": 0.3733, + "step": 6192 + }, + { + "epoch": 0.49, + "learning_rate": 1.0788236227904738e-05, + "loss": 0.3595, + "step": 6193 + }, + { + "epoch": 0.49, + "learning_rate": 1.0785678154254865e-05, + "loss": 0.3285, + "step": 6194 + }, + { + "epoch": 0.49, + "learning_rate": 1.0783120028871858e-05, + "loss": 0.2864, + "step": 6195 + }, + { + "epoch": 0.49, + "learning_rate": 1.0780561851924168e-05, + "loss": 0.3167, + "step": 6196 + }, + { + "epoch": 0.49, + "learning_rate": 1.0778003623580237e-05, + "loss": 0.4127, + "step": 6197 + }, + { + "epoch": 0.49, + "learning_rate": 1.077544534400851e-05, + "loss": 0.3726, + "step": 6198 + }, + { + "epoch": 0.49, + "learning_rate": 1.0772887013377438e-05, + "loss": 0.3905, + "step": 6199 + }, + { + "epoch": 0.49, + "learning_rate": 1.0770328631855476e-05, + "loss": 0.3981, + "step": 6200 + }, + { + "epoch": 0.49, + "learning_rate": 1.0767770199611078e-05, + "loss": 0.3169, + "step": 6201 + }, + { + "epoch": 0.49, + "learning_rate": 1.076521171681271e-05, + "loss": 0.3902, + "step": 6202 + }, + { + "epoch": 0.49, + "learning_rate": 1.0762653183628831e-05, + "loss": 0.3456, + "step": 6203 + }, + { + "epoch": 0.49, + "learning_rate": 1.0760094600227908e-05, + "loss": 0.4043, + "step": 6204 + }, + { + "epoch": 0.49, + "learning_rate": 1.0757535966778416e-05, + "loss": 0.319, + "step": 6205 + }, + { + "epoch": 0.49, + "learning_rate": 1.0754977283448824e-05, + "loss": 0.4477, + "step": 6206 + }, + { + "epoch": 0.49, + "learning_rate": 1.0752418550407611e-05, + "loss": 0.4664, + "step": 6207 + }, + { + "epoch": 0.49, + "learning_rate": 1.0749859767823256e-05, + "loss": 0.3876, + "step": 6208 + }, + { + "epoch": 0.49, + "learning_rate": 1.0747300935864245e-05, + "loss": 0.473, + "step": 6209 + }, + { + "epoch": 0.49, + "learning_rate": 1.074474205469906e-05, + "loss": 0.3703, + "step": 6210 + }, + { + "epoch": 0.49, + "learning_rate": 1.0742183124496197e-05, + "loss": 0.3697, + "step": 6211 + }, + { + "epoch": 0.49, + "learning_rate": 1.0739624145424146e-05, + "loss": 0.3893, + "step": 6212 + }, + { + "epoch": 0.49, + "learning_rate": 1.0737065117651404e-05, + "loss": 0.3132, + "step": 6213 + }, + { + "epoch": 0.49, + "learning_rate": 1.0734506041346468e-05, + "loss": 0.3628, + "step": 6214 + }, + { + "epoch": 0.49, + "learning_rate": 1.0731946916677847e-05, + "loss": 0.4696, + "step": 6215 + }, + { + "epoch": 0.49, + "learning_rate": 1.0729387743814041e-05, + "loss": 0.2343, + "step": 6216 + }, + { + "epoch": 0.49, + "learning_rate": 1.0726828522923563e-05, + "loss": 0.3762, + "step": 6217 + }, + { + "epoch": 0.49, + "learning_rate": 1.0724269254174921e-05, + "loss": 0.3867, + "step": 6218 + }, + { + "epoch": 0.49, + "learning_rate": 1.0721709937736638e-05, + "loss": 0.4161, + "step": 6219 + }, + { + "epoch": 0.49, + "learning_rate": 1.0719150573777226e-05, + "loss": 0.2261, + "step": 6220 + }, + { + "epoch": 0.49, + "learning_rate": 1.071659116246521e-05, + "loss": 0.3209, + "step": 6221 + }, + { + "epoch": 0.49, + "learning_rate": 1.0714031703969112e-05, + "loss": 0.302, + "step": 6222 + }, + { + "epoch": 0.49, + "learning_rate": 1.0711472198457462e-05, + "loss": 0.4019, + "step": 6223 + }, + { + "epoch": 0.49, + "learning_rate": 1.0708912646098795e-05, + "loss": 0.4281, + "step": 6224 + }, + { + "epoch": 0.49, + "learning_rate": 1.0706353047061638e-05, + "loss": 0.3902, + "step": 6225 + }, + { + "epoch": 0.49, + "learning_rate": 1.070379340151453e-05, + "loss": 0.3941, + "step": 6226 + }, + { + "epoch": 0.49, + "learning_rate": 1.0701233709626018e-05, + "loss": 0.3321, + "step": 6227 + }, + { + "epoch": 0.49, + "learning_rate": 1.0698673971564637e-05, + "loss": 0.2646, + "step": 6228 + }, + { + "epoch": 0.49, + "learning_rate": 1.0696114187498938e-05, + "loss": 0.397, + "step": 6229 + }, + { + "epoch": 0.49, + "learning_rate": 1.0693554357597469e-05, + "loss": 0.2873, + "step": 6230 + }, + { + "epoch": 0.49, + "learning_rate": 1.069099448202878e-05, + "loss": 0.3324, + "step": 6231 + }, + { + "epoch": 0.49, + "learning_rate": 1.0688434560961434e-05, + "loss": 0.3771, + "step": 6232 + }, + { + "epoch": 0.49, + "learning_rate": 1.068587459456398e-05, + "loss": 0.3833, + "step": 6233 + }, + { + "epoch": 0.49, + "learning_rate": 1.0683314583004986e-05, + "loss": 0.3984, + "step": 6234 + }, + { + "epoch": 0.49, + "learning_rate": 1.0680754526453017e-05, + "loss": 0.3003, + "step": 6235 + }, + { + "epoch": 0.49, + "learning_rate": 1.0678194425076633e-05, + "loss": 0.4579, + "step": 6236 + }, + { + "epoch": 0.49, + "learning_rate": 1.0675634279044416e-05, + "loss": 0.3914, + "step": 6237 + }, + { + "epoch": 0.49, + "learning_rate": 1.0673074088524926e-05, + "loss": 0.4162, + "step": 6238 + }, + { + "epoch": 0.49, + "learning_rate": 1.067051385368675e-05, + "loss": 0.3849, + "step": 6239 + }, + { + "epoch": 0.49, + "learning_rate": 1.0667953574698461e-05, + "loss": 0.3925, + "step": 6240 + }, + { + "epoch": 0.49, + "learning_rate": 1.0665393251728645e-05, + "loss": 0.2719, + "step": 6241 + }, + { + "epoch": 0.49, + "learning_rate": 1.0662832884945884e-05, + "loss": 0.4063, + "step": 6242 + }, + { + "epoch": 0.49, + "learning_rate": 1.0660272474518767e-05, + "loss": 0.3664, + "step": 6243 + }, + { + "epoch": 0.49, + "learning_rate": 1.0657712020615885e-05, + "loss": 0.4322, + "step": 6244 + }, + { + "epoch": 0.49, + "learning_rate": 1.0655151523405831e-05, + "loss": 0.4385, + "step": 6245 + }, + { + "epoch": 0.49, + "learning_rate": 1.06525909830572e-05, + "loss": 0.3438, + "step": 6246 + }, + { + "epoch": 0.49, + "learning_rate": 1.0650030399738594e-05, + "loss": 0.322, + "step": 6247 + }, + { + "epoch": 0.49, + "learning_rate": 1.0647469773618617e-05, + "loss": 0.232, + "step": 6248 + }, + { + "epoch": 0.5, + "learning_rate": 1.0644909104865869e-05, + "loss": 0.3509, + "step": 6249 + }, + { + "epoch": 0.5, + "learning_rate": 1.0642348393648956e-05, + "loss": 0.389, + "step": 6250 + }, + { + "epoch": 0.5, + "learning_rate": 1.0639787640136497e-05, + "loss": 0.3505, + "step": 6251 + }, + { + "epoch": 0.5, + "learning_rate": 1.0637226844497096e-05, + "loss": 0.3375, + "step": 6252 + }, + { + "epoch": 0.5, + "learning_rate": 1.0634666006899375e-05, + "loss": 0.2631, + "step": 6253 + }, + { + "epoch": 0.5, + "learning_rate": 1.0632105127511952e-05, + "loss": 0.3459, + "step": 6254 + }, + { + "epoch": 0.5, + "learning_rate": 1.0629544206503445e-05, + "loss": 0.3674, + "step": 6255 + }, + { + "epoch": 0.5, + "learning_rate": 1.0626983244042486e-05, + "loss": 0.3314, + "step": 6256 + }, + { + "epoch": 0.5, + "learning_rate": 1.0624422240297694e-05, + "loss": 0.3927, + "step": 6257 + }, + { + "epoch": 0.5, + "learning_rate": 1.0621861195437703e-05, + "loss": 0.3821, + "step": 6258 + }, + { + "epoch": 0.5, + "learning_rate": 1.0619300109631146e-05, + "loss": 0.3597, + "step": 6259 + }, + { + "epoch": 0.5, + "learning_rate": 1.0616738983046652e-05, + "loss": 0.3389, + "step": 6260 + }, + { + "epoch": 0.5, + "learning_rate": 1.0614177815852866e-05, + "loss": 0.4203, + "step": 6261 + }, + { + "epoch": 0.5, + "learning_rate": 1.0611616608218429e-05, + "loss": 0.371, + "step": 6262 + }, + { + "epoch": 0.5, + "learning_rate": 1.0609055360311978e-05, + "loss": 0.4336, + "step": 6263 + }, + { + "epoch": 0.5, + "learning_rate": 1.0606494072302164e-05, + "loss": 0.3038, + "step": 6264 + }, + { + "epoch": 0.5, + "learning_rate": 1.0603932744357632e-05, + "loss": 0.3513, + "step": 6265 + }, + { + "epoch": 0.5, + "learning_rate": 1.0601371376647034e-05, + "loss": 0.3828, + "step": 6266 + }, + { + "epoch": 0.5, + "learning_rate": 1.0598809969339028e-05, + "loss": 0.4925, + "step": 6267 + }, + { + "epoch": 0.5, + "learning_rate": 1.0596248522602264e-05, + "loss": 0.3385, + "step": 6268 + }, + { + "epoch": 0.5, + "learning_rate": 1.0593687036605402e-05, + "loss": 0.312, + "step": 6269 + }, + { + "epoch": 0.5, + "learning_rate": 1.0591125511517108e-05, + "loss": 0.2923, + "step": 6270 + }, + { + "epoch": 0.5, + "learning_rate": 1.0588563947506043e-05, + "loss": 0.4041, + "step": 6271 + }, + { + "epoch": 0.5, + "learning_rate": 1.0586002344740875e-05, + "loss": 0.3502, + "step": 6272 + }, + { + "epoch": 0.5, + "learning_rate": 1.0583440703390271e-05, + "loss": 0.3512, + "step": 6273 + }, + { + "epoch": 0.5, + "learning_rate": 1.0580879023622903e-05, + "loss": 0.3318, + "step": 6274 + }, + { + "epoch": 0.5, + "learning_rate": 1.0578317305607451e-05, + "loss": 0.3112, + "step": 6275 + }, + { + "epoch": 0.5, + "learning_rate": 1.057575554951258e-05, + "loss": 0.3415, + "step": 6276 + }, + { + "epoch": 0.5, + "learning_rate": 1.0573193755506982e-05, + "loss": 0.262, + "step": 6277 + }, + { + "epoch": 0.5, + "learning_rate": 1.0570631923759331e-05, + "loss": 0.38, + "step": 6278 + }, + { + "epoch": 0.5, + "learning_rate": 1.0568070054438314e-05, + "loss": 0.4143, + "step": 6279 + }, + { + "epoch": 0.5, + "learning_rate": 1.0565508147712618e-05, + "loss": 0.3416, + "step": 6280 + }, + { + "epoch": 0.5, + "learning_rate": 1.056294620375093e-05, + "loss": 0.3969, + "step": 6281 + }, + { + "epoch": 0.5, + "learning_rate": 1.0560384222721943e-05, + "loss": 0.3823, + "step": 6282 + }, + { + "epoch": 0.5, + "learning_rate": 1.0557822204794353e-05, + "loss": 0.4175, + "step": 6283 + }, + { + "epoch": 0.5, + "learning_rate": 1.0555260150136852e-05, + "loss": 0.2981, + "step": 6284 + }, + { + "epoch": 0.5, + "learning_rate": 1.0552698058918146e-05, + "loss": 0.3218, + "step": 6285 + }, + { + "epoch": 0.5, + "learning_rate": 1.055013593130693e-05, + "loss": 0.3527, + "step": 6286 + }, + { + "epoch": 0.5, + "learning_rate": 1.0547573767471913e-05, + "loss": 0.3857, + "step": 6287 + }, + { + "epoch": 0.5, + "learning_rate": 1.0545011567581794e-05, + "loss": 0.2703, + "step": 6288 + }, + { + "epoch": 0.5, + "learning_rate": 1.0542449331805287e-05, + "loss": 0.3581, + "step": 6289 + }, + { + "epoch": 0.5, + "learning_rate": 1.05398870603111e-05, + "loss": 0.3993, + "step": 6290 + }, + { + "epoch": 0.5, + "learning_rate": 1.0537324753267952e-05, + "loss": 0.2527, + "step": 6291 + }, + { + "epoch": 0.5, + "learning_rate": 1.053476241084455e-05, + "loss": 0.4424, + "step": 6292 + }, + { + "epoch": 0.5, + "learning_rate": 1.0532200033209618e-05, + "loss": 0.3177, + "step": 6293 + }, + { + "epoch": 0.5, + "learning_rate": 1.0529637620531876e-05, + "loss": 0.3158, + "step": 6294 + }, + { + "epoch": 0.5, + "learning_rate": 1.0527075172980043e-05, + "loss": 0.4027, + "step": 6295 + }, + { + "epoch": 0.5, + "learning_rate": 1.0524512690722848e-05, + "loss": 0.4993, + "step": 6296 + }, + { + "epoch": 0.5, + "learning_rate": 1.0521950173929017e-05, + "loss": 0.4586, + "step": 6297 + }, + { + "epoch": 0.5, + "learning_rate": 1.0519387622767274e-05, + "loss": 0.4199, + "step": 6298 + }, + { + "epoch": 0.5, + "learning_rate": 1.051682503740636e-05, + "loss": 0.2482, + "step": 6299 + }, + { + "epoch": 0.5, + "learning_rate": 1.0514262418015e-05, + "loss": 0.4616, + "step": 6300 + }, + { + "epoch": 0.5, + "learning_rate": 1.0511699764761935e-05, + "loss": 0.3476, + "step": 6301 + }, + { + "epoch": 0.5, + "learning_rate": 1.0509137077815906e-05, + "loss": 0.4998, + "step": 6302 + }, + { + "epoch": 0.5, + "learning_rate": 1.0506574357345647e-05, + "loss": 0.3968, + "step": 6303 + }, + { + "epoch": 0.5, + "learning_rate": 1.0504011603519904e-05, + "loss": 0.2265, + "step": 6304 + }, + { + "epoch": 0.5, + "learning_rate": 1.0501448816507425e-05, + "loss": 0.3547, + "step": 6305 + }, + { + "epoch": 0.5, + "learning_rate": 1.0498885996476952e-05, + "loss": 0.2761, + "step": 6306 + }, + { + "epoch": 0.5, + "learning_rate": 1.0496323143597237e-05, + "loss": 0.3718, + "step": 6307 + }, + { + "epoch": 0.5, + "learning_rate": 1.049376025803703e-05, + "loss": 0.3553, + "step": 6308 + }, + { + "epoch": 0.5, + "learning_rate": 1.0491197339965087e-05, + "loss": 0.4452, + "step": 6309 + }, + { + "epoch": 0.5, + "learning_rate": 1.0488634389550166e-05, + "loss": 0.2959, + "step": 6310 + }, + { + "epoch": 0.5, + "learning_rate": 1.0486071406961017e-05, + "loss": 0.4045, + "step": 6311 + }, + { + "epoch": 0.5, + "learning_rate": 1.0483508392366404e-05, + "loss": 0.4355, + "step": 6312 + }, + { + "epoch": 0.5, + "learning_rate": 1.0480945345935094e-05, + "loss": 0.4534, + "step": 6313 + }, + { + "epoch": 0.5, + "learning_rate": 1.0478382267835843e-05, + "loss": 0.3611, + "step": 6314 + }, + { + "epoch": 0.5, + "learning_rate": 1.0475819158237426e-05, + "loss": 0.4064, + "step": 6315 + }, + { + "epoch": 0.5, + "learning_rate": 1.0473256017308601e-05, + "loss": 0.4476, + "step": 6316 + }, + { + "epoch": 0.5, + "learning_rate": 1.047069284521815e-05, + "loss": 0.3944, + "step": 6317 + }, + { + "epoch": 0.5, + "learning_rate": 1.0468129642134837e-05, + "loss": 0.3735, + "step": 6318 + }, + { + "epoch": 0.5, + "learning_rate": 1.046556640822744e-05, + "loss": 0.3212, + "step": 6319 + }, + { + "epoch": 0.5, + "learning_rate": 1.0463003143664734e-05, + "loss": 0.3415, + "step": 6320 + }, + { + "epoch": 0.5, + "learning_rate": 1.0460439848615502e-05, + "loss": 0.266, + "step": 6321 + }, + { + "epoch": 0.5, + "learning_rate": 1.0457876523248518e-05, + "loss": 0.2452, + "step": 6322 + }, + { + "epoch": 0.5, + "learning_rate": 1.0455313167732573e-05, + "loss": 0.3876, + "step": 6323 + }, + { + "epoch": 0.5, + "learning_rate": 1.0452749782236443e-05, + "loss": 0.3462, + "step": 6324 + }, + { + "epoch": 0.5, + "learning_rate": 1.0450186366928917e-05, + "loss": 0.3353, + "step": 6325 + }, + { + "epoch": 0.5, + "learning_rate": 1.044762292197879e-05, + "loss": 0.3363, + "step": 6326 + }, + { + "epoch": 0.5, + "learning_rate": 1.0445059447554844e-05, + "loss": 0.3544, + "step": 6327 + }, + { + "epoch": 0.5, + "learning_rate": 1.0442495943825874e-05, + "loss": 0.3698, + "step": 6328 + }, + { + "epoch": 0.5, + "learning_rate": 1.0439932410960678e-05, + "loss": 0.4223, + "step": 6329 + }, + { + "epoch": 0.5, + "learning_rate": 1.0437368849128046e-05, + "loss": 0.3085, + "step": 6330 + }, + { + "epoch": 0.5, + "learning_rate": 1.043480525849678e-05, + "loss": 0.3224, + "step": 6331 + }, + { + "epoch": 0.5, + "learning_rate": 1.0432241639235686e-05, + "loss": 0.3052, + "step": 6332 + }, + { + "epoch": 0.5, + "learning_rate": 1.0429677991513554e-05, + "loss": 0.2526, + "step": 6333 + }, + { + "epoch": 0.5, + "learning_rate": 1.0427114315499196e-05, + "loss": 0.372, + "step": 6334 + }, + { + "epoch": 0.5, + "learning_rate": 1.0424550611361412e-05, + "loss": 0.3417, + "step": 6335 + }, + { + "epoch": 0.5, + "learning_rate": 1.0421986879269017e-05, + "loss": 0.4515, + "step": 6336 + }, + { + "epoch": 0.5, + "learning_rate": 1.0419423119390815e-05, + "loss": 0.3738, + "step": 6337 + }, + { + "epoch": 0.5, + "learning_rate": 1.041685933189562e-05, + "loss": 0.2692, + "step": 6338 + }, + { + "epoch": 0.5, + "learning_rate": 1.041429551695224e-05, + "loss": 0.3891, + "step": 6339 + }, + { + "epoch": 0.5, + "learning_rate": 1.0411731674729497e-05, + "loss": 0.3734, + "step": 6340 + }, + { + "epoch": 0.5, + "learning_rate": 1.0409167805396202e-05, + "loss": 0.2261, + "step": 6341 + }, + { + "epoch": 0.5, + "learning_rate": 1.040660390912118e-05, + "loss": 0.4555, + "step": 6342 + }, + { + "epoch": 0.5, + "learning_rate": 1.0404039986073244e-05, + "loss": 0.4407, + "step": 6343 + }, + { + "epoch": 0.5, + "learning_rate": 1.0401476036421219e-05, + "loss": 0.336, + "step": 6344 + }, + { + "epoch": 0.5, + "learning_rate": 1.039891206033393e-05, + "loss": 0.2796, + "step": 6345 + }, + { + "epoch": 0.5, + "learning_rate": 1.0396348057980202e-05, + "loss": 0.3759, + "step": 6346 + }, + { + "epoch": 0.5, + "learning_rate": 1.0393784029528858e-05, + "loss": 0.3289, + "step": 6347 + }, + { + "epoch": 0.5, + "learning_rate": 1.0391219975148734e-05, + "loss": 0.4748, + "step": 6348 + }, + { + "epoch": 0.5, + "learning_rate": 1.0388655895008654e-05, + "loss": 0.3468, + "step": 6349 + }, + { + "epoch": 0.5, + "learning_rate": 1.0386091789277458e-05, + "loss": 0.4049, + "step": 6350 + }, + { + "epoch": 0.5, + "learning_rate": 1.038352765812397e-05, + "loss": 0.3499, + "step": 6351 + }, + { + "epoch": 0.5, + "learning_rate": 1.0380963501717034e-05, + "loss": 0.3535, + "step": 6352 + }, + { + "epoch": 0.5, + "learning_rate": 1.0378399320225486e-05, + "loss": 0.4245, + "step": 6353 + }, + { + "epoch": 0.5, + "learning_rate": 1.037583511381816e-05, + "loss": 0.2647, + "step": 6354 + }, + { + "epoch": 0.5, + "learning_rate": 1.0373270882663899e-05, + "loss": 0.479, + "step": 6355 + }, + { + "epoch": 0.5, + "learning_rate": 1.0370706626931553e-05, + "loss": 0.404, + "step": 6356 + }, + { + "epoch": 0.5, + "learning_rate": 1.0368142346789954e-05, + "loss": 0.4002, + "step": 6357 + }, + { + "epoch": 0.5, + "learning_rate": 1.0365578042407956e-05, + "loss": 0.3309, + "step": 6358 + }, + { + "epoch": 0.5, + "learning_rate": 1.03630137139544e-05, + "loss": 0.3544, + "step": 6359 + }, + { + "epoch": 0.5, + "learning_rate": 1.0360449361598137e-05, + "loss": 0.3154, + "step": 6360 + }, + { + "epoch": 0.5, + "learning_rate": 1.0357884985508022e-05, + "loss": 0.3462, + "step": 6361 + }, + { + "epoch": 0.5, + "learning_rate": 1.03553205858529e-05, + "loss": 0.4339, + "step": 6362 + }, + { + "epoch": 0.5, + "learning_rate": 1.0352756162801626e-05, + "loss": 0.4559, + "step": 6363 + }, + { + "epoch": 0.5, + "learning_rate": 1.035019171652306e-05, + "loss": 0.4018, + "step": 6364 + }, + { + "epoch": 0.5, + "learning_rate": 1.0347627247186053e-05, + "loss": 0.2933, + "step": 6365 + }, + { + "epoch": 0.5, + "learning_rate": 1.0345062754959463e-05, + "loss": 0.4476, + "step": 6366 + }, + { + "epoch": 0.5, + "learning_rate": 1.0342498240012153e-05, + "loss": 0.3423, + "step": 6367 + }, + { + "epoch": 0.5, + "learning_rate": 1.0339933702512978e-05, + "loss": 0.2968, + "step": 6368 + }, + { + "epoch": 0.5, + "learning_rate": 1.0337369142630808e-05, + "loss": 0.2878, + "step": 6369 + }, + { + "epoch": 0.5, + "learning_rate": 1.0334804560534504e-05, + "loss": 0.3126, + "step": 6370 + }, + { + "epoch": 0.5, + "learning_rate": 1.0332239956392926e-05, + "loss": 0.3638, + "step": 6371 + }, + { + "epoch": 0.5, + "learning_rate": 1.032967533037495e-05, + "loss": 0.3644, + "step": 6372 + }, + { + "epoch": 0.5, + "learning_rate": 1.0327110682649436e-05, + "loss": 0.3853, + "step": 6373 + }, + { + "epoch": 0.5, + "learning_rate": 1.0324546013385258e-05, + "loss": 0.3158, + "step": 6374 + }, + { + "epoch": 0.51, + "learning_rate": 1.0321981322751291e-05, + "loss": 0.4848, + "step": 6375 + }, + { + "epoch": 0.51, + "learning_rate": 1.03194166109164e-05, + "loss": 0.3992, + "step": 6376 + }, + { + "epoch": 0.51, + "learning_rate": 1.0316851878049465e-05, + "loss": 0.3394, + "step": 6377 + }, + { + "epoch": 0.51, + "learning_rate": 1.0314287124319353e-05, + "loss": 0.4241, + "step": 6378 + }, + { + "epoch": 0.51, + "learning_rate": 1.031172234989495e-05, + "loss": 0.3059, + "step": 6379 + }, + { + "epoch": 0.51, + "learning_rate": 1.030915755494513e-05, + "loss": 0.5428, + "step": 6380 + }, + { + "epoch": 0.51, + "learning_rate": 1.030659273963877e-05, + "loss": 0.4659, + "step": 6381 + }, + { + "epoch": 0.51, + "learning_rate": 1.0304027904144756e-05, + "loss": 0.3371, + "step": 6382 + }, + { + "epoch": 0.51, + "learning_rate": 1.0301463048631968e-05, + "loss": 0.386, + "step": 6383 + }, + { + "epoch": 0.51, + "learning_rate": 1.0298898173269285e-05, + "loss": 0.301, + "step": 6384 + }, + { + "epoch": 0.51, + "learning_rate": 1.0296333278225599e-05, + "loss": 0.3133, + "step": 6385 + }, + { + "epoch": 0.51, + "learning_rate": 1.0293768363669791e-05, + "loss": 0.2937, + "step": 6386 + }, + { + "epoch": 0.51, + "learning_rate": 1.0291203429770749e-05, + "loss": 0.375, + "step": 6387 + }, + { + "epoch": 0.51, + "learning_rate": 1.0288638476697365e-05, + "loss": 0.3976, + "step": 6388 + }, + { + "epoch": 0.51, + "learning_rate": 1.0286073504618524e-05, + "loss": 0.4857, + "step": 6389 + }, + { + "epoch": 0.51, + "learning_rate": 1.0283508513703118e-05, + "loss": 0.3877, + "step": 6390 + }, + { + "epoch": 0.51, + "learning_rate": 1.0280943504120045e-05, + "loss": 0.3039, + "step": 6391 + }, + { + "epoch": 0.51, + "learning_rate": 1.027837847603819e-05, + "loss": 0.4382, + "step": 6392 + }, + { + "epoch": 0.51, + "learning_rate": 1.0275813429626456e-05, + "loss": 0.2952, + "step": 6393 + }, + { + "epoch": 0.51, + "learning_rate": 1.027324836505373e-05, + "loss": 0.4337, + "step": 6394 + }, + { + "epoch": 0.51, + "learning_rate": 1.0270683282488913e-05, + "loss": 0.4287, + "step": 6395 + }, + { + "epoch": 0.51, + "learning_rate": 1.026811818210091e-05, + "loss": 0.2726, + "step": 6396 + }, + { + "epoch": 0.51, + "learning_rate": 1.0265553064058612e-05, + "loss": 0.2379, + "step": 6397 + }, + { + "epoch": 0.51, + "learning_rate": 1.0262987928530921e-05, + "loss": 0.332, + "step": 6398 + }, + { + "epoch": 0.51, + "learning_rate": 1.0260422775686743e-05, + "loss": 0.4364, + "step": 6399 + }, + { + "epoch": 0.51, + "learning_rate": 1.0257857605694976e-05, + "loss": 0.3576, + "step": 6400 + }, + { + "epoch": 0.51, + "learning_rate": 1.025529241872453e-05, + "loss": 0.4212, + "step": 6401 + }, + { + "epoch": 0.51, + "learning_rate": 1.0252727214944302e-05, + "loss": 0.4368, + "step": 6402 + }, + { + "epoch": 0.51, + "learning_rate": 1.0250161994523205e-05, + "loss": 0.2477, + "step": 6403 + }, + { + "epoch": 0.51, + "learning_rate": 1.0247596757630147e-05, + "loss": 0.2563, + "step": 6404 + }, + { + "epoch": 0.51, + "learning_rate": 1.0245031504434032e-05, + "loss": 0.3047, + "step": 6405 + }, + { + "epoch": 0.51, + "learning_rate": 1.024246623510377e-05, + "loss": 0.3371, + "step": 6406 + }, + { + "epoch": 0.51, + "learning_rate": 1.0239900949808274e-05, + "loss": 0.4371, + "step": 6407 + }, + { + "epoch": 0.51, + "learning_rate": 1.0237335648716456e-05, + "loss": 0.4086, + "step": 6408 + }, + { + "epoch": 0.51, + "learning_rate": 1.0234770331997224e-05, + "loss": 0.4041, + "step": 6409 + }, + { + "epoch": 0.51, + "learning_rate": 1.02322049998195e-05, + "loss": 0.3908, + "step": 6410 + }, + { + "epoch": 0.51, + "learning_rate": 1.022963965235219e-05, + "loss": 0.3202, + "step": 6411 + }, + { + "epoch": 0.51, + "learning_rate": 1.0227074289764216e-05, + "loss": 0.4029, + "step": 6412 + }, + { + "epoch": 0.51, + "learning_rate": 1.0224508912224491e-05, + "loss": 0.3805, + "step": 6413 + }, + { + "epoch": 0.51, + "learning_rate": 1.0221943519901935e-05, + "loss": 0.3331, + "step": 6414 + }, + { + "epoch": 0.51, + "learning_rate": 1.0219378112965468e-05, + "loss": 0.395, + "step": 6415 + }, + { + "epoch": 0.51, + "learning_rate": 1.0216812691584005e-05, + "loss": 0.3148, + "step": 6416 + }, + { + "epoch": 0.51, + "learning_rate": 1.021424725592647e-05, + "loss": 0.3199, + "step": 6417 + }, + { + "epoch": 0.51, + "learning_rate": 1.0211681806161787e-05, + "loss": 0.3222, + "step": 6418 + }, + { + "epoch": 0.51, + "learning_rate": 1.0209116342458872e-05, + "loss": 0.3835, + "step": 6419 + }, + { + "epoch": 0.51, + "learning_rate": 1.0206550864986656e-05, + "loss": 0.3651, + "step": 6420 + }, + { + "epoch": 0.51, + "learning_rate": 1.0203985373914056e-05, + "loss": 0.4118, + "step": 6421 + }, + { + "epoch": 0.51, + "learning_rate": 1.0201419869410001e-05, + "loss": 0.3948, + "step": 6422 + }, + { + "epoch": 0.51, + "learning_rate": 1.0198854351643416e-05, + "loss": 0.38, + "step": 6423 + }, + { + "epoch": 0.51, + "learning_rate": 1.0196288820783232e-05, + "loss": 0.3621, + "step": 6424 + }, + { + "epoch": 0.51, + "learning_rate": 1.0193723276998371e-05, + "loss": 0.3591, + "step": 6425 + }, + { + "epoch": 0.51, + "learning_rate": 1.0191157720457765e-05, + "loss": 0.3752, + "step": 6426 + }, + { + "epoch": 0.51, + "learning_rate": 1.0188592151330343e-05, + "loss": 0.3434, + "step": 6427 + }, + { + "epoch": 0.51, + "learning_rate": 1.0186026569785037e-05, + "loss": 0.3034, + "step": 6428 + }, + { + "epoch": 0.51, + "learning_rate": 1.0183460975990773e-05, + "loss": 0.3829, + "step": 6429 + }, + { + "epoch": 0.51, + "learning_rate": 1.0180895370116488e-05, + "loss": 0.3397, + "step": 6430 + }, + { + "epoch": 0.51, + "learning_rate": 1.0178329752331116e-05, + "loss": 0.3413, + "step": 6431 + }, + { + "epoch": 0.51, + "learning_rate": 1.0175764122803584e-05, + "loss": 0.3226, + "step": 6432 + }, + { + "epoch": 0.51, + "learning_rate": 1.017319848170283e-05, + "loss": 0.3317, + "step": 6433 + }, + { + "epoch": 0.51, + "learning_rate": 1.0170632829197792e-05, + "loss": 0.3648, + "step": 6434 + }, + { + "epoch": 0.51, + "learning_rate": 1.0168067165457403e-05, + "loss": 0.3163, + "step": 6435 + }, + { + "epoch": 0.51, + "learning_rate": 1.01655014906506e-05, + "loss": 0.3109, + "step": 6436 + }, + { + "epoch": 0.51, + "learning_rate": 1.016293580494632e-05, + "loss": 0.3163, + "step": 6437 + }, + { + "epoch": 0.51, + "learning_rate": 1.0160370108513497e-05, + "loss": 0.3992, + "step": 6438 + }, + { + "epoch": 0.51, + "learning_rate": 1.015780440152108e-05, + "loss": 0.3651, + "step": 6439 + }, + { + "epoch": 0.51, + "learning_rate": 1.0155238684138e-05, + "loss": 0.3132, + "step": 6440 + }, + { + "epoch": 0.51, + "learning_rate": 1.0152672956533198e-05, + "loss": 0.2776, + "step": 6441 + }, + { + "epoch": 0.51, + "learning_rate": 1.015010721887562e-05, + "loss": 0.3625, + "step": 6442 + }, + { + "epoch": 0.51, + "learning_rate": 1.0147541471334204e-05, + "loss": 0.3063, + "step": 6443 + }, + { + "epoch": 0.51, + "learning_rate": 1.0144975714077889e-05, + "loss": 0.2453, + "step": 6444 + }, + { + "epoch": 0.51, + "learning_rate": 1.0142409947275621e-05, + "loss": 0.4268, + "step": 6445 + }, + { + "epoch": 0.51, + "learning_rate": 1.0139844171096345e-05, + "loss": 0.3861, + "step": 6446 + }, + { + "epoch": 0.51, + "learning_rate": 1.0137278385709004e-05, + "loss": 0.3311, + "step": 6447 + }, + { + "epoch": 0.51, + "learning_rate": 1.0134712591282539e-05, + "loss": 0.3431, + "step": 6448 + }, + { + "epoch": 0.51, + "learning_rate": 1.0132146787985898e-05, + "loss": 0.3398, + "step": 6449 + }, + { + "epoch": 0.51, + "learning_rate": 1.0129580975988029e-05, + "loss": 0.3391, + "step": 6450 + }, + { + "epoch": 0.51, + "learning_rate": 1.0127015155457875e-05, + "loss": 0.3246, + "step": 6451 + }, + { + "epoch": 0.51, + "learning_rate": 1.0124449326564383e-05, + "loss": 0.3497, + "step": 6452 + }, + { + "epoch": 0.51, + "learning_rate": 1.0121883489476505e-05, + "loss": 0.3701, + "step": 6453 + }, + { + "epoch": 0.51, + "learning_rate": 1.0119317644363182e-05, + "loss": 0.3676, + "step": 6454 + }, + { + "epoch": 0.51, + "learning_rate": 1.0116751791393371e-05, + "loss": 0.3015, + "step": 6455 + }, + { + "epoch": 0.51, + "learning_rate": 1.011418593073601e-05, + "loss": 0.3717, + "step": 6456 + }, + { + "epoch": 0.51, + "learning_rate": 1.0111620062560059e-05, + "loss": 0.2797, + "step": 6457 + }, + { + "epoch": 0.51, + "learning_rate": 1.0109054187034463e-05, + "loss": 0.4062, + "step": 6458 + }, + { + "epoch": 0.51, + "learning_rate": 1.0106488304328175e-05, + "loss": 0.304, + "step": 6459 + }, + { + "epoch": 0.51, + "learning_rate": 1.010392241461014e-05, + "loss": 0.2808, + "step": 6460 + }, + { + "epoch": 0.51, + "learning_rate": 1.010135651804932e-05, + "loss": 0.3692, + "step": 6461 + }, + { + "epoch": 0.51, + "learning_rate": 1.0098790614814658e-05, + "loss": 0.3235, + "step": 6462 + }, + { + "epoch": 0.51, + "learning_rate": 1.009622470507511e-05, + "loss": 0.4366, + "step": 6463 + }, + { + "epoch": 0.51, + "learning_rate": 1.0093658788999628e-05, + "loss": 0.4379, + "step": 6464 + }, + { + "epoch": 0.51, + "learning_rate": 1.0091092866757164e-05, + "loss": 0.344, + "step": 6465 + }, + { + "epoch": 0.51, + "learning_rate": 1.0088526938516676e-05, + "loss": 0.3257, + "step": 6466 + }, + { + "epoch": 0.51, + "learning_rate": 1.0085961004447114e-05, + "loss": 0.2885, + "step": 6467 + }, + { + "epoch": 0.51, + "learning_rate": 1.0083395064717429e-05, + "loss": 0.361, + "step": 6468 + }, + { + "epoch": 0.51, + "learning_rate": 1.0080829119496587e-05, + "loss": 0.3277, + "step": 6469 + }, + { + "epoch": 0.51, + "learning_rate": 1.0078263168953532e-05, + "loss": 0.3222, + "step": 6470 + }, + { + "epoch": 0.51, + "learning_rate": 1.0075697213257227e-05, + "loss": 0.3258, + "step": 6471 + }, + { + "epoch": 0.51, + "learning_rate": 1.0073131252576622e-05, + "loss": 0.3617, + "step": 6472 + }, + { + "epoch": 0.51, + "learning_rate": 1.0070565287080676e-05, + "loss": 0.4023, + "step": 6473 + }, + { + "epoch": 0.51, + "learning_rate": 1.0067999316938348e-05, + "loss": 0.4788, + "step": 6474 + }, + { + "epoch": 0.51, + "learning_rate": 1.006543334231859e-05, + "loss": 0.4014, + "step": 6475 + }, + { + "epoch": 0.51, + "learning_rate": 1.0062867363390361e-05, + "loss": 0.4521, + "step": 6476 + }, + { + "epoch": 0.51, + "learning_rate": 1.0060301380322622e-05, + "loss": 0.4394, + "step": 6477 + }, + { + "epoch": 0.51, + "learning_rate": 1.0057735393284322e-05, + "loss": 0.345, + "step": 6478 + }, + { + "epoch": 0.51, + "learning_rate": 1.0055169402444429e-05, + "loss": 0.465, + "step": 6479 + }, + { + "epoch": 0.51, + "learning_rate": 1.0052603407971892e-05, + "loss": 0.3646, + "step": 6480 + }, + { + "epoch": 0.51, + "learning_rate": 1.0050037410035676e-05, + "loss": 0.3385, + "step": 6481 + }, + { + "epoch": 0.51, + "learning_rate": 1.004747140880474e-05, + "loss": 0.4359, + "step": 6482 + }, + { + "epoch": 0.51, + "learning_rate": 1.0044905404448037e-05, + "loss": 0.3911, + "step": 6483 + }, + { + "epoch": 0.51, + "learning_rate": 1.0042339397134528e-05, + "loss": 0.3388, + "step": 6484 + }, + { + "epoch": 0.51, + "learning_rate": 1.0039773387033178e-05, + "loss": 0.3452, + "step": 6485 + }, + { + "epoch": 0.51, + "learning_rate": 1.0037207374312936e-05, + "loss": 0.3611, + "step": 6486 + }, + { + "epoch": 0.51, + "learning_rate": 1.003464135914277e-05, + "loss": 0.3275, + "step": 6487 + }, + { + "epoch": 0.51, + "learning_rate": 1.0032075341691639e-05, + "loss": 0.4185, + "step": 6488 + }, + { + "epoch": 0.51, + "learning_rate": 1.0029509322128499e-05, + "loss": 0.2572, + "step": 6489 + }, + { + "epoch": 0.51, + "learning_rate": 1.0026943300622313e-05, + "loss": 0.4632, + "step": 6490 + }, + { + "epoch": 0.51, + "learning_rate": 1.0024377277342038e-05, + "loss": 0.3206, + "step": 6491 + }, + { + "epoch": 0.51, + "learning_rate": 1.002181125245664e-05, + "loss": 0.4621, + "step": 6492 + }, + { + "epoch": 0.51, + "learning_rate": 1.0019245226135075e-05, + "loss": 0.483, + "step": 6493 + }, + { + "epoch": 0.51, + "learning_rate": 1.0016679198546304e-05, + "loss": 0.391, + "step": 6494 + }, + { + "epoch": 0.51, + "learning_rate": 1.0014113169859285e-05, + "loss": 0.3461, + "step": 6495 + }, + { + "epoch": 0.51, + "learning_rate": 1.0011547140242987e-05, + "loss": 0.3318, + "step": 6496 + }, + { + "epoch": 0.51, + "learning_rate": 1.0008981109866363e-05, + "loss": 0.21, + "step": 6497 + }, + { + "epoch": 0.51, + "learning_rate": 1.0006415078898377e-05, + "loss": 0.3157, + "step": 6498 + }, + { + "epoch": 0.51, + "learning_rate": 1.0003849047507987e-05, + "loss": 0.4363, + "step": 6499 + }, + { + "epoch": 0.51, + "learning_rate": 1.0001283015864157e-05, + "loss": 0.3465, + "step": 6500 + }, + { + "epoch": 0.52, + "learning_rate": 9.998716984135847e-06, + "loss": 0.4997, + "step": 6501 + }, + { + "epoch": 0.52, + "learning_rate": 9.996150952492018e-06, + "loss": 0.4185, + "step": 6502 + }, + { + "epoch": 0.52, + "learning_rate": 9.993584921101628e-06, + "loss": 0.3881, + "step": 6503 + }, + { + "epoch": 0.52, + "learning_rate": 9.991018890133642e-06, + "loss": 0.3333, + "step": 6504 + }, + { + "epoch": 0.52, + "learning_rate": 9.988452859757017e-06, + "loss": 0.3992, + "step": 6505 + }, + { + "epoch": 0.52, + "learning_rate": 9.985886830140717e-06, + "loss": 0.2015, + "step": 6506 + }, + { + "epoch": 0.52, + "learning_rate": 9.983320801453702e-06, + "loss": 0.3172, + "step": 6507 + }, + { + "epoch": 0.52, + "learning_rate": 9.98075477386493e-06, + "loss": 0.3522, + "step": 6508 + }, + { + "epoch": 0.52, + "learning_rate": 9.978188747543364e-06, + "loss": 0.3618, + "step": 6509 + }, + { + "epoch": 0.52, + "learning_rate": 9.975622722657965e-06, + "loss": 0.3423, + "step": 6510 + }, + { + "epoch": 0.52, + "learning_rate": 9.973056699377692e-06, + "loss": 0.3695, + "step": 6511 + }, + { + "epoch": 0.52, + "learning_rate": 9.970490677871506e-06, + "loss": 0.3034, + "step": 6512 + }, + { + "epoch": 0.52, + "learning_rate": 9.967924658308366e-06, + "loss": 0.4006, + "step": 6513 + }, + { + "epoch": 0.52, + "learning_rate": 9.965358640857231e-06, + "loss": 0.2858, + "step": 6514 + }, + { + "epoch": 0.52, + "learning_rate": 9.962792625687067e-06, + "loss": 0.4616, + "step": 6515 + }, + { + "epoch": 0.52, + "learning_rate": 9.960226612966828e-06, + "loss": 0.3214, + "step": 6516 + }, + { + "epoch": 0.52, + "learning_rate": 9.957660602865477e-06, + "loss": 0.3186, + "step": 6517 + }, + { + "epoch": 0.52, + "learning_rate": 9.955094595551968e-06, + "loss": 0.3514, + "step": 6518 + }, + { + "epoch": 0.52, + "learning_rate": 9.952528591195265e-06, + "loss": 0.2891, + "step": 6519 + }, + { + "epoch": 0.52, + "learning_rate": 9.949962589964327e-06, + "loss": 0.3491, + "step": 6520 + }, + { + "epoch": 0.52, + "learning_rate": 9.94739659202811e-06, + "loss": 0.348, + "step": 6521 + }, + { + "epoch": 0.52, + "learning_rate": 9.944830597555573e-06, + "loss": 0.3963, + "step": 6522 + }, + { + "epoch": 0.52, + "learning_rate": 9.94226460671568e-06, + "loss": 0.2236, + "step": 6523 + }, + { + "epoch": 0.52, + "learning_rate": 9.939698619677383e-06, + "loss": 0.2792, + "step": 6524 + }, + { + "epoch": 0.52, + "learning_rate": 9.937132636609642e-06, + "loss": 0.3195, + "step": 6525 + }, + { + "epoch": 0.52, + "learning_rate": 9.934566657681412e-06, + "loss": 0.3277, + "step": 6526 + }, + { + "epoch": 0.52, + "learning_rate": 9.932000683061654e-06, + "loss": 0.3826, + "step": 6527 + }, + { + "epoch": 0.52, + "learning_rate": 9.929434712919327e-06, + "loss": 0.4267, + "step": 6528 + }, + { + "epoch": 0.52, + "learning_rate": 9.926868747423381e-06, + "loss": 0.4378, + "step": 6529 + }, + { + "epoch": 0.52, + "learning_rate": 9.924302786742775e-06, + "loss": 0.3408, + "step": 6530 + }, + { + "epoch": 0.52, + "learning_rate": 9.92173683104647e-06, + "loss": 0.3819, + "step": 6531 + }, + { + "epoch": 0.52, + "learning_rate": 9.919170880503416e-06, + "loss": 0.2606, + "step": 6532 + }, + { + "epoch": 0.52, + "learning_rate": 9.916604935282573e-06, + "loss": 0.4687, + "step": 6533 + }, + { + "epoch": 0.52, + "learning_rate": 9.914038995552891e-06, + "loss": 0.4139, + "step": 6534 + }, + { + "epoch": 0.52, + "learning_rate": 9.911473061483326e-06, + "loss": 0.305, + "step": 6535 + }, + { + "epoch": 0.52, + "learning_rate": 9.908907133242838e-06, + "loss": 0.3429, + "step": 6536 + }, + { + "epoch": 0.52, + "learning_rate": 9.906341211000375e-06, + "loss": 0.423, + "step": 6537 + }, + { + "epoch": 0.52, + "learning_rate": 9.903775294924892e-06, + "loss": 0.3209, + "step": 6538 + }, + { + "epoch": 0.52, + "learning_rate": 9.901209385185345e-06, + "loss": 0.3094, + "step": 6539 + }, + { + "epoch": 0.52, + "learning_rate": 9.898643481950683e-06, + "loss": 0.4217, + "step": 6540 + }, + { + "epoch": 0.52, + "learning_rate": 9.89607758538986e-06, + "loss": 0.4318, + "step": 6541 + }, + { + "epoch": 0.52, + "learning_rate": 9.893511695671828e-06, + "loss": 0.3977, + "step": 6542 + }, + { + "epoch": 0.52, + "learning_rate": 9.890945812965538e-06, + "loss": 0.3931, + "step": 6543 + }, + { + "epoch": 0.52, + "learning_rate": 9.888379937439944e-06, + "loss": 0.3263, + "step": 6544 + }, + { + "epoch": 0.52, + "learning_rate": 9.885814069263991e-06, + "loss": 0.2923, + "step": 6545 + }, + { + "epoch": 0.52, + "learning_rate": 9.883248208606632e-06, + "loss": 0.386, + "step": 6546 + }, + { + "epoch": 0.52, + "learning_rate": 9.880682355636821e-06, + "loss": 0.3649, + "step": 6547 + }, + { + "epoch": 0.52, + "learning_rate": 9.878116510523498e-06, + "loss": 0.3651, + "step": 6548 + }, + { + "epoch": 0.52, + "learning_rate": 9.87555067343562e-06, + "loss": 0.2635, + "step": 6549 + }, + { + "epoch": 0.52, + "learning_rate": 9.872984844542128e-06, + "loss": 0.3099, + "step": 6550 + }, + { + "epoch": 0.52, + "learning_rate": 9.870419024011973e-06, + "loss": 0.4044, + "step": 6551 + }, + { + "epoch": 0.52, + "learning_rate": 9.867853212014104e-06, + "loss": 0.2662, + "step": 6552 + }, + { + "epoch": 0.52, + "learning_rate": 9.865287408717464e-06, + "loss": 0.3206, + "step": 6553 + }, + { + "epoch": 0.52, + "learning_rate": 9.862721614291e-06, + "loss": 0.3721, + "step": 6554 + }, + { + "epoch": 0.52, + "learning_rate": 9.860155828903658e-06, + "loss": 0.354, + "step": 6555 + }, + { + "epoch": 0.52, + "learning_rate": 9.85759005272438e-06, + "loss": 0.3833, + "step": 6556 + }, + { + "epoch": 0.52, + "learning_rate": 9.855024285922114e-06, + "loss": 0.4091, + "step": 6557 + }, + { + "epoch": 0.52, + "learning_rate": 9.8524585286658e-06, + "loss": 0.3955, + "step": 6558 + }, + { + "epoch": 0.52, + "learning_rate": 9.84989278112438e-06, + "loss": 0.3623, + "step": 6559 + }, + { + "epoch": 0.52, + "learning_rate": 9.847327043466802e-06, + "loss": 0.2896, + "step": 6560 + }, + { + "epoch": 0.52, + "learning_rate": 9.844761315862002e-06, + "loss": 0.3454, + "step": 6561 + }, + { + "epoch": 0.52, + "learning_rate": 9.842195598478922e-06, + "loss": 0.2897, + "step": 6562 + }, + { + "epoch": 0.52, + "learning_rate": 9.839629891486503e-06, + "loss": 0.2619, + "step": 6563 + }, + { + "epoch": 0.52, + "learning_rate": 9.83706419505368e-06, + "loss": 0.3553, + "step": 6564 + }, + { + "epoch": 0.52, + "learning_rate": 9.834498509349402e-06, + "loss": 0.3455, + "step": 6565 + }, + { + "epoch": 0.52, + "learning_rate": 9.831932834542598e-06, + "loss": 0.3488, + "step": 6566 + }, + { + "epoch": 0.52, + "learning_rate": 9.829367170802208e-06, + "loss": 0.3712, + "step": 6567 + }, + { + "epoch": 0.52, + "learning_rate": 9.82680151829717e-06, + "loss": 0.3013, + "step": 6568 + }, + { + "epoch": 0.52, + "learning_rate": 9.824235877196418e-06, + "loss": 0.2985, + "step": 6569 + }, + { + "epoch": 0.52, + "learning_rate": 9.821670247668887e-06, + "loss": 0.3736, + "step": 6570 + }, + { + "epoch": 0.52, + "learning_rate": 9.819104629883513e-06, + "loss": 0.2322, + "step": 6571 + }, + { + "epoch": 0.52, + "learning_rate": 9.816539024009227e-06, + "loss": 0.3249, + "step": 6572 + }, + { + "epoch": 0.52, + "learning_rate": 9.813973430214965e-06, + "loss": 0.2852, + "step": 6573 + }, + { + "epoch": 0.52, + "learning_rate": 9.811407848669657e-06, + "loss": 0.4162, + "step": 6574 + }, + { + "epoch": 0.52, + "learning_rate": 9.808842279542235e-06, + "loss": 0.3598, + "step": 6575 + }, + { + "epoch": 0.52, + "learning_rate": 9.80627672300163e-06, + "loss": 0.2771, + "step": 6576 + }, + { + "epoch": 0.52, + "learning_rate": 9.80371117921677e-06, + "loss": 0.5204, + "step": 6577 + }, + { + "epoch": 0.52, + "learning_rate": 9.801145648356585e-06, + "loss": 0.3281, + "step": 6578 + }, + { + "epoch": 0.52, + "learning_rate": 9.798580130590004e-06, + "loss": 0.3055, + "step": 6579 + }, + { + "epoch": 0.52, + "learning_rate": 9.79601462608595e-06, + "loss": 0.3556, + "step": 6580 + }, + { + "epoch": 0.52, + "learning_rate": 9.79344913501335e-06, + "loss": 0.3073, + "step": 6581 + }, + { + "epoch": 0.52, + "learning_rate": 9.790883657541133e-06, + "loss": 0.3791, + "step": 6582 + }, + { + "epoch": 0.52, + "learning_rate": 9.788318193838218e-06, + "loss": 0.3853, + "step": 6583 + }, + { + "epoch": 0.52, + "learning_rate": 9.785752744073534e-06, + "loss": 0.2995, + "step": 6584 + }, + { + "epoch": 0.52, + "learning_rate": 9.783187308416e-06, + "loss": 0.4187, + "step": 6585 + }, + { + "epoch": 0.52, + "learning_rate": 9.780621887034537e-06, + "loss": 0.3039, + "step": 6586 + }, + { + "epoch": 0.52, + "learning_rate": 9.778056480098068e-06, + "loss": 0.2926, + "step": 6587 + }, + { + "epoch": 0.52, + "learning_rate": 9.775491087775514e-06, + "loss": 0.4238, + "step": 6588 + }, + { + "epoch": 0.52, + "learning_rate": 9.772925710235789e-06, + "loss": 0.3749, + "step": 6589 + }, + { + "epoch": 0.52, + "learning_rate": 9.770360347647817e-06, + "loss": 0.4372, + "step": 6590 + }, + { + "epoch": 0.52, + "learning_rate": 9.767795000180507e-06, + "loss": 0.3246, + "step": 6591 + }, + { + "epoch": 0.52, + "learning_rate": 9.76522966800278e-06, + "loss": 0.4043, + "step": 6592 + }, + { + "epoch": 0.52, + "learning_rate": 9.76266435128355e-06, + "loss": 0.4729, + "step": 6593 + }, + { + "epoch": 0.52, + "learning_rate": 9.76009905019173e-06, + "loss": 0.4243, + "step": 6594 + }, + { + "epoch": 0.52, + "learning_rate": 9.757533764896235e-06, + "loss": 0.2497, + "step": 6595 + }, + { + "epoch": 0.52, + "learning_rate": 9.754968495565973e-06, + "loss": 0.3058, + "step": 6596 + }, + { + "epoch": 0.52, + "learning_rate": 9.752403242369857e-06, + "loss": 0.4189, + "step": 6597 + }, + { + "epoch": 0.52, + "learning_rate": 9.749838005476798e-06, + "loss": 0.3279, + "step": 6598 + }, + { + "epoch": 0.52, + "learning_rate": 9.7472727850557e-06, + "loss": 0.288, + "step": 6599 + }, + { + "epoch": 0.52, + "learning_rate": 9.744707581275473e-06, + "loss": 0.3541, + "step": 6600 + }, + { + "epoch": 0.52, + "learning_rate": 9.742142394305026e-06, + "loss": 0.3695, + "step": 6601 + }, + { + "epoch": 0.52, + "learning_rate": 9.739577224313258e-06, + "loss": 0.3217, + "step": 6602 + }, + { + "epoch": 0.52, + "learning_rate": 9.737012071469082e-06, + "loss": 0.2565, + "step": 6603 + }, + { + "epoch": 0.52, + "learning_rate": 9.734446935941392e-06, + "loss": 0.4219, + "step": 6604 + }, + { + "epoch": 0.52, + "learning_rate": 9.731881817899092e-06, + "loss": 0.2722, + "step": 6605 + }, + { + "epoch": 0.52, + "learning_rate": 9.729316717511088e-06, + "loss": 0.317, + "step": 6606 + }, + { + "epoch": 0.52, + "learning_rate": 9.726751634946272e-06, + "loss": 0.3137, + "step": 6607 + }, + { + "epoch": 0.52, + "learning_rate": 9.724186570373548e-06, + "loss": 0.3535, + "step": 6608 + }, + { + "epoch": 0.52, + "learning_rate": 9.721621523961812e-06, + "loss": 0.2846, + "step": 6609 + }, + { + "epoch": 0.52, + "learning_rate": 9.719056495879958e-06, + "loss": 0.3918, + "step": 6610 + }, + { + "epoch": 0.52, + "learning_rate": 9.716491486296883e-06, + "loss": 0.4037, + "step": 6611 + }, + { + "epoch": 0.52, + "learning_rate": 9.71392649538148e-06, + "loss": 0.3861, + "step": 6612 + }, + { + "epoch": 0.52, + "learning_rate": 9.711361523302638e-06, + "loss": 0.3761, + "step": 6613 + }, + { + "epoch": 0.52, + "learning_rate": 9.708796570229253e-06, + "loss": 0.3541, + "step": 6614 + }, + { + "epoch": 0.52, + "learning_rate": 9.706231636330212e-06, + "loss": 0.3493, + "step": 6615 + }, + { + "epoch": 0.52, + "learning_rate": 9.703666721774403e-06, + "loss": 0.3331, + "step": 6616 + }, + { + "epoch": 0.52, + "learning_rate": 9.701101826730718e-06, + "loss": 0.3885, + "step": 6617 + }, + { + "epoch": 0.52, + "learning_rate": 9.698536951368035e-06, + "loss": 0.3236, + "step": 6618 + }, + { + "epoch": 0.52, + "learning_rate": 9.695972095855248e-06, + "loss": 0.3325, + "step": 6619 + }, + { + "epoch": 0.52, + "learning_rate": 9.693407260361231e-06, + "loss": 0.3563, + "step": 6620 + }, + { + "epoch": 0.52, + "learning_rate": 9.690842445054873e-06, + "loss": 0.3878, + "step": 6621 + }, + { + "epoch": 0.52, + "learning_rate": 9.688277650105053e-06, + "loss": 0.3962, + "step": 6622 + }, + { + "epoch": 0.52, + "learning_rate": 9.685712875680649e-06, + "loss": 0.3163, + "step": 6623 + }, + { + "epoch": 0.52, + "learning_rate": 9.683148121950539e-06, + "loss": 0.3328, + "step": 6624 + }, + { + "epoch": 0.52, + "learning_rate": 9.680583389083602e-06, + "loss": 0.3358, + "step": 6625 + }, + { + "epoch": 0.52, + "learning_rate": 9.67801867724871e-06, + "loss": 0.3986, + "step": 6626 + }, + { + "epoch": 0.53, + "learning_rate": 9.675453986614743e-06, + "loss": 0.3328, + "step": 6627 + }, + { + "epoch": 0.53, + "learning_rate": 9.672889317350565e-06, + "loss": 0.3108, + "step": 6628 + }, + { + "epoch": 0.53, + "learning_rate": 9.670324669625053e-06, + "loss": 0.3323, + "step": 6629 + }, + { + "epoch": 0.53, + "learning_rate": 9.667760043607077e-06, + "loss": 0.2999, + "step": 6630 + }, + { + "epoch": 0.53, + "learning_rate": 9.6651954394655e-06, + "loss": 0.4302, + "step": 6631 + }, + { + "epoch": 0.53, + "learning_rate": 9.662630857369194e-06, + "loss": 0.404, + "step": 6632 + }, + { + "epoch": 0.53, + "learning_rate": 9.660066297487024e-06, + "loss": 0.3319, + "step": 6633 + }, + { + "epoch": 0.53, + "learning_rate": 9.65750175998785e-06, + "loss": 0.4062, + "step": 6634 + }, + { + "epoch": 0.53, + "learning_rate": 9.65493724504054e-06, + "loss": 0.3571, + "step": 6635 + }, + { + "epoch": 0.53, + "learning_rate": 9.65237275281395e-06, + "loss": 0.4056, + "step": 6636 + }, + { + "epoch": 0.53, + "learning_rate": 9.64980828347694e-06, + "loss": 0.4629, + "step": 6637 + }, + { + "epoch": 0.53, + "learning_rate": 9.647243837198375e-06, + "loss": 0.3914, + "step": 6638 + }, + { + "epoch": 0.53, + "learning_rate": 9.644679414147102e-06, + "loss": 0.281, + "step": 6639 + }, + { + "epoch": 0.53, + "learning_rate": 9.64211501449198e-06, + "loss": 0.2816, + "step": 6640 + }, + { + "epoch": 0.53, + "learning_rate": 9.639550638401863e-06, + "loss": 0.3303, + "step": 6641 + }, + { + "epoch": 0.53, + "learning_rate": 9.6369862860456e-06, + "loss": 0.3497, + "step": 6642 + }, + { + "epoch": 0.53, + "learning_rate": 9.634421957592048e-06, + "loss": 0.3465, + "step": 6643 + }, + { + "epoch": 0.53, + "learning_rate": 9.631857653210048e-06, + "loss": 0.3673, + "step": 6644 + }, + { + "epoch": 0.53, + "learning_rate": 9.629293373068449e-06, + "loss": 0.3376, + "step": 6645 + }, + { + "epoch": 0.53, + "learning_rate": 9.626729117336101e-06, + "loss": 0.3507, + "step": 6646 + }, + { + "epoch": 0.53, + "learning_rate": 9.624164886181841e-06, + "loss": 0.3712, + "step": 6647 + }, + { + "epoch": 0.53, + "learning_rate": 9.621600679774516e-06, + "loss": 0.2842, + "step": 6648 + }, + { + "epoch": 0.53, + "learning_rate": 9.619036498282968e-06, + "loss": 0.4483, + "step": 6649 + }, + { + "epoch": 0.53, + "learning_rate": 9.61647234187603e-06, + "loss": 0.2988, + "step": 6650 + }, + { + "epoch": 0.53, + "learning_rate": 9.613908210722546e-06, + "loss": 0.3219, + "step": 6651 + }, + { + "epoch": 0.53, + "learning_rate": 9.611344104991346e-06, + "loss": 0.3916, + "step": 6652 + }, + { + "epoch": 0.53, + "learning_rate": 9.608780024851266e-06, + "loss": 0.2908, + "step": 6653 + }, + { + "epoch": 0.53, + "learning_rate": 9.606215970471142e-06, + "loss": 0.2083, + "step": 6654 + }, + { + "epoch": 0.53, + "learning_rate": 9.6036519420198e-06, + "loss": 0.4308, + "step": 6655 + }, + { + "epoch": 0.53, + "learning_rate": 9.601087939666071e-06, + "loss": 0.2254, + "step": 6656 + }, + { + "epoch": 0.53, + "learning_rate": 9.598523963578785e-06, + "loss": 0.3857, + "step": 6657 + }, + { + "epoch": 0.53, + "learning_rate": 9.595960013926761e-06, + "loss": 0.3595, + "step": 6658 + }, + { + "epoch": 0.53, + "learning_rate": 9.593396090878823e-06, + "loss": 0.2502, + "step": 6659 + }, + { + "epoch": 0.53, + "learning_rate": 9.590832194603801e-06, + "loss": 0.31, + "step": 6660 + }, + { + "epoch": 0.53, + "learning_rate": 9.588268325270506e-06, + "loss": 0.52, + "step": 6661 + }, + { + "epoch": 0.53, + "learning_rate": 9.585704483047761e-06, + "loss": 0.2527, + "step": 6662 + }, + { + "epoch": 0.53, + "learning_rate": 9.583140668104387e-06, + "loss": 0.3664, + "step": 6663 + }, + { + "epoch": 0.53, + "learning_rate": 9.58057688060919e-06, + "loss": 0.4305, + "step": 6664 + }, + { + "epoch": 0.53, + "learning_rate": 9.578013120730987e-06, + "loss": 0.3321, + "step": 6665 + }, + { + "epoch": 0.53, + "learning_rate": 9.575449388638592e-06, + "loss": 0.3443, + "step": 6666 + }, + { + "epoch": 0.53, + "learning_rate": 9.57288568450081e-06, + "loss": 0.3859, + "step": 6667 + }, + { + "epoch": 0.53, + "learning_rate": 9.570322008486453e-06, + "loss": 0.3939, + "step": 6668 + }, + { + "epoch": 0.53, + "learning_rate": 9.567758360764321e-06, + "loss": 0.401, + "step": 6669 + }, + { + "epoch": 0.53, + "learning_rate": 9.565194741503221e-06, + "loss": 0.3354, + "step": 6670 + }, + { + "epoch": 0.53, + "learning_rate": 9.562631150871959e-06, + "loss": 0.3086, + "step": 6671 + }, + { + "epoch": 0.53, + "learning_rate": 9.560067589039327e-06, + "loss": 0.322, + "step": 6672 + }, + { + "epoch": 0.53, + "learning_rate": 9.55750405617413e-06, + "loss": 0.3147, + "step": 6673 + }, + { + "epoch": 0.53, + "learning_rate": 9.554940552445161e-06, + "loss": 0.3362, + "step": 6674 + }, + { + "epoch": 0.53, + "learning_rate": 9.552377078021215e-06, + "loss": 0.4121, + "step": 6675 + }, + { + "epoch": 0.53, + "learning_rate": 9.549813633071085e-06, + "loss": 0.3807, + "step": 6676 + }, + { + "epoch": 0.53, + "learning_rate": 9.54725021776356e-06, + "loss": 0.3708, + "step": 6677 + }, + { + "epoch": 0.53, + "learning_rate": 9.54468683226743e-06, + "loss": 0.4317, + "step": 6678 + }, + { + "epoch": 0.53, + "learning_rate": 9.542123476751484e-06, + "loss": 0.2775, + "step": 6679 + }, + { + "epoch": 0.53, + "learning_rate": 9.5395601513845e-06, + "loss": 0.3173, + "step": 6680 + }, + { + "epoch": 0.53, + "learning_rate": 9.536996856335269e-06, + "loss": 0.4393, + "step": 6681 + }, + { + "epoch": 0.53, + "learning_rate": 9.534433591772562e-06, + "loss": 0.4261, + "step": 6682 + }, + { + "epoch": 0.53, + "learning_rate": 9.531870357865165e-06, + "loss": 0.2945, + "step": 6683 + }, + { + "epoch": 0.53, + "learning_rate": 9.529307154781855e-06, + "loss": 0.3917, + "step": 6684 + }, + { + "epoch": 0.53, + "learning_rate": 9.5267439826914e-06, + "loss": 0.416, + "step": 6685 + }, + { + "epoch": 0.53, + "learning_rate": 9.524180841762577e-06, + "loss": 0.306, + "step": 6686 + }, + { + "epoch": 0.53, + "learning_rate": 9.52161773216416e-06, + "loss": 0.3883, + "step": 6687 + }, + { + "epoch": 0.53, + "learning_rate": 9.519054654064909e-06, + "loss": 0.3397, + "step": 6688 + }, + { + "epoch": 0.53, + "learning_rate": 9.5164916076336e-06, + "loss": 0.2764, + "step": 6689 + }, + { + "epoch": 0.53, + "learning_rate": 9.513928593038987e-06, + "loss": 0.4441, + "step": 6690 + }, + { + "epoch": 0.53, + "learning_rate": 9.51136561044984e-06, + "loss": 0.3828, + "step": 6691 + }, + { + "epoch": 0.53, + "learning_rate": 9.508802660034915e-06, + "loss": 0.3312, + "step": 6692 + }, + { + "epoch": 0.53, + "learning_rate": 9.506239741962971e-06, + "loss": 0.3931, + "step": 6693 + }, + { + "epoch": 0.53, + "learning_rate": 9.503676856402764e-06, + "loss": 0.3943, + "step": 6694 + }, + { + "epoch": 0.53, + "learning_rate": 9.50111400352305e-06, + "loss": 0.2717, + "step": 6695 + }, + { + "epoch": 0.53, + "learning_rate": 9.498551183492578e-06, + "loss": 0.3056, + "step": 6696 + }, + { + "epoch": 0.53, + "learning_rate": 9.495988396480097e-06, + "loss": 0.3657, + "step": 6697 + }, + { + "epoch": 0.53, + "learning_rate": 9.493425642654356e-06, + "loss": 0.4056, + "step": 6698 + }, + { + "epoch": 0.53, + "learning_rate": 9.490862922184096e-06, + "loss": 0.3076, + "step": 6699 + }, + { + "epoch": 0.53, + "learning_rate": 9.488300235238067e-06, + "loss": 0.4598, + "step": 6700 + }, + { + "epoch": 0.53, + "learning_rate": 9.485737581985002e-06, + "loss": 0.3246, + "step": 6701 + }, + { + "epoch": 0.53, + "learning_rate": 9.483174962593644e-06, + "loss": 0.1426, + "step": 6702 + }, + { + "epoch": 0.53, + "learning_rate": 9.480612377232728e-06, + "loss": 0.3247, + "step": 6703 + }, + { + "epoch": 0.53, + "learning_rate": 9.478049826070988e-06, + "loss": 0.3262, + "step": 6704 + }, + { + "epoch": 0.53, + "learning_rate": 9.475487309277156e-06, + "loss": 0.3256, + "step": 6705 + }, + { + "epoch": 0.53, + "learning_rate": 9.472924827019959e-06, + "loss": 0.3179, + "step": 6706 + }, + { + "epoch": 0.53, + "learning_rate": 9.470362379468125e-06, + "loss": 0.3225, + "step": 6707 + }, + { + "epoch": 0.53, + "learning_rate": 9.467799966790384e-06, + "loss": 0.3016, + "step": 6708 + }, + { + "epoch": 0.53, + "learning_rate": 9.465237589155452e-06, + "loss": 0.2912, + "step": 6709 + }, + { + "epoch": 0.53, + "learning_rate": 9.462675246732051e-06, + "loss": 0.33, + "step": 6710 + }, + { + "epoch": 0.53, + "learning_rate": 9.460112939688901e-06, + "loss": 0.4384, + "step": 6711 + }, + { + "epoch": 0.53, + "learning_rate": 9.457550668194714e-06, + "loss": 0.309, + "step": 6712 + }, + { + "epoch": 0.53, + "learning_rate": 9.45498843241821e-06, + "loss": 0.4713, + "step": 6713 + }, + { + "epoch": 0.53, + "learning_rate": 9.452426232528092e-06, + "loss": 0.3559, + "step": 6714 + }, + { + "epoch": 0.53, + "learning_rate": 9.449864068693072e-06, + "loss": 0.2869, + "step": 6715 + }, + { + "epoch": 0.53, + "learning_rate": 9.447301941081856e-06, + "loss": 0.4663, + "step": 6716 + }, + { + "epoch": 0.53, + "learning_rate": 9.444739849863146e-06, + "loss": 0.3834, + "step": 6717 + }, + { + "epoch": 0.53, + "learning_rate": 9.442177795205647e-06, + "loss": 0.3256, + "step": 6718 + }, + { + "epoch": 0.53, + "learning_rate": 9.439615777278059e-06, + "loss": 0.2394, + "step": 6719 + }, + { + "epoch": 0.53, + "learning_rate": 9.437053796249071e-06, + "loss": 0.3258, + "step": 6720 + }, + { + "epoch": 0.53, + "learning_rate": 9.434491852287385e-06, + "loss": 0.3933, + "step": 6721 + }, + { + "epoch": 0.53, + "learning_rate": 9.431929945561688e-06, + "loss": 0.3495, + "step": 6722 + }, + { + "epoch": 0.53, + "learning_rate": 9.429368076240669e-06, + "loss": 0.3644, + "step": 6723 + }, + { + "epoch": 0.53, + "learning_rate": 9.42680624449302e-06, + "loss": 0.3678, + "step": 6724 + }, + { + "epoch": 0.53, + "learning_rate": 9.42424445048742e-06, + "loss": 0.389, + "step": 6725 + }, + { + "epoch": 0.53, + "learning_rate": 9.42168269439255e-06, + "loss": 0.3482, + "step": 6726 + }, + { + "epoch": 0.53, + "learning_rate": 9.419120976377098e-06, + "loss": 0.3273, + "step": 6727 + }, + { + "epoch": 0.53, + "learning_rate": 9.41655929660973e-06, + "loss": 0.4018, + "step": 6728 + }, + { + "epoch": 0.53, + "learning_rate": 9.413997655259126e-06, + "loss": 0.2711, + "step": 6729 + }, + { + "epoch": 0.53, + "learning_rate": 9.411436052493957e-06, + "loss": 0.3461, + "step": 6730 + }, + { + "epoch": 0.53, + "learning_rate": 9.40887448848289e-06, + "loss": 0.3452, + "step": 6731 + }, + { + "epoch": 0.53, + "learning_rate": 9.406312963394598e-06, + "loss": 0.287, + "step": 6732 + }, + { + "epoch": 0.53, + "learning_rate": 9.403751477397738e-06, + "loss": 0.4383, + "step": 6733 + }, + { + "epoch": 0.53, + "learning_rate": 9.401190030660975e-06, + "loss": 0.3066, + "step": 6734 + }, + { + "epoch": 0.53, + "learning_rate": 9.398628623352969e-06, + "loss": 0.2556, + "step": 6735 + }, + { + "epoch": 0.53, + "learning_rate": 9.396067255642373e-06, + "loss": 0.2478, + "step": 6736 + }, + { + "epoch": 0.53, + "learning_rate": 9.39350592769784e-06, + "loss": 0.286, + "step": 6737 + }, + { + "epoch": 0.53, + "learning_rate": 9.390944639688027e-06, + "loss": 0.2892, + "step": 6738 + }, + { + "epoch": 0.53, + "learning_rate": 9.388383391781576e-06, + "loss": 0.3242, + "step": 6739 + }, + { + "epoch": 0.53, + "learning_rate": 9.385822184147136e-06, + "loss": 0.3059, + "step": 6740 + }, + { + "epoch": 0.53, + "learning_rate": 9.383261016953351e-06, + "loss": 0.3194, + "step": 6741 + }, + { + "epoch": 0.53, + "learning_rate": 9.38069989036886e-06, + "loss": 0.3406, + "step": 6742 + }, + { + "epoch": 0.53, + "learning_rate": 9.3781388045623e-06, + "loss": 0.3438, + "step": 6743 + }, + { + "epoch": 0.53, + "learning_rate": 9.37557775970231e-06, + "loss": 0.4259, + "step": 6744 + }, + { + "epoch": 0.53, + "learning_rate": 9.373016755957519e-06, + "loss": 0.442, + "step": 6745 + }, + { + "epoch": 0.53, + "learning_rate": 9.370455793496558e-06, + "loss": 0.3998, + "step": 6746 + }, + { + "epoch": 0.53, + "learning_rate": 9.367894872488053e-06, + "loss": 0.4946, + "step": 6747 + }, + { + "epoch": 0.53, + "learning_rate": 9.365333993100628e-06, + "loss": 0.4029, + "step": 6748 + }, + { + "epoch": 0.53, + "learning_rate": 9.362773155502909e-06, + "loss": 0.3946, + "step": 6749 + }, + { + "epoch": 0.53, + "learning_rate": 9.360212359863508e-06, + "loss": 0.4291, + "step": 6750 + }, + { + "epoch": 0.53, + "learning_rate": 9.357651606351047e-06, + "loss": 0.2815, + "step": 6751 + }, + { + "epoch": 0.53, + "learning_rate": 9.355090895134138e-06, + "loss": 0.39, + "step": 6752 + }, + { + "epoch": 0.53, + "learning_rate": 9.352530226381388e-06, + "loss": 0.4011, + "step": 6753 + }, + { + "epoch": 0.54, + "learning_rate": 9.349969600261408e-06, + "loss": 0.3178, + "step": 6754 + }, + { + "epoch": 0.54, + "learning_rate": 9.347409016942803e-06, + "loss": 0.345, + "step": 6755 + }, + { + "epoch": 0.54, + "learning_rate": 9.344848476594172e-06, + "loss": 0.3632, + "step": 6756 + }, + { + "epoch": 0.54, + "learning_rate": 9.342287979384118e-06, + "loss": 0.2955, + "step": 6757 + }, + { + "epoch": 0.54, + "learning_rate": 9.339727525481234e-06, + "loss": 0.3235, + "step": 6758 + }, + { + "epoch": 0.54, + "learning_rate": 9.33716711505412e-06, + "loss": 0.3976, + "step": 6759 + }, + { + "epoch": 0.54, + "learning_rate": 9.334606748271357e-06, + "loss": 0.3316, + "step": 6760 + }, + { + "epoch": 0.54, + "learning_rate": 9.33204642530154e-06, + "loss": 0.3755, + "step": 6761 + }, + { + "epoch": 0.54, + "learning_rate": 9.329486146313254e-06, + "loss": 0.3147, + "step": 6762 + }, + { + "epoch": 0.54, + "learning_rate": 9.326925911475075e-06, + "loss": 0.3761, + "step": 6763 + }, + { + "epoch": 0.54, + "learning_rate": 9.324365720955589e-06, + "loss": 0.3443, + "step": 6764 + }, + { + "epoch": 0.54, + "learning_rate": 9.321805574923369e-06, + "loss": 0.3078, + "step": 6765 + }, + { + "epoch": 0.54, + "learning_rate": 9.319245473546987e-06, + "loss": 0.3545, + "step": 6766 + }, + { + "epoch": 0.54, + "learning_rate": 9.316685416995017e-06, + "loss": 0.3015, + "step": 6767 + }, + { + "epoch": 0.54, + "learning_rate": 9.314125405436023e-06, + "loss": 0.2785, + "step": 6768 + }, + { + "epoch": 0.54, + "learning_rate": 9.311565439038571e-06, + "loss": 0.2287, + "step": 6769 + }, + { + "epoch": 0.54, + "learning_rate": 9.309005517971222e-06, + "loss": 0.3698, + "step": 6770 + }, + { + "epoch": 0.54, + "learning_rate": 9.306445642402534e-06, + "loss": 0.3277, + "step": 6771 + }, + { + "epoch": 0.54, + "learning_rate": 9.303885812501064e-06, + "loss": 0.3734, + "step": 6772 + }, + { + "epoch": 0.54, + "learning_rate": 9.301326028435367e-06, + "loss": 0.3885, + "step": 6773 + }, + { + "epoch": 0.54, + "learning_rate": 9.298766290373986e-06, + "loss": 0.286, + "step": 6774 + }, + { + "epoch": 0.54, + "learning_rate": 9.296206598485471e-06, + "loss": 0.3699, + "step": 6775 + }, + { + "epoch": 0.54, + "learning_rate": 9.293646952938365e-06, + "loss": 0.4413, + "step": 6776 + }, + { + "epoch": 0.54, + "learning_rate": 9.291087353901208e-06, + "loss": 0.3379, + "step": 6777 + }, + { + "epoch": 0.54, + "learning_rate": 9.28852780154254e-06, + "loss": 0.3073, + "step": 6778 + }, + { + "epoch": 0.54, + "learning_rate": 9.285968296030891e-06, + "loss": 0.3697, + "step": 6779 + }, + { + "epoch": 0.54, + "learning_rate": 9.283408837534793e-06, + "loss": 0.2701, + "step": 6780 + }, + { + "epoch": 0.54, + "learning_rate": 9.280849426222778e-06, + "loss": 0.3609, + "step": 6781 + }, + { + "epoch": 0.54, + "learning_rate": 9.278290062263364e-06, + "loss": 0.2661, + "step": 6782 + }, + { + "epoch": 0.54, + "learning_rate": 9.27573074582508e-06, + "loss": 0.304, + "step": 6783 + }, + { + "epoch": 0.54, + "learning_rate": 9.27317147707644e-06, + "loss": 0.2736, + "step": 6784 + }, + { + "epoch": 0.54, + "learning_rate": 9.270612256185962e-06, + "loss": 0.3634, + "step": 6785 + }, + { + "epoch": 0.54, + "learning_rate": 9.268053083322157e-06, + "loss": 0.3896, + "step": 6786 + }, + { + "epoch": 0.54, + "learning_rate": 9.265493958653533e-06, + "loss": 0.3246, + "step": 6787 + }, + { + "epoch": 0.54, + "learning_rate": 9.262934882348599e-06, + "loss": 0.3342, + "step": 6788 + }, + { + "epoch": 0.54, + "learning_rate": 9.260375854575857e-06, + "loss": 0.3514, + "step": 6789 + }, + { + "epoch": 0.54, + "learning_rate": 9.257816875503805e-06, + "loss": 0.3787, + "step": 6790 + }, + { + "epoch": 0.54, + "learning_rate": 9.255257945300941e-06, + "loss": 0.3303, + "step": 6791 + }, + { + "epoch": 0.54, + "learning_rate": 9.252699064135759e-06, + "loss": 0.2642, + "step": 6792 + }, + { + "epoch": 0.54, + "learning_rate": 9.250140232176746e-06, + "loss": 0.2786, + "step": 6793 + }, + { + "epoch": 0.54, + "learning_rate": 9.247581449592392e-06, + "loss": 0.4084, + "step": 6794 + }, + { + "epoch": 0.54, + "learning_rate": 9.245022716551178e-06, + "loss": 0.3781, + "step": 6795 + }, + { + "epoch": 0.54, + "learning_rate": 9.242464033221584e-06, + "loss": 0.3794, + "step": 6796 + }, + { + "epoch": 0.54, + "learning_rate": 9.239905399772092e-06, + "loss": 0.3973, + "step": 6797 + }, + { + "epoch": 0.54, + "learning_rate": 9.237346816371169e-06, + "loss": 0.4119, + "step": 6798 + }, + { + "epoch": 0.54, + "learning_rate": 9.234788283187291e-06, + "loss": 0.4228, + "step": 6799 + }, + { + "epoch": 0.54, + "learning_rate": 9.23222980038892e-06, + "loss": 0.2791, + "step": 6800 + }, + { + "epoch": 0.54, + "learning_rate": 9.229671368144524e-06, + "loss": 0.4378, + "step": 6801 + }, + { + "epoch": 0.54, + "learning_rate": 9.227112986622562e-06, + "loss": 0.4605, + "step": 6802 + }, + { + "epoch": 0.54, + "learning_rate": 9.224554655991492e-06, + "loss": 0.4454, + "step": 6803 + }, + { + "epoch": 0.54, + "learning_rate": 9.221996376419763e-06, + "loss": 0.4405, + "step": 6804 + }, + { + "epoch": 0.54, + "learning_rate": 9.219438148075834e-06, + "loss": 0.3086, + "step": 6805 + }, + { + "epoch": 0.54, + "learning_rate": 9.216879971128142e-06, + "loss": 0.462, + "step": 6806 + }, + { + "epoch": 0.54, + "learning_rate": 9.21432184574514e-06, + "loss": 0.3318, + "step": 6807 + }, + { + "epoch": 0.54, + "learning_rate": 9.21176377209526e-06, + "loss": 0.2774, + "step": 6808 + }, + { + "epoch": 0.54, + "learning_rate": 9.209205750346945e-06, + "loss": 0.3516, + "step": 6809 + }, + { + "epoch": 0.54, + "learning_rate": 9.206647780668629e-06, + "loss": 0.4229, + "step": 6810 + }, + { + "epoch": 0.54, + "learning_rate": 9.204089863228736e-06, + "loss": 0.3288, + "step": 6811 + }, + { + "epoch": 0.54, + "learning_rate": 9.201531998195697e-06, + "loss": 0.303, + "step": 6812 + }, + { + "epoch": 0.54, + "learning_rate": 9.198974185737934e-06, + "loss": 0.3289, + "step": 6813 + }, + { + "epoch": 0.54, + "learning_rate": 9.196416426023868e-06, + "loss": 0.3794, + "step": 6814 + }, + { + "epoch": 0.54, + "learning_rate": 9.193858719221912e-06, + "loss": 0.3543, + "step": 6815 + }, + { + "epoch": 0.54, + "learning_rate": 9.19130106550048e-06, + "loss": 0.3691, + "step": 6816 + }, + { + "epoch": 0.54, + "learning_rate": 9.188743465027981e-06, + "loss": 0.2369, + "step": 6817 + }, + { + "epoch": 0.54, + "learning_rate": 9.186185917972821e-06, + "loss": 0.2289, + "step": 6818 + }, + { + "epoch": 0.54, + "learning_rate": 9.183628424503405e-06, + "loss": 0.3486, + "step": 6819 + }, + { + "epoch": 0.54, + "learning_rate": 9.181070984788127e-06, + "loss": 0.2957, + "step": 6820 + }, + { + "epoch": 0.54, + "learning_rate": 9.178513598995384e-06, + "loss": 0.3121, + "step": 6821 + }, + { + "epoch": 0.54, + "learning_rate": 9.17595626729357e-06, + "loss": 0.3987, + "step": 6822 + }, + { + "epoch": 0.54, + "learning_rate": 9.17339898985107e-06, + "loss": 0.409, + "step": 6823 + }, + { + "epoch": 0.54, + "learning_rate": 9.170841766836268e-06, + "loss": 0.4102, + "step": 6824 + }, + { + "epoch": 0.54, + "learning_rate": 9.168284598417547e-06, + "loss": 0.4084, + "step": 6825 + }, + { + "epoch": 0.54, + "learning_rate": 9.165727484763283e-06, + "loss": 0.2977, + "step": 6826 + }, + { + "epoch": 0.54, + "learning_rate": 9.16317042604185e-06, + "loss": 0.4056, + "step": 6827 + }, + { + "epoch": 0.54, + "learning_rate": 9.160613422421616e-06, + "loss": 0.352, + "step": 6828 + }, + { + "epoch": 0.54, + "learning_rate": 9.158056474070952e-06, + "loss": 0.3662, + "step": 6829 + }, + { + "epoch": 0.54, + "learning_rate": 9.155499581158217e-06, + "loss": 0.2528, + "step": 6830 + }, + { + "epoch": 0.54, + "learning_rate": 9.152942743851771e-06, + "loss": 0.3186, + "step": 6831 + }, + { + "epoch": 0.54, + "learning_rate": 9.15038596231997e-06, + "loss": 0.253, + "step": 6832 + }, + { + "epoch": 0.54, + "learning_rate": 9.147829236731164e-06, + "loss": 0.3549, + "step": 6833 + }, + { + "epoch": 0.54, + "learning_rate": 9.145272567253703e-06, + "loss": 0.3561, + "step": 6834 + }, + { + "epoch": 0.54, + "learning_rate": 9.142715954055932e-06, + "loss": 0.3947, + "step": 6835 + }, + { + "epoch": 0.54, + "learning_rate": 9.140159397306188e-06, + "loss": 0.3461, + "step": 6836 + }, + { + "epoch": 0.54, + "learning_rate": 9.137602897172814e-06, + "loss": 0.306, + "step": 6837 + }, + { + "epoch": 0.54, + "learning_rate": 9.135046453824136e-06, + "loss": 0.3142, + "step": 6838 + }, + { + "epoch": 0.54, + "learning_rate": 9.132490067428488e-06, + "loss": 0.4291, + "step": 6839 + }, + { + "epoch": 0.54, + "learning_rate": 9.129933738154196e-06, + "loss": 0.2777, + "step": 6840 + }, + { + "epoch": 0.54, + "learning_rate": 9.12737746616958e-06, + "loss": 0.4393, + "step": 6841 + }, + { + "epoch": 0.54, + "learning_rate": 9.124821251642959e-06, + "loss": 0.2849, + "step": 6842 + }, + { + "epoch": 0.54, + "learning_rate": 9.122265094742648e-06, + "loss": 0.4192, + "step": 6843 + }, + { + "epoch": 0.54, + "learning_rate": 9.119708995636957e-06, + "loss": 0.3699, + "step": 6844 + }, + { + "epoch": 0.54, + "learning_rate": 9.117152954494195e-06, + "loss": 0.3713, + "step": 6845 + }, + { + "epoch": 0.54, + "learning_rate": 9.114596971482658e-06, + "loss": 0.3571, + "step": 6846 + }, + { + "epoch": 0.54, + "learning_rate": 9.112041046770653e-06, + "loss": 0.389, + "step": 6847 + }, + { + "epoch": 0.54, + "learning_rate": 9.109485180526474e-06, + "loss": 0.3326, + "step": 6848 + }, + { + "epoch": 0.54, + "learning_rate": 9.106929372918408e-06, + "loss": 0.3846, + "step": 6849 + }, + { + "epoch": 0.54, + "learning_rate": 9.104373624114746e-06, + "loss": 0.2928, + "step": 6850 + }, + { + "epoch": 0.54, + "learning_rate": 9.101817934283775e-06, + "loss": 0.4086, + "step": 6851 + }, + { + "epoch": 0.54, + "learning_rate": 9.099262303593768e-06, + "loss": 0.415, + "step": 6852 + }, + { + "epoch": 0.54, + "learning_rate": 9.096706732213005e-06, + "loss": 0.4087, + "step": 6853 + }, + { + "epoch": 0.54, + "learning_rate": 9.094151220309757e-06, + "loss": 0.3433, + "step": 6854 + }, + { + "epoch": 0.54, + "learning_rate": 9.091595768052291e-06, + "loss": 0.5418, + "step": 6855 + }, + { + "epoch": 0.54, + "learning_rate": 9.089040375608876e-06, + "loss": 0.2802, + "step": 6856 + }, + { + "epoch": 0.54, + "learning_rate": 9.086485043147768e-06, + "loss": 0.4812, + "step": 6857 + }, + { + "epoch": 0.54, + "learning_rate": 9.083929770837222e-06, + "loss": 0.3604, + "step": 6858 + }, + { + "epoch": 0.54, + "learning_rate": 9.081374558845496e-06, + "loss": 0.2611, + "step": 6859 + }, + { + "epoch": 0.54, + "learning_rate": 9.078819407340833e-06, + "loss": 0.2714, + "step": 6860 + }, + { + "epoch": 0.54, + "learning_rate": 9.07626431649148e-06, + "loss": 0.323, + "step": 6861 + }, + { + "epoch": 0.54, + "learning_rate": 9.073709286465678e-06, + "loss": 0.3952, + "step": 6862 + }, + { + "epoch": 0.54, + "learning_rate": 9.071154317431661e-06, + "loss": 0.3319, + "step": 6863 + }, + { + "epoch": 0.54, + "learning_rate": 9.068599409557664e-06, + "loss": 0.3452, + "step": 6864 + }, + { + "epoch": 0.54, + "learning_rate": 9.066044563011914e-06, + "loss": 0.3425, + "step": 6865 + }, + { + "epoch": 0.54, + "learning_rate": 9.063489777962634e-06, + "loss": 0.4073, + "step": 6866 + }, + { + "epoch": 0.54, + "learning_rate": 9.06093505457805e-06, + "loss": 0.2888, + "step": 6867 + }, + { + "epoch": 0.54, + "learning_rate": 9.058380393026369e-06, + "loss": 0.3813, + "step": 6868 + }, + { + "epoch": 0.54, + "learning_rate": 9.055825793475814e-06, + "loss": 0.2661, + "step": 6869 + }, + { + "epoch": 0.54, + "learning_rate": 9.053271256094582e-06, + "loss": 0.3948, + "step": 6870 + }, + { + "epoch": 0.54, + "learning_rate": 9.050716781050885e-06, + "loss": 0.4277, + "step": 6871 + }, + { + "epoch": 0.54, + "learning_rate": 9.04816236851292e-06, + "loss": 0.2998, + "step": 6872 + }, + { + "epoch": 0.54, + "learning_rate": 9.045608018648884e-06, + "loss": 0.2815, + "step": 6873 + }, + { + "epoch": 0.54, + "learning_rate": 9.043053731626964e-06, + "loss": 0.2714, + "step": 6874 + }, + { + "epoch": 0.54, + "learning_rate": 9.040499507615356e-06, + "loss": 0.2958, + "step": 6875 + }, + { + "epoch": 0.54, + "learning_rate": 9.037945346782236e-06, + "loss": 0.3954, + "step": 6876 + }, + { + "epoch": 0.54, + "learning_rate": 9.035391249295788e-06, + "loss": 0.363, + "step": 6877 + }, + { + "epoch": 0.54, + "learning_rate": 9.032837215324183e-06, + "loss": 0.4065, + "step": 6878 + }, + { + "epoch": 0.54, + "learning_rate": 9.030283245035594e-06, + "loss": 0.408, + "step": 6879 + }, + { + "epoch": 0.55, + "learning_rate": 9.027729338598188e-06, + "loss": 0.3929, + "step": 6880 + }, + { + "epoch": 0.55, + "learning_rate": 9.025175496180125e-06, + "loss": 0.3027, + "step": 6881 + }, + { + "epoch": 0.55, + "learning_rate": 9.022621717949566e-06, + "loss": 0.3361, + "step": 6882 + }, + { + "epoch": 0.55, + "learning_rate": 9.020068004074665e-06, + "loss": 0.3822, + "step": 6883 + }, + { + "epoch": 0.55, + "learning_rate": 9.01751435472357e-06, + "loss": 0.3658, + "step": 6884 + }, + { + "epoch": 0.55, + "learning_rate": 9.014960770064429e-06, + "loss": 0.343, + "step": 6885 + }, + { + "epoch": 0.55, + "learning_rate": 9.012407250265377e-06, + "loss": 0.3933, + "step": 6886 + }, + { + "epoch": 0.55, + "learning_rate": 9.009853795494558e-06, + "loss": 0.389, + "step": 6887 + }, + { + "epoch": 0.55, + "learning_rate": 9.007300405920105e-06, + "loss": 0.3691, + "step": 6888 + }, + { + "epoch": 0.55, + "learning_rate": 9.00474708171014e-06, + "loss": 0.2915, + "step": 6889 + }, + { + "epoch": 0.55, + "learning_rate": 9.002193823032791e-06, + "loss": 0.2971, + "step": 6890 + }, + { + "epoch": 0.55, + "learning_rate": 8.999640630056183e-06, + "loss": 0.2462, + "step": 6891 + }, + { + "epoch": 0.55, + "learning_rate": 8.997087502948423e-06, + "loss": 0.3327, + "step": 6892 + }, + { + "epoch": 0.55, + "learning_rate": 8.994534441877625e-06, + "loss": 0.345, + "step": 6893 + }, + { + "epoch": 0.55, + "learning_rate": 8.991981447011896e-06, + "loss": 0.4173, + "step": 6894 + }, + { + "epoch": 0.55, + "learning_rate": 8.989428518519336e-06, + "loss": 0.264, + "step": 6895 + }, + { + "epoch": 0.55, + "learning_rate": 8.986875656568047e-06, + "loss": 0.4498, + "step": 6896 + }, + { + "epoch": 0.55, + "learning_rate": 8.984322861326122e-06, + "loss": 0.4101, + "step": 6897 + }, + { + "epoch": 0.55, + "learning_rate": 8.981770132961649e-06, + "loss": 0.2947, + "step": 6898 + }, + { + "epoch": 0.55, + "learning_rate": 8.979217471642712e-06, + "loss": 0.4945, + "step": 6899 + }, + { + "epoch": 0.55, + "learning_rate": 8.976664877537395e-06, + "loss": 0.3085, + "step": 6900 + }, + { + "epoch": 0.55, + "learning_rate": 8.974112350813771e-06, + "loss": 0.4917, + "step": 6901 + }, + { + "epoch": 0.55, + "learning_rate": 8.971559891639913e-06, + "loss": 0.4168, + "step": 6902 + }, + { + "epoch": 0.55, + "learning_rate": 8.969007500183886e-06, + "loss": 0.2062, + "step": 6903 + }, + { + "epoch": 0.55, + "learning_rate": 8.966455176613754e-06, + "loss": 0.4089, + "step": 6904 + }, + { + "epoch": 0.55, + "learning_rate": 8.963902921097579e-06, + "loss": 0.3856, + "step": 6905 + }, + { + "epoch": 0.55, + "learning_rate": 8.961350733803406e-06, + "loss": 0.4367, + "step": 6906 + }, + { + "epoch": 0.55, + "learning_rate": 8.958798614899291e-06, + "loss": 0.3533, + "step": 6907 + }, + { + "epoch": 0.55, + "learning_rate": 8.956246564553282e-06, + "loss": 0.3499, + "step": 6908 + }, + { + "epoch": 0.55, + "learning_rate": 8.95369458293341e-06, + "loss": 0.2432, + "step": 6909 + }, + { + "epoch": 0.55, + "learning_rate": 8.951142670207718e-06, + "loss": 0.3308, + "step": 6910 + }, + { + "epoch": 0.55, + "learning_rate": 8.948590826544232e-06, + "loss": 0.3585, + "step": 6911 + }, + { + "epoch": 0.55, + "learning_rate": 8.94603905211098e-06, + "loss": 0.3139, + "step": 6912 + }, + { + "epoch": 0.55, + "learning_rate": 8.943487347075988e-06, + "loss": 0.5188, + "step": 6913 + }, + { + "epoch": 0.55, + "learning_rate": 8.94093571160727e-06, + "loss": 0.3375, + "step": 6914 + }, + { + "epoch": 0.55, + "learning_rate": 8.938384145872838e-06, + "loss": 0.3433, + "step": 6915 + }, + { + "epoch": 0.55, + "learning_rate": 8.935832650040703e-06, + "loss": 0.3396, + "step": 6916 + }, + { + "epoch": 0.55, + "learning_rate": 8.933281224278867e-06, + "loss": 0.4095, + "step": 6917 + }, + { + "epoch": 0.55, + "learning_rate": 8.930729868755333e-06, + "loss": 0.3632, + "step": 6918 + }, + { + "epoch": 0.55, + "learning_rate": 8.928178583638088e-06, + "loss": 0.3361, + "step": 6919 + }, + { + "epoch": 0.55, + "learning_rate": 8.925627369095125e-06, + "loss": 0.3789, + "step": 6920 + }, + { + "epoch": 0.55, + "learning_rate": 8.923076225294434e-06, + "loss": 0.3463, + "step": 6921 + }, + { + "epoch": 0.55, + "learning_rate": 8.920525152403989e-06, + "loss": 0.306, + "step": 6922 + }, + { + "epoch": 0.55, + "learning_rate": 8.917974150591772e-06, + "loss": 0.5371, + "step": 6923 + }, + { + "epoch": 0.55, + "learning_rate": 8.915423220025747e-06, + "loss": 0.1976, + "step": 6924 + }, + { + "epoch": 0.55, + "learning_rate": 8.912872360873885e-06, + "loss": 0.3471, + "step": 6925 + }, + { + "epoch": 0.55, + "learning_rate": 8.91032157330415e-06, + "loss": 0.3612, + "step": 6926 + }, + { + "epoch": 0.55, + "learning_rate": 8.907770857484493e-06, + "loss": 0.3957, + "step": 6927 + }, + { + "epoch": 0.55, + "learning_rate": 8.90522021358287e-06, + "loss": 0.3857, + "step": 6928 + }, + { + "epoch": 0.55, + "learning_rate": 8.90266964176723e-06, + "loss": 0.4012, + "step": 6929 + }, + { + "epoch": 0.55, + "learning_rate": 8.90011914220551e-06, + "loss": 0.3553, + "step": 6930 + }, + { + "epoch": 0.55, + "learning_rate": 8.897568715065658e-06, + "loss": 0.3381, + "step": 6931 + }, + { + "epoch": 0.55, + "learning_rate": 8.895018360515597e-06, + "loss": 0.367, + "step": 6932 + }, + { + "epoch": 0.55, + "learning_rate": 8.892468078723262e-06, + "loss": 0.3931, + "step": 6933 + }, + { + "epoch": 0.55, + "learning_rate": 8.889917869856576e-06, + "loss": 0.3126, + "step": 6934 + }, + { + "epoch": 0.55, + "learning_rate": 8.887367734083454e-06, + "loss": 0.3503, + "step": 6935 + }, + { + "epoch": 0.55, + "learning_rate": 8.884817671571815e-06, + "loss": 0.3328, + "step": 6936 + }, + { + "epoch": 0.55, + "learning_rate": 8.882267682489566e-06, + "loss": 0.3328, + "step": 6937 + }, + { + "epoch": 0.55, + "learning_rate": 8.879717767004613e-06, + "loss": 0.254, + "step": 6938 + }, + { + "epoch": 0.55, + "learning_rate": 8.877167925284855e-06, + "loss": 0.2771, + "step": 6939 + }, + { + "epoch": 0.55, + "learning_rate": 8.874618157498183e-06, + "loss": 0.3811, + "step": 6940 + }, + { + "epoch": 0.55, + "learning_rate": 8.872068463812492e-06, + "loss": 0.3402, + "step": 6941 + }, + { + "epoch": 0.55, + "learning_rate": 8.869518844395667e-06, + "loss": 0.3881, + "step": 6942 + }, + { + "epoch": 0.55, + "learning_rate": 8.866969299415585e-06, + "loss": 0.3268, + "step": 6943 + }, + { + "epoch": 0.55, + "learning_rate": 8.864419829040122e-06, + "loss": 0.2798, + "step": 6944 + }, + { + "epoch": 0.55, + "learning_rate": 8.86187043343715e-06, + "loss": 0.2719, + "step": 6945 + }, + { + "epoch": 0.55, + "learning_rate": 8.859321112774535e-06, + "loss": 0.2986, + "step": 6946 + }, + { + "epoch": 0.55, + "learning_rate": 8.856771867220135e-06, + "loss": 0.3587, + "step": 6947 + }, + { + "epoch": 0.55, + "learning_rate": 8.854222696941807e-06, + "loss": 0.3445, + "step": 6948 + }, + { + "epoch": 0.55, + "learning_rate": 8.8516736021074e-06, + "loss": 0.294, + "step": 6949 + }, + { + "epoch": 0.55, + "learning_rate": 8.849124582884762e-06, + "loss": 0.3686, + "step": 6950 + }, + { + "epoch": 0.55, + "learning_rate": 8.846575639441732e-06, + "loss": 0.4012, + "step": 6951 + }, + { + "epoch": 0.55, + "learning_rate": 8.844026771946148e-06, + "loss": 0.523, + "step": 6952 + }, + { + "epoch": 0.55, + "learning_rate": 8.841477980565838e-06, + "loss": 0.2641, + "step": 6953 + }, + { + "epoch": 0.55, + "learning_rate": 8.838929265468627e-06, + "loss": 0.3616, + "step": 6954 + }, + { + "epoch": 0.55, + "learning_rate": 8.836380626822339e-06, + "loss": 0.3672, + "step": 6955 + }, + { + "epoch": 0.55, + "learning_rate": 8.833832064794787e-06, + "loss": 0.4718, + "step": 6956 + }, + { + "epoch": 0.55, + "learning_rate": 8.831283579553781e-06, + "loss": 0.2828, + "step": 6957 + }, + { + "epoch": 0.55, + "learning_rate": 8.828735171267131e-06, + "loss": 0.3789, + "step": 6958 + }, + { + "epoch": 0.55, + "learning_rate": 8.82618684010263e-06, + "loss": 0.2958, + "step": 6959 + }, + { + "epoch": 0.55, + "learning_rate": 8.823638586228081e-06, + "loss": 0.359, + "step": 6960 + }, + { + "epoch": 0.55, + "learning_rate": 8.82109040981127e-06, + "loss": 0.3354, + "step": 6961 + }, + { + "epoch": 0.55, + "learning_rate": 8.818542311019982e-06, + "loss": 0.338, + "step": 6962 + }, + { + "epoch": 0.55, + "learning_rate": 8.815994290022e-06, + "loss": 0.3537, + "step": 6963 + }, + { + "epoch": 0.55, + "learning_rate": 8.813446346985095e-06, + "loss": 0.2931, + "step": 6964 + }, + { + "epoch": 0.55, + "learning_rate": 8.810898482077038e-06, + "loss": 0.3793, + "step": 6965 + }, + { + "epoch": 0.55, + "learning_rate": 8.808350695465597e-06, + "loss": 0.3445, + "step": 6966 + }, + { + "epoch": 0.55, + "learning_rate": 8.805802987318527e-06, + "loss": 0.3493, + "step": 6967 + }, + { + "epoch": 0.55, + "learning_rate": 8.803255357803584e-06, + "loss": 0.3368, + "step": 6968 + }, + { + "epoch": 0.55, + "learning_rate": 8.800707807088521e-06, + "loss": 0.2975, + "step": 6969 + }, + { + "epoch": 0.55, + "learning_rate": 8.798160335341078e-06, + "loss": 0.4914, + "step": 6970 + }, + { + "epoch": 0.55, + "learning_rate": 8.795612942728989e-06, + "loss": 0.3794, + "step": 6971 + }, + { + "epoch": 0.55, + "learning_rate": 8.793065629419996e-06, + "loss": 0.3651, + "step": 6972 + }, + { + "epoch": 0.55, + "learning_rate": 8.790518395581823e-06, + "loss": 0.3055, + "step": 6973 + }, + { + "epoch": 0.55, + "learning_rate": 8.787971241382193e-06, + "loss": 0.3921, + "step": 6974 + }, + { + "epoch": 0.55, + "learning_rate": 8.785424166988827e-06, + "loss": 0.2735, + "step": 6975 + }, + { + "epoch": 0.55, + "learning_rate": 8.782877172569433e-06, + "loss": 0.2598, + "step": 6976 + }, + { + "epoch": 0.55, + "learning_rate": 8.78033025829172e-06, + "loss": 0.3403, + "step": 6977 + }, + { + "epoch": 0.55, + "learning_rate": 8.777783424323396e-06, + "loss": 0.3651, + "step": 6978 + }, + { + "epoch": 0.55, + "learning_rate": 8.775236670832146e-06, + "loss": 0.3427, + "step": 6979 + }, + { + "epoch": 0.55, + "learning_rate": 8.772689997985674e-06, + "loss": 0.4072, + "step": 6980 + }, + { + "epoch": 0.55, + "learning_rate": 8.770143405951657e-06, + "loss": 0.3805, + "step": 6981 + }, + { + "epoch": 0.55, + "learning_rate": 8.76759689489778e-06, + "loss": 0.2841, + "step": 6982 + }, + { + "epoch": 0.55, + "learning_rate": 8.765050464991716e-06, + "loss": 0.4077, + "step": 6983 + }, + { + "epoch": 0.55, + "learning_rate": 8.762504116401137e-06, + "loss": 0.3595, + "step": 6984 + }, + { + "epoch": 0.55, + "learning_rate": 8.759957849293707e-06, + "loss": 0.2765, + "step": 6985 + }, + { + "epoch": 0.55, + "learning_rate": 8.75741166383709e-06, + "loss": 0.3955, + "step": 6986 + }, + { + "epoch": 0.55, + "learning_rate": 8.754865560198932e-06, + "loss": 0.2439, + "step": 6987 + }, + { + "epoch": 0.55, + "learning_rate": 8.752319538546888e-06, + "loss": 0.4157, + "step": 6988 + }, + { + "epoch": 0.55, + "learning_rate": 8.749773599048597e-06, + "loss": 0.4307, + "step": 6989 + }, + { + "epoch": 0.55, + "learning_rate": 8.747227741871698e-06, + "loss": 0.2196, + "step": 6990 + }, + { + "epoch": 0.55, + "learning_rate": 8.744681967183826e-06, + "loss": 0.3642, + "step": 6991 + }, + { + "epoch": 0.55, + "learning_rate": 8.742136275152606e-06, + "loss": 0.3438, + "step": 6992 + }, + { + "epoch": 0.55, + "learning_rate": 8.73959066594566e-06, + "loss": 0.311, + "step": 6993 + }, + { + "epoch": 0.55, + "learning_rate": 8.737045139730605e-06, + "loss": 0.3601, + "step": 6994 + }, + { + "epoch": 0.55, + "learning_rate": 8.734499696675048e-06, + "loss": 0.2674, + "step": 6995 + }, + { + "epoch": 0.55, + "learning_rate": 8.731954336946599e-06, + "loss": 0.3318, + "step": 6996 + }, + { + "epoch": 0.55, + "learning_rate": 8.729409060712855e-06, + "loss": 0.4257, + "step": 6997 + }, + { + "epoch": 0.55, + "learning_rate": 8.726863868141408e-06, + "loss": 0.3281, + "step": 6998 + }, + { + "epoch": 0.55, + "learning_rate": 8.724318759399853e-06, + "loss": 0.3296, + "step": 6999 + }, + { + "epoch": 0.55, + "learning_rate": 8.721773734655768e-06, + "loss": 0.3742, + "step": 7000 + }, + { + "epoch": 0.55, + "learning_rate": 8.719228794076733e-06, + "loss": 0.2869, + "step": 7001 + }, + { + "epoch": 0.55, + "learning_rate": 8.716683937830318e-06, + "loss": 0.3905, + "step": 7002 + }, + { + "epoch": 0.55, + "learning_rate": 8.71413916608409e-06, + "loss": 0.3654, + "step": 7003 + }, + { + "epoch": 0.55, + "learning_rate": 8.711594479005614e-06, + "loss": 0.2555, + "step": 7004 + }, + { + "epoch": 0.55, + "learning_rate": 8.709049876762438e-06, + "loss": 0.3384, + "step": 7005 + }, + { + "epoch": 0.56, + "learning_rate": 8.706505359522119e-06, + "loss": 0.3843, + "step": 7006 + }, + { + "epoch": 0.56, + "learning_rate": 8.703960927452197e-06, + "loss": 0.2665, + "step": 7007 + }, + { + "epoch": 0.56, + "learning_rate": 8.701416580720212e-06, + "loss": 0.3997, + "step": 7008 + }, + { + "epoch": 0.56, + "learning_rate": 8.698872319493698e-06, + "loss": 0.4557, + "step": 7009 + }, + { + "epoch": 0.56, + "learning_rate": 8.69632814394018e-06, + "loss": 0.3702, + "step": 7010 + }, + { + "epoch": 0.56, + "learning_rate": 8.693784054227179e-06, + "loss": 0.2854, + "step": 7011 + }, + { + "epoch": 0.56, + "learning_rate": 8.691240050522215e-06, + "loss": 0.4729, + "step": 7012 + }, + { + "epoch": 0.56, + "learning_rate": 8.688696132992797e-06, + "loss": 0.3111, + "step": 7013 + }, + { + "epoch": 0.56, + "learning_rate": 8.686152301806427e-06, + "loss": 0.4138, + "step": 7014 + }, + { + "epoch": 0.56, + "learning_rate": 8.683608557130608e-06, + "loss": 0.3541, + "step": 7015 + }, + { + "epoch": 0.56, + "learning_rate": 8.681064899132831e-06, + "loss": 0.4337, + "step": 7016 + }, + { + "epoch": 0.56, + "learning_rate": 8.678521327980585e-06, + "loss": 0.3045, + "step": 7017 + }, + { + "epoch": 0.56, + "learning_rate": 8.675977843841347e-06, + "loss": 0.3389, + "step": 7018 + }, + { + "epoch": 0.56, + "learning_rate": 8.673434446882601e-06, + "loss": 0.2617, + "step": 7019 + }, + { + "epoch": 0.56, + "learning_rate": 8.670891137271814e-06, + "loss": 0.3667, + "step": 7020 + }, + { + "epoch": 0.56, + "learning_rate": 8.668347915176448e-06, + "loss": 0.384, + "step": 7021 + }, + { + "epoch": 0.56, + "learning_rate": 8.665804780763963e-06, + "loss": 0.404, + "step": 7022 + }, + { + "epoch": 0.56, + "learning_rate": 8.663261734201818e-06, + "loss": 0.362, + "step": 7023 + }, + { + "epoch": 0.56, + "learning_rate": 8.660718775657453e-06, + "loss": 0.3662, + "step": 7024 + }, + { + "epoch": 0.56, + "learning_rate": 8.658175905298314e-06, + "loss": 0.3121, + "step": 7025 + }, + { + "epoch": 0.56, + "learning_rate": 8.655633123291833e-06, + "loss": 0.3727, + "step": 7026 + }, + { + "epoch": 0.56, + "learning_rate": 8.653090429805442e-06, + "loss": 0.3169, + "step": 7027 + }, + { + "epoch": 0.56, + "learning_rate": 8.650547825006568e-06, + "loss": 0.345, + "step": 7028 + }, + { + "epoch": 0.56, + "learning_rate": 8.648005309062623e-06, + "loss": 0.3951, + "step": 7029 + }, + { + "epoch": 0.56, + "learning_rate": 8.645462882141026e-06, + "loss": 0.3869, + "step": 7030 + }, + { + "epoch": 0.56, + "learning_rate": 8.64292054440918e-06, + "loss": 0.2799, + "step": 7031 + }, + { + "epoch": 0.56, + "learning_rate": 8.640378296034486e-06, + "loss": 0.3237, + "step": 7032 + }, + { + "epoch": 0.56, + "learning_rate": 8.63783613718434e-06, + "loss": 0.4391, + "step": 7033 + }, + { + "epoch": 0.56, + "learning_rate": 8.63529406802613e-06, + "loss": 0.4238, + "step": 7034 + }, + { + "epoch": 0.56, + "learning_rate": 8.632752088727237e-06, + "loss": 0.3266, + "step": 7035 + }, + { + "epoch": 0.56, + "learning_rate": 8.63021019945504e-06, + "loss": 0.3176, + "step": 7036 + }, + { + "epoch": 0.56, + "learning_rate": 8.627668400376914e-06, + "loss": 0.3756, + "step": 7037 + }, + { + "epoch": 0.56, + "learning_rate": 8.625126691660216e-06, + "loss": 0.4381, + "step": 7038 + }, + { + "epoch": 0.56, + "learning_rate": 8.622585073472314e-06, + "loss": 0.3573, + "step": 7039 + }, + { + "epoch": 0.56, + "learning_rate": 8.620043545980554e-06, + "loss": 0.3389, + "step": 7040 + }, + { + "epoch": 0.56, + "learning_rate": 8.61750210935229e-06, + "loss": 0.3199, + "step": 7041 + }, + { + "epoch": 0.56, + "learning_rate": 8.614960763754857e-06, + "loss": 0.3366, + "step": 7042 + }, + { + "epoch": 0.56, + "learning_rate": 8.612419509355593e-06, + "loss": 0.3431, + "step": 7043 + }, + { + "epoch": 0.56, + "learning_rate": 8.60987834632183e-06, + "loss": 0.4285, + "step": 7044 + }, + { + "epoch": 0.56, + "learning_rate": 8.607337274820888e-06, + "loss": 0.4383, + "step": 7045 + }, + { + "epoch": 0.56, + "learning_rate": 8.604796295020085e-06, + "loss": 0.366, + "step": 7046 + }, + { + "epoch": 0.56, + "learning_rate": 8.602255407086736e-06, + "loss": 0.4711, + "step": 7047 + }, + { + "epoch": 0.56, + "learning_rate": 8.599714611188141e-06, + "loss": 0.5414, + "step": 7048 + }, + { + "epoch": 0.56, + "learning_rate": 8.5971739074916e-06, + "loss": 0.3835, + "step": 7049 + }, + { + "epoch": 0.56, + "learning_rate": 8.594633296164409e-06, + "loss": 0.4071, + "step": 7050 + }, + { + "epoch": 0.56, + "learning_rate": 8.59209277737385e-06, + "loss": 0.3296, + "step": 7051 + }, + { + "epoch": 0.56, + "learning_rate": 8.58955235128721e-06, + "loss": 0.4189, + "step": 7052 + }, + { + "epoch": 0.56, + "learning_rate": 8.58701201807176e-06, + "loss": 0.4206, + "step": 7053 + }, + { + "epoch": 0.56, + "learning_rate": 8.584471777894768e-06, + "loss": 0.3072, + "step": 7054 + }, + { + "epoch": 0.56, + "learning_rate": 8.581931630923499e-06, + "loss": 0.325, + "step": 7055 + }, + { + "epoch": 0.56, + "learning_rate": 8.57939157732521e-06, + "loss": 0.3508, + "step": 7056 + }, + { + "epoch": 0.56, + "learning_rate": 8.576851617267151e-06, + "loss": 0.2893, + "step": 7057 + }, + { + "epoch": 0.56, + "learning_rate": 8.574311750916565e-06, + "loss": 0.2959, + "step": 7058 + }, + { + "epoch": 0.56, + "learning_rate": 8.571771978440689e-06, + "loss": 0.4777, + "step": 7059 + }, + { + "epoch": 0.56, + "learning_rate": 8.569232300006756e-06, + "loss": 0.3733, + "step": 7060 + }, + { + "epoch": 0.56, + "learning_rate": 8.566692715781992e-06, + "loss": 0.308, + "step": 7061 + }, + { + "epoch": 0.56, + "learning_rate": 8.564153225933616e-06, + "loss": 0.4168, + "step": 7062 + }, + { + "epoch": 0.56, + "learning_rate": 8.56161383062884e-06, + "loss": 0.3198, + "step": 7063 + }, + { + "epoch": 0.56, + "learning_rate": 8.559074530034875e-06, + "loss": 0.3322, + "step": 7064 + }, + { + "epoch": 0.56, + "learning_rate": 8.556535324318916e-06, + "loss": 0.2515, + "step": 7065 + }, + { + "epoch": 0.56, + "learning_rate": 8.553996213648164e-06, + "loss": 0.322, + "step": 7066 + }, + { + "epoch": 0.56, + "learning_rate": 8.551457198189799e-06, + "loss": 0.2736, + "step": 7067 + }, + { + "epoch": 0.56, + "learning_rate": 8.54891827811101e-06, + "loss": 0.2116, + "step": 7068 + }, + { + "epoch": 0.56, + "learning_rate": 8.546379453578972e-06, + "loss": 0.3199, + "step": 7069 + }, + { + "epoch": 0.56, + "learning_rate": 8.543840724760848e-06, + "loss": 0.445, + "step": 7070 + }, + { + "epoch": 0.56, + "learning_rate": 8.541302091823809e-06, + "loss": 0.3135, + "step": 7071 + }, + { + "epoch": 0.56, + "learning_rate": 8.538763554935008e-06, + "loss": 0.3442, + "step": 7072 + }, + { + "epoch": 0.56, + "learning_rate": 8.536225114261597e-06, + "loss": 0.273, + "step": 7073 + }, + { + "epoch": 0.56, + "learning_rate": 8.533686769970717e-06, + "loss": 0.3821, + "step": 7074 + }, + { + "epoch": 0.56, + "learning_rate": 8.531148522229509e-06, + "loss": 0.3031, + "step": 7075 + }, + { + "epoch": 0.56, + "learning_rate": 8.528610371205102e-06, + "loss": 0.4381, + "step": 7076 + }, + { + "epoch": 0.56, + "learning_rate": 8.526072317064623e-06, + "loss": 0.3806, + "step": 7077 + }, + { + "epoch": 0.56, + "learning_rate": 8.52353435997519e-06, + "loss": 0.4048, + "step": 7078 + }, + { + "epoch": 0.56, + "learning_rate": 8.520996500103915e-06, + "loss": 0.3374, + "step": 7079 + }, + { + "epoch": 0.56, + "learning_rate": 8.518458737617903e-06, + "loss": 0.3671, + "step": 7080 + }, + { + "epoch": 0.56, + "learning_rate": 8.515921072684255e-06, + "loss": 0.2408, + "step": 7081 + }, + { + "epoch": 0.56, + "learning_rate": 8.513383505470065e-06, + "loss": 0.3252, + "step": 7082 + }, + { + "epoch": 0.56, + "learning_rate": 8.510846036142415e-06, + "loss": 0.4051, + "step": 7083 + }, + { + "epoch": 0.56, + "learning_rate": 8.50830866486839e-06, + "loss": 0.2523, + "step": 7084 + }, + { + "epoch": 0.56, + "learning_rate": 8.505771391815061e-06, + "loss": 0.4471, + "step": 7085 + }, + { + "epoch": 0.56, + "learning_rate": 8.503234217149496e-06, + "loss": 0.4267, + "step": 7086 + }, + { + "epoch": 0.56, + "learning_rate": 8.500697141038758e-06, + "loss": 0.3279, + "step": 7087 + }, + { + "epoch": 0.56, + "learning_rate": 8.498160163649896e-06, + "loss": 0.3114, + "step": 7088 + }, + { + "epoch": 0.56, + "learning_rate": 8.495623285149962e-06, + "loss": 0.2817, + "step": 7089 + }, + { + "epoch": 0.56, + "learning_rate": 8.493086505705998e-06, + "loss": 0.3435, + "step": 7090 + }, + { + "epoch": 0.56, + "learning_rate": 8.490549825485036e-06, + "loss": 0.4089, + "step": 7091 + }, + { + "epoch": 0.56, + "learning_rate": 8.488013244654103e-06, + "loss": 0.2854, + "step": 7092 + }, + { + "epoch": 0.56, + "learning_rate": 8.485476763380224e-06, + "loss": 0.4108, + "step": 7093 + }, + { + "epoch": 0.56, + "learning_rate": 8.482940381830412e-06, + "loss": 0.3094, + "step": 7094 + }, + { + "epoch": 0.56, + "learning_rate": 8.480404100171677e-06, + "loss": 0.3949, + "step": 7095 + }, + { + "epoch": 0.56, + "learning_rate": 8.47786791857102e-06, + "loss": 0.2768, + "step": 7096 + }, + { + "epoch": 0.56, + "learning_rate": 8.475331837195435e-06, + "loss": 0.3959, + "step": 7097 + }, + { + "epoch": 0.56, + "learning_rate": 8.472795856211916e-06, + "loss": 0.3376, + "step": 7098 + }, + { + "epoch": 0.56, + "learning_rate": 8.470259975787438e-06, + "loss": 0.3272, + "step": 7099 + }, + { + "epoch": 0.56, + "learning_rate": 8.46772419608898e-06, + "loss": 0.3615, + "step": 7100 + }, + { + "epoch": 0.56, + "learning_rate": 8.465188517283514e-06, + "loss": 0.3439, + "step": 7101 + }, + { + "epoch": 0.56, + "learning_rate": 8.462652939537996e-06, + "loss": 0.3487, + "step": 7102 + }, + { + "epoch": 0.56, + "learning_rate": 8.460117463019387e-06, + "loss": 0.3067, + "step": 7103 + }, + { + "epoch": 0.56, + "learning_rate": 8.457582087894631e-06, + "loss": 0.3102, + "step": 7104 + }, + { + "epoch": 0.56, + "learning_rate": 8.455046814330674e-06, + "loss": 0.4256, + "step": 7105 + }, + { + "epoch": 0.56, + "learning_rate": 8.452511642494453e-06, + "loss": 0.4775, + "step": 7106 + }, + { + "epoch": 0.56, + "learning_rate": 8.449976572552891e-06, + "loss": 0.405, + "step": 7107 + }, + { + "epoch": 0.56, + "learning_rate": 8.447441604672913e-06, + "loss": 0.2671, + "step": 7108 + }, + { + "epoch": 0.56, + "learning_rate": 8.444906739021438e-06, + "loss": 0.2864, + "step": 7109 + }, + { + "epoch": 0.56, + "learning_rate": 8.442371975765368e-06, + "loss": 0.301, + "step": 7110 + }, + { + "epoch": 0.56, + "learning_rate": 8.439837315071612e-06, + "loss": 0.349, + "step": 7111 + }, + { + "epoch": 0.56, + "learning_rate": 8.43730275710706e-06, + "loss": 0.4177, + "step": 7112 + }, + { + "epoch": 0.56, + "learning_rate": 8.434768302038602e-06, + "loss": 0.3276, + "step": 7113 + }, + { + "epoch": 0.56, + "learning_rate": 8.432233950033122e-06, + "loss": 0.4059, + "step": 7114 + }, + { + "epoch": 0.56, + "learning_rate": 8.42969970125749e-06, + "loss": 0.3714, + "step": 7115 + }, + { + "epoch": 0.56, + "learning_rate": 8.427165555878577e-06, + "loss": 0.2164, + "step": 7116 + }, + { + "epoch": 0.56, + "learning_rate": 8.424631514063247e-06, + "loss": 0.284, + "step": 7117 + }, + { + "epoch": 0.56, + "learning_rate": 8.422097575978349e-06, + "loss": 0.4034, + "step": 7118 + }, + { + "epoch": 0.56, + "learning_rate": 8.419563741790735e-06, + "loss": 0.2881, + "step": 7119 + }, + { + "epoch": 0.56, + "learning_rate": 8.417030011667241e-06, + "loss": 0.2719, + "step": 7120 + }, + { + "epoch": 0.56, + "learning_rate": 8.414496385774706e-06, + "loss": 0.4382, + "step": 7121 + }, + { + "epoch": 0.56, + "learning_rate": 8.411962864279957e-06, + "loss": 0.3369, + "step": 7122 + }, + { + "epoch": 0.56, + "learning_rate": 8.409429447349811e-06, + "loss": 0.3249, + "step": 7123 + }, + { + "epoch": 0.56, + "learning_rate": 8.406896135151081e-06, + "loss": 0.3303, + "step": 7124 + }, + { + "epoch": 0.56, + "learning_rate": 8.40436292785058e-06, + "loss": 0.3299, + "step": 7125 + }, + { + "epoch": 0.56, + "learning_rate": 8.401829825615098e-06, + "loss": 0.3638, + "step": 7126 + }, + { + "epoch": 0.56, + "learning_rate": 8.399296828611433e-06, + "loss": 0.3136, + "step": 7127 + }, + { + "epoch": 0.56, + "learning_rate": 8.396763937006369e-06, + "loss": 0.3536, + "step": 7128 + }, + { + "epoch": 0.56, + "learning_rate": 8.394231150966685e-06, + "loss": 0.4618, + "step": 7129 + }, + { + "epoch": 0.56, + "learning_rate": 8.391698470659154e-06, + "loss": 0.4316, + "step": 7130 + }, + { + "epoch": 0.56, + "learning_rate": 8.38916589625054e-06, + "loss": 0.3927, + "step": 7131 + }, + { + "epoch": 0.57, + "learning_rate": 8.3866334279076e-06, + "loss": 0.4468, + "step": 7132 + }, + { + "epoch": 0.57, + "learning_rate": 8.384101065797087e-06, + "loss": 0.3219, + "step": 7133 + }, + { + "epoch": 0.57, + "learning_rate": 8.381568810085745e-06, + "loss": 0.318, + "step": 7134 + }, + { + "epoch": 0.57, + "learning_rate": 8.379036660940306e-06, + "loss": 0.4421, + "step": 7135 + }, + { + "epoch": 0.57, + "learning_rate": 8.376504618527505e-06, + "loss": 0.2273, + "step": 7136 + }, + { + "epoch": 0.57, + "learning_rate": 8.373972683014063e-06, + "loss": 0.3392, + "step": 7137 + }, + { + "epoch": 0.57, + "learning_rate": 8.371440854566696e-06, + "loss": 0.2706, + "step": 7138 + }, + { + "epoch": 0.57, + "learning_rate": 8.368909133352114e-06, + "loss": 0.3965, + "step": 7139 + }, + { + "epoch": 0.57, + "learning_rate": 8.366377519537015e-06, + "loss": 0.407, + "step": 7140 + }, + { + "epoch": 0.57, + "learning_rate": 8.363846013288096e-06, + "loss": 0.3308, + "step": 7141 + }, + { + "epoch": 0.57, + "learning_rate": 8.361314614772047e-06, + "loss": 0.4946, + "step": 7142 + }, + { + "epoch": 0.57, + "learning_rate": 8.358783324155542e-06, + "loss": 0.2782, + "step": 7143 + }, + { + "epoch": 0.57, + "learning_rate": 8.35625214160526e-06, + "loss": 0.3372, + "step": 7144 + }, + { + "epoch": 0.57, + "learning_rate": 8.353721067287865e-06, + "loss": 0.3381, + "step": 7145 + }, + { + "epoch": 0.57, + "learning_rate": 8.351190101370016e-06, + "loss": 0.3056, + "step": 7146 + }, + { + "epoch": 0.57, + "learning_rate": 8.348659244018367e-06, + "loss": 0.4196, + "step": 7147 + }, + { + "epoch": 0.57, + "learning_rate": 8.34612849539956e-06, + "loss": 0.4403, + "step": 7148 + }, + { + "epoch": 0.57, + "learning_rate": 8.343597855680231e-06, + "loss": 0.3264, + "step": 7149 + }, + { + "epoch": 0.57, + "learning_rate": 8.341067325027017e-06, + "loss": 0.2364, + "step": 7150 + }, + { + "epoch": 0.57, + "learning_rate": 8.338536903606535e-06, + "loss": 0.3302, + "step": 7151 + }, + { + "epoch": 0.57, + "learning_rate": 8.336006591585406e-06, + "loss": 0.2504, + "step": 7152 + }, + { + "epoch": 0.57, + "learning_rate": 8.333476389130234e-06, + "loss": 0.3643, + "step": 7153 + }, + { + "epoch": 0.57, + "learning_rate": 8.330946296407622e-06, + "loss": 0.3187, + "step": 7154 + }, + { + "epoch": 0.57, + "learning_rate": 8.328416313584169e-06, + "loss": 0.2899, + "step": 7155 + }, + { + "epoch": 0.57, + "learning_rate": 8.325886440826457e-06, + "loss": 0.3438, + "step": 7156 + }, + { + "epoch": 0.57, + "learning_rate": 8.323356678301067e-06, + "loss": 0.2961, + "step": 7157 + }, + { + "epoch": 0.57, + "learning_rate": 8.320827026174572e-06, + "loss": 0.3159, + "step": 7158 + }, + { + "epoch": 0.57, + "learning_rate": 8.318297484613538e-06, + "loss": 0.3691, + "step": 7159 + }, + { + "epoch": 0.57, + "learning_rate": 8.315768053784524e-06, + "loss": 0.415, + "step": 7160 + }, + { + "epoch": 0.57, + "learning_rate": 8.313238733854076e-06, + "loss": 0.4083, + "step": 7161 + }, + { + "epoch": 0.57, + "learning_rate": 8.310709524988743e-06, + "loss": 0.3197, + "step": 7162 + }, + { + "epoch": 0.57, + "learning_rate": 8.308180427355062e-06, + "loss": 0.4579, + "step": 7163 + }, + { + "epoch": 0.57, + "learning_rate": 8.305651441119558e-06, + "loss": 0.3025, + "step": 7164 + }, + { + "epoch": 0.57, + "learning_rate": 8.303122566448754e-06, + "loss": 0.2461, + "step": 7165 + }, + { + "epoch": 0.57, + "learning_rate": 8.300593803509163e-06, + "loss": 0.3206, + "step": 7166 + }, + { + "epoch": 0.57, + "learning_rate": 8.298065152467293e-06, + "loss": 0.4222, + "step": 7167 + }, + { + "epoch": 0.57, + "learning_rate": 8.295536613489645e-06, + "loss": 0.2679, + "step": 7168 + }, + { + "epoch": 0.57, + "learning_rate": 8.293008186742708e-06, + "loss": 0.382, + "step": 7169 + }, + { + "epoch": 0.57, + "learning_rate": 8.290479872392969e-06, + "loss": 0.3145, + "step": 7170 + }, + { + "epoch": 0.57, + "learning_rate": 8.287951670606905e-06, + "loss": 0.3833, + "step": 7171 + }, + { + "epoch": 0.57, + "learning_rate": 8.285423581550985e-06, + "loss": 0.3883, + "step": 7172 + }, + { + "epoch": 0.57, + "learning_rate": 8.282895605391674e-06, + "loss": 0.3028, + "step": 7173 + }, + { + "epoch": 0.57, + "learning_rate": 8.280367742295424e-06, + "loss": 0.4073, + "step": 7174 + }, + { + "epoch": 0.57, + "learning_rate": 8.277839992428683e-06, + "loss": 0.4721, + "step": 7175 + }, + { + "epoch": 0.57, + "learning_rate": 8.275312355957893e-06, + "loss": 0.3701, + "step": 7176 + }, + { + "epoch": 0.57, + "learning_rate": 8.272784833049485e-06, + "loss": 0.3513, + "step": 7177 + }, + { + "epoch": 0.57, + "learning_rate": 8.270257423869885e-06, + "loss": 0.3596, + "step": 7178 + }, + { + "epoch": 0.57, + "learning_rate": 8.267730128585511e-06, + "loss": 0.3126, + "step": 7179 + }, + { + "epoch": 0.57, + "learning_rate": 8.265202947362772e-06, + "loss": 0.3655, + "step": 7180 + }, + { + "epoch": 0.57, + "learning_rate": 8.262675880368074e-06, + "loss": 0.3592, + "step": 7181 + }, + { + "epoch": 0.57, + "learning_rate": 8.260148927767807e-06, + "loss": 0.4217, + "step": 7182 + }, + { + "epoch": 0.57, + "learning_rate": 8.257622089728362e-06, + "loss": 0.4176, + "step": 7183 + }, + { + "epoch": 0.57, + "learning_rate": 8.255095366416122e-06, + "loss": 0.3916, + "step": 7184 + }, + { + "epoch": 0.57, + "learning_rate": 8.25256875799745e-06, + "loss": 0.3069, + "step": 7185 + }, + { + "epoch": 0.57, + "learning_rate": 8.250042264638721e-06, + "loss": 0.3929, + "step": 7186 + }, + { + "epoch": 0.57, + "learning_rate": 8.24751588650629e-06, + "loss": 0.2948, + "step": 7187 + }, + { + "epoch": 0.57, + "learning_rate": 8.244989623766502e-06, + "loss": 0.342, + "step": 7188 + }, + { + "epoch": 0.57, + "learning_rate": 8.242463476585707e-06, + "loss": 0.4003, + "step": 7189 + }, + { + "epoch": 0.57, + "learning_rate": 8.239937445130232e-06, + "loss": 0.3551, + "step": 7190 + }, + { + "epoch": 0.57, + "learning_rate": 8.237411529566407e-06, + "loss": 0.3734, + "step": 7191 + }, + { + "epoch": 0.57, + "learning_rate": 8.234885730060554e-06, + "loss": 0.3331, + "step": 7192 + }, + { + "epoch": 0.57, + "learning_rate": 8.232360046778982e-06, + "loss": 0.2554, + "step": 7193 + }, + { + "epoch": 0.57, + "learning_rate": 8.229834479887992e-06, + "loss": 0.3083, + "step": 7194 + }, + { + "epoch": 0.57, + "learning_rate": 8.227309029553889e-06, + "loss": 0.2426, + "step": 7195 + }, + { + "epoch": 0.57, + "learning_rate": 8.224783695942954e-06, + "loss": 0.3175, + "step": 7196 + }, + { + "epoch": 0.57, + "learning_rate": 8.222258479221473e-06, + "loss": 0.3375, + "step": 7197 + }, + { + "epoch": 0.57, + "learning_rate": 8.219733379555715e-06, + "loss": 0.3317, + "step": 7198 + }, + { + "epoch": 0.57, + "learning_rate": 8.217208397111948e-06, + "loss": 0.3475, + "step": 7199 + }, + { + "epoch": 0.57, + "learning_rate": 8.21468353205643e-06, + "loss": 0.425, + "step": 7200 + }, + { + "epoch": 0.57, + "learning_rate": 8.212158784555412e-06, + "loss": 0.4346, + "step": 7201 + }, + { + "epoch": 0.57, + "learning_rate": 8.209634154775134e-06, + "loss": 0.2722, + "step": 7202 + }, + { + "epoch": 0.57, + "learning_rate": 8.207109642881836e-06, + "loss": 0.4618, + "step": 7203 + }, + { + "epoch": 0.57, + "learning_rate": 8.20458524904174e-06, + "loss": 0.295, + "step": 7204 + }, + { + "epoch": 0.57, + "learning_rate": 8.202060973421064e-06, + "loss": 0.4199, + "step": 7205 + }, + { + "epoch": 0.57, + "learning_rate": 8.199536816186025e-06, + "loss": 0.3398, + "step": 7206 + }, + { + "epoch": 0.57, + "learning_rate": 8.197012777502819e-06, + "loss": 0.3702, + "step": 7207 + }, + { + "epoch": 0.57, + "learning_rate": 8.194488857537646e-06, + "loss": 0.3672, + "step": 7208 + }, + { + "epoch": 0.57, + "learning_rate": 8.191965056456699e-06, + "loss": 0.3104, + "step": 7209 + }, + { + "epoch": 0.57, + "learning_rate": 8.18944137442615e-06, + "loss": 0.4052, + "step": 7210 + }, + { + "epoch": 0.57, + "learning_rate": 8.186917811612173e-06, + "loss": 0.3419, + "step": 7211 + }, + { + "epoch": 0.57, + "learning_rate": 8.184394368180937e-06, + "loss": 0.2965, + "step": 7212 + }, + { + "epoch": 0.57, + "learning_rate": 8.181871044298594e-06, + "loss": 0.2977, + "step": 7213 + }, + { + "epoch": 0.57, + "learning_rate": 8.179347840131297e-06, + "loss": 0.37, + "step": 7214 + }, + { + "epoch": 0.57, + "learning_rate": 8.176824755845183e-06, + "loss": 0.3962, + "step": 7215 + }, + { + "epoch": 0.57, + "learning_rate": 8.174301791606384e-06, + "loss": 0.3915, + "step": 7216 + }, + { + "epoch": 0.57, + "learning_rate": 8.171778947581032e-06, + "loss": 0.3118, + "step": 7217 + }, + { + "epoch": 0.57, + "learning_rate": 8.169256223935236e-06, + "loss": 0.3304, + "step": 7218 + }, + { + "epoch": 0.57, + "learning_rate": 8.166733620835107e-06, + "loss": 0.353, + "step": 7219 + }, + { + "epoch": 0.57, + "learning_rate": 8.164211138446753e-06, + "loss": 0.3687, + "step": 7220 + }, + { + "epoch": 0.57, + "learning_rate": 8.161688776936259e-06, + "loss": 0.3654, + "step": 7221 + }, + { + "epoch": 0.57, + "learning_rate": 8.159166536469717e-06, + "loss": 0.389, + "step": 7222 + }, + { + "epoch": 0.57, + "learning_rate": 8.156644417213196e-06, + "loss": 0.3157, + "step": 7223 + }, + { + "epoch": 0.57, + "learning_rate": 8.154122419332772e-06, + "loss": 0.2131, + "step": 7224 + }, + { + "epoch": 0.57, + "learning_rate": 8.151600542994506e-06, + "loss": 0.3509, + "step": 7225 + }, + { + "epoch": 0.57, + "learning_rate": 8.149078788364451e-06, + "loss": 0.2943, + "step": 7226 + }, + { + "epoch": 0.57, + "learning_rate": 8.14655715560865e-06, + "loss": 0.3316, + "step": 7227 + }, + { + "epoch": 0.57, + "learning_rate": 8.144035644893143e-06, + "loss": 0.4159, + "step": 7228 + }, + { + "epoch": 0.57, + "learning_rate": 8.141514256383957e-06, + "loss": 0.3274, + "step": 7229 + }, + { + "epoch": 0.57, + "learning_rate": 8.138992990247119e-06, + "loss": 0.3463, + "step": 7230 + }, + { + "epoch": 0.57, + "learning_rate": 8.136471846648633e-06, + "loss": 0.3741, + "step": 7231 + }, + { + "epoch": 0.57, + "learning_rate": 8.133950825754511e-06, + "loss": 0.3951, + "step": 7232 + }, + { + "epoch": 0.57, + "learning_rate": 8.13142992773075e-06, + "loss": 0.366, + "step": 7233 + }, + { + "epoch": 0.57, + "learning_rate": 8.128909152743334e-06, + "loss": 0.3004, + "step": 7234 + }, + { + "epoch": 0.57, + "learning_rate": 8.12638850095825e-06, + "loss": 0.3088, + "step": 7235 + }, + { + "epoch": 0.57, + "learning_rate": 8.123867972541466e-06, + "loss": 0.3165, + "step": 7236 + }, + { + "epoch": 0.57, + "learning_rate": 8.12134756765895e-06, + "loss": 0.3418, + "step": 7237 + }, + { + "epoch": 0.57, + "learning_rate": 8.118827286476658e-06, + "loss": 0.3329, + "step": 7238 + }, + { + "epoch": 0.57, + "learning_rate": 8.116307129160535e-06, + "loss": 0.4207, + "step": 7239 + }, + { + "epoch": 0.57, + "learning_rate": 8.113787095876525e-06, + "loss": 0.2847, + "step": 7240 + }, + { + "epoch": 0.57, + "learning_rate": 8.11126718679056e-06, + "loss": 0.3271, + "step": 7241 + }, + { + "epoch": 0.57, + "learning_rate": 8.10874740206856e-06, + "loss": 0.4772, + "step": 7242 + }, + { + "epoch": 0.57, + "learning_rate": 8.106227741876447e-06, + "loss": 0.3642, + "step": 7243 + }, + { + "epoch": 0.57, + "learning_rate": 8.103708206380123e-06, + "loss": 0.3697, + "step": 7244 + }, + { + "epoch": 0.57, + "learning_rate": 8.101188795745489e-06, + "loss": 0.3203, + "step": 7245 + }, + { + "epoch": 0.57, + "learning_rate": 8.098669510138438e-06, + "loss": 0.4169, + "step": 7246 + }, + { + "epoch": 0.57, + "learning_rate": 8.09615034972485e-06, + "loss": 0.3381, + "step": 7247 + }, + { + "epoch": 0.57, + "learning_rate": 8.093631314670598e-06, + "loss": 0.4081, + "step": 7248 + }, + { + "epoch": 0.57, + "learning_rate": 8.091112405141555e-06, + "loss": 0.3472, + "step": 7249 + }, + { + "epoch": 0.57, + "learning_rate": 8.088593621303573e-06, + "loss": 0.3869, + "step": 7250 + }, + { + "epoch": 0.57, + "learning_rate": 8.086074963322505e-06, + "loss": 0.3525, + "step": 7251 + }, + { + "epoch": 0.57, + "learning_rate": 8.083556431364191e-06, + "loss": 0.3745, + "step": 7252 + }, + { + "epoch": 0.57, + "learning_rate": 8.081038025594464e-06, + "loss": 0.3917, + "step": 7253 + }, + { + "epoch": 0.57, + "learning_rate": 8.078519746179153e-06, + "loss": 0.3487, + "step": 7254 + }, + { + "epoch": 0.57, + "learning_rate": 8.076001593284066e-06, + "loss": 0.3252, + "step": 7255 + }, + { + "epoch": 0.57, + "learning_rate": 8.073483567075018e-06, + "loss": 0.316, + "step": 7256 + }, + { + "epoch": 0.57, + "learning_rate": 8.070965667717809e-06, + "loss": 0.2566, + "step": 7257 + }, + { + "epoch": 0.58, + "learning_rate": 8.06844789537823e-06, + "loss": 0.4027, + "step": 7258 + }, + { + "epoch": 0.58, + "learning_rate": 8.065930250222061e-06, + "loss": 0.3043, + "step": 7259 + }, + { + "epoch": 0.58, + "learning_rate": 8.063412732415077e-06, + "loss": 0.2719, + "step": 7260 + }, + { + "epoch": 0.58, + "learning_rate": 8.060895342123049e-06, + "loss": 0.4101, + "step": 7261 + }, + { + "epoch": 0.58, + "learning_rate": 8.058378079511732e-06, + "loss": 0.4041, + "step": 7262 + }, + { + "epoch": 0.58, + "learning_rate": 8.055860944746876e-06, + "loss": 0.3359, + "step": 7263 + }, + { + "epoch": 0.58, + "learning_rate": 8.05334393799422e-06, + "loss": 0.3294, + "step": 7264 + }, + { + "epoch": 0.58, + "learning_rate": 8.050827059419502e-06, + "loss": 0.2754, + "step": 7265 + }, + { + "epoch": 0.58, + "learning_rate": 8.04831030918844e-06, + "loss": 0.5236, + "step": 7266 + }, + { + "epoch": 0.58, + "learning_rate": 8.045793687466757e-06, + "loss": 0.3295, + "step": 7267 + }, + { + "epoch": 0.58, + "learning_rate": 8.043277194420155e-06, + "loss": 0.2707, + "step": 7268 + }, + { + "epoch": 0.58, + "learning_rate": 8.040760830214334e-06, + "loss": 0.3901, + "step": 7269 + }, + { + "epoch": 0.58, + "learning_rate": 8.038244595014986e-06, + "loss": 0.333, + "step": 7270 + }, + { + "epoch": 0.58, + "learning_rate": 8.03572848898779e-06, + "loss": 0.3458, + "step": 7271 + }, + { + "epoch": 0.58, + "learning_rate": 8.033212512298422e-06, + "loss": 0.3576, + "step": 7272 + }, + { + "epoch": 0.58, + "learning_rate": 8.03069666511255e-06, + "loss": 0.3818, + "step": 7273 + }, + { + "epoch": 0.58, + "learning_rate": 8.028180947595823e-06, + "loss": 0.3333, + "step": 7274 + }, + { + "epoch": 0.58, + "learning_rate": 8.025665359913897e-06, + "loss": 0.3125, + "step": 7275 + }, + { + "epoch": 0.58, + "learning_rate": 8.023149902232404e-06, + "loss": 0.3701, + "step": 7276 + }, + { + "epoch": 0.58, + "learning_rate": 8.020634574716976e-06, + "loss": 0.3255, + "step": 7277 + }, + { + "epoch": 0.58, + "learning_rate": 8.018119377533243e-06, + "loss": 0.3468, + "step": 7278 + }, + { + "epoch": 0.58, + "learning_rate": 8.015604310846807e-06, + "loss": 0.2867, + "step": 7279 + }, + { + "epoch": 0.58, + "learning_rate": 8.013089374823281e-06, + "loss": 0.3286, + "step": 7280 + }, + { + "epoch": 0.58, + "learning_rate": 8.010574569628263e-06, + "loss": 0.2749, + "step": 7281 + }, + { + "epoch": 0.58, + "learning_rate": 8.008059895427334e-06, + "loss": 0.2319, + "step": 7282 + }, + { + "epoch": 0.58, + "learning_rate": 8.005545352386077e-06, + "loss": 0.3337, + "step": 7283 + }, + { + "epoch": 0.58, + "learning_rate": 8.003030940670061e-06, + "loss": 0.2118, + "step": 7284 + }, + { + "epoch": 0.58, + "learning_rate": 8.000516660444848e-06, + "loss": 0.3875, + "step": 7285 + }, + { + "epoch": 0.58, + "learning_rate": 7.99800251187599e-06, + "loss": 0.3326, + "step": 7286 + }, + { + "epoch": 0.58, + "learning_rate": 7.995488495129039e-06, + "loss": 0.4493, + "step": 7287 + }, + { + "epoch": 0.58, + "learning_rate": 7.992974610369521e-06, + "loss": 0.381, + "step": 7288 + }, + { + "epoch": 0.58, + "learning_rate": 7.990460857762969e-06, + "loss": 0.2792, + "step": 7289 + }, + { + "epoch": 0.58, + "learning_rate": 7.987947237474903e-06, + "loss": 0.2956, + "step": 7290 + }, + { + "epoch": 0.58, + "learning_rate": 7.985433749670825e-06, + "loss": 0.4064, + "step": 7291 + }, + { + "epoch": 0.58, + "learning_rate": 7.982920394516247e-06, + "loss": 0.367, + "step": 7292 + }, + { + "epoch": 0.58, + "learning_rate": 7.98040717217665e-06, + "loss": 0.3492, + "step": 7293 + }, + { + "epoch": 0.58, + "learning_rate": 7.977894082817524e-06, + "loss": 0.3804, + "step": 7294 + }, + { + "epoch": 0.58, + "learning_rate": 7.975381126604346e-06, + "loss": 0.379, + "step": 7295 + }, + { + "epoch": 0.58, + "learning_rate": 7.972868303702576e-06, + "loss": 0.2729, + "step": 7296 + }, + { + "epoch": 0.58, + "learning_rate": 7.970355614277674e-06, + "loss": 0.2619, + "step": 7297 + }, + { + "epoch": 0.58, + "learning_rate": 7.967843058495092e-06, + "loss": 0.4485, + "step": 7298 + }, + { + "epoch": 0.58, + "learning_rate": 7.965330636520262e-06, + "loss": 0.3777, + "step": 7299 + }, + { + "epoch": 0.58, + "learning_rate": 7.962818348518623e-06, + "loss": 0.4021, + "step": 7300 + }, + { + "epoch": 0.58, + "learning_rate": 7.960306194655593e-06, + "loss": 0.2048, + "step": 7301 + }, + { + "epoch": 0.58, + "learning_rate": 7.957794175096585e-06, + "loss": 0.3809, + "step": 7302 + }, + { + "epoch": 0.58, + "learning_rate": 7.955282290007006e-06, + "loss": 0.3415, + "step": 7303 + }, + { + "epoch": 0.58, + "learning_rate": 7.952770539552246e-06, + "loss": 0.3614, + "step": 7304 + }, + { + "epoch": 0.58, + "learning_rate": 7.950258923897695e-06, + "loss": 0.3116, + "step": 7305 + }, + { + "epoch": 0.58, + "learning_rate": 7.947747443208735e-06, + "loss": 0.3794, + "step": 7306 + }, + { + "epoch": 0.58, + "learning_rate": 7.945236097650729e-06, + "loss": 0.2614, + "step": 7307 + }, + { + "epoch": 0.58, + "learning_rate": 7.942724887389041e-06, + "loss": 0.2611, + "step": 7308 + }, + { + "epoch": 0.58, + "learning_rate": 7.940213812589018e-06, + "loss": 0.3888, + "step": 7309 + }, + { + "epoch": 0.58, + "learning_rate": 7.937702873416005e-06, + "loss": 0.3881, + "step": 7310 + }, + { + "epoch": 0.58, + "learning_rate": 7.935192070035335e-06, + "loss": 0.2614, + "step": 7311 + }, + { + "epoch": 0.58, + "learning_rate": 7.932681402612332e-06, + "loss": 0.5272, + "step": 7312 + }, + { + "epoch": 0.58, + "learning_rate": 7.93017087131231e-06, + "loss": 0.321, + "step": 7313 + }, + { + "epoch": 0.58, + "learning_rate": 7.927660476300578e-06, + "loss": 0.3478, + "step": 7314 + }, + { + "epoch": 0.58, + "learning_rate": 7.925150217742431e-06, + "loss": 0.3582, + "step": 7315 + }, + { + "epoch": 0.58, + "learning_rate": 7.92264009580316e-06, + "loss": 0.3751, + "step": 7316 + }, + { + "epoch": 0.58, + "learning_rate": 7.920130110648044e-06, + "loss": 0.3074, + "step": 7317 + }, + { + "epoch": 0.58, + "learning_rate": 7.917620262442349e-06, + "loss": 0.2676, + "step": 7318 + }, + { + "epoch": 0.58, + "learning_rate": 7.915110551351344e-06, + "loss": 0.3041, + "step": 7319 + }, + { + "epoch": 0.58, + "learning_rate": 7.912600977540275e-06, + "loss": 0.429, + "step": 7320 + }, + { + "epoch": 0.58, + "learning_rate": 7.910091541174388e-06, + "loss": 0.4462, + "step": 7321 + }, + { + "epoch": 0.58, + "learning_rate": 7.907582242418916e-06, + "loss": 0.4531, + "step": 7322 + }, + { + "epoch": 0.58, + "learning_rate": 7.905073081439087e-06, + "loss": 0.3535, + "step": 7323 + }, + { + "epoch": 0.58, + "learning_rate": 7.902564058400116e-06, + "loss": 0.3676, + "step": 7324 + }, + { + "epoch": 0.58, + "learning_rate": 7.900055173467207e-06, + "loss": 0.2989, + "step": 7325 + }, + { + "epoch": 0.58, + "learning_rate": 7.897546426805561e-06, + "loss": 0.4434, + "step": 7326 + }, + { + "epoch": 0.58, + "learning_rate": 7.89503781858037e-06, + "loss": 0.3355, + "step": 7327 + }, + { + "epoch": 0.58, + "learning_rate": 7.892529348956805e-06, + "loss": 0.4254, + "step": 7328 + }, + { + "epoch": 0.58, + "learning_rate": 7.890021018100045e-06, + "loss": 0.2279, + "step": 7329 + }, + { + "epoch": 0.58, + "learning_rate": 7.887512826175247e-06, + "loss": 0.2909, + "step": 7330 + }, + { + "epoch": 0.58, + "learning_rate": 7.885004773347565e-06, + "loss": 0.3239, + "step": 7331 + }, + { + "epoch": 0.58, + "learning_rate": 7.882496859782145e-06, + "loss": 0.3797, + "step": 7332 + }, + { + "epoch": 0.58, + "learning_rate": 7.879989085644114e-06, + "loss": 0.2742, + "step": 7333 + }, + { + "epoch": 0.58, + "learning_rate": 7.877481451098602e-06, + "loss": 0.4702, + "step": 7334 + }, + { + "epoch": 0.58, + "learning_rate": 7.874973956310726e-06, + "loss": 0.3201, + "step": 7335 + }, + { + "epoch": 0.58, + "learning_rate": 7.872466601445587e-06, + "loss": 0.3854, + "step": 7336 + }, + { + "epoch": 0.58, + "learning_rate": 7.869959386668286e-06, + "loss": 0.3228, + "step": 7337 + }, + { + "epoch": 0.58, + "learning_rate": 7.86745231214391e-06, + "loss": 0.3179, + "step": 7338 + }, + { + "epoch": 0.58, + "learning_rate": 7.864945378037538e-06, + "loss": 0.4405, + "step": 7339 + }, + { + "epoch": 0.58, + "learning_rate": 7.862438584514242e-06, + "loss": 0.3958, + "step": 7340 + }, + { + "epoch": 0.58, + "learning_rate": 7.859931931739077e-06, + "loss": 0.3548, + "step": 7341 + }, + { + "epoch": 0.58, + "learning_rate": 7.857425419877097e-06, + "loss": 0.3539, + "step": 7342 + }, + { + "epoch": 0.58, + "learning_rate": 7.854919049093345e-06, + "loss": 0.3214, + "step": 7343 + }, + { + "epoch": 0.58, + "learning_rate": 7.852412819552853e-06, + "loss": 0.2837, + "step": 7344 + }, + { + "epoch": 0.58, + "learning_rate": 7.849906731420642e-06, + "loss": 0.2872, + "step": 7345 + }, + { + "epoch": 0.58, + "learning_rate": 7.847400784861727e-06, + "loss": 0.2062, + "step": 7346 + }, + { + "epoch": 0.58, + "learning_rate": 7.844894980041112e-06, + "loss": 0.3068, + "step": 7347 + }, + { + "epoch": 0.58, + "learning_rate": 7.842389317123795e-06, + "loss": 0.2806, + "step": 7348 + }, + { + "epoch": 0.58, + "learning_rate": 7.839883796274758e-06, + "loss": 0.3427, + "step": 7349 + }, + { + "epoch": 0.58, + "learning_rate": 7.83737841765898e-06, + "loss": 0.3383, + "step": 7350 + }, + { + "epoch": 0.58, + "learning_rate": 7.834873181441426e-06, + "loss": 0.3644, + "step": 7351 + }, + { + "epoch": 0.58, + "learning_rate": 7.832368087787056e-06, + "loss": 0.388, + "step": 7352 + }, + { + "epoch": 0.58, + "learning_rate": 7.82986313686082e-06, + "loss": 0.3448, + "step": 7353 + }, + { + "epoch": 0.58, + "learning_rate": 7.82735832882765e-06, + "loss": 0.3343, + "step": 7354 + }, + { + "epoch": 0.58, + "learning_rate": 7.824853663852482e-06, + "loss": 0.4008, + "step": 7355 + }, + { + "epoch": 0.58, + "learning_rate": 7.822349142100236e-06, + "loss": 0.347, + "step": 7356 + }, + { + "epoch": 0.58, + "learning_rate": 7.819844763735818e-06, + "loss": 0.2656, + "step": 7357 + }, + { + "epoch": 0.58, + "learning_rate": 7.817340528924132e-06, + "loss": 0.3318, + "step": 7358 + }, + { + "epoch": 0.58, + "learning_rate": 7.814836437830074e-06, + "loss": 0.3495, + "step": 7359 + }, + { + "epoch": 0.58, + "learning_rate": 7.812332490618521e-06, + "loss": 0.3681, + "step": 7360 + }, + { + "epoch": 0.58, + "learning_rate": 7.809828687454343e-06, + "loss": 0.3501, + "step": 7361 + }, + { + "epoch": 0.58, + "learning_rate": 7.807325028502412e-06, + "loss": 0.2545, + "step": 7362 + }, + { + "epoch": 0.58, + "learning_rate": 7.804821513927574e-06, + "loss": 0.3034, + "step": 7363 + }, + { + "epoch": 0.58, + "learning_rate": 7.802318143894678e-06, + "loss": 0.3368, + "step": 7364 + }, + { + "epoch": 0.58, + "learning_rate": 7.799814918568559e-06, + "loss": 0.2621, + "step": 7365 + }, + { + "epoch": 0.58, + "learning_rate": 7.797311838114038e-06, + "loss": 0.3819, + "step": 7366 + }, + { + "epoch": 0.58, + "learning_rate": 7.794808902695935e-06, + "loss": 0.2708, + "step": 7367 + }, + { + "epoch": 0.58, + "learning_rate": 7.792306112479055e-06, + "loss": 0.3448, + "step": 7368 + }, + { + "epoch": 0.58, + "learning_rate": 7.789803467628196e-06, + "loss": 0.3541, + "step": 7369 + }, + { + "epoch": 0.58, + "learning_rate": 7.787300968308144e-06, + "loss": 0.3632, + "step": 7370 + }, + { + "epoch": 0.58, + "learning_rate": 7.784798614683675e-06, + "loss": 0.3059, + "step": 7371 + }, + { + "epoch": 0.58, + "learning_rate": 7.782296406919557e-06, + "loss": 0.3965, + "step": 7372 + }, + { + "epoch": 0.58, + "learning_rate": 7.779794345180552e-06, + "loss": 0.2682, + "step": 7373 + }, + { + "epoch": 0.58, + "learning_rate": 7.777292429631405e-06, + "loss": 0.3097, + "step": 7374 + }, + { + "epoch": 0.58, + "learning_rate": 7.774790660436857e-06, + "loss": 0.5221, + "step": 7375 + }, + { + "epoch": 0.58, + "learning_rate": 7.772289037761639e-06, + "loss": 0.344, + "step": 7376 + }, + { + "epoch": 0.58, + "learning_rate": 7.769787561770466e-06, + "loss": 0.3383, + "step": 7377 + }, + { + "epoch": 0.58, + "learning_rate": 7.767286232628054e-06, + "loss": 0.4762, + "step": 7378 + }, + { + "epoch": 0.58, + "learning_rate": 7.764785050499098e-06, + "loss": 0.2946, + "step": 7379 + }, + { + "epoch": 0.58, + "learning_rate": 7.76228401554829e-06, + "loss": 0.3161, + "step": 7380 + }, + { + "epoch": 0.58, + "learning_rate": 7.759783127940315e-06, + "loss": 0.3967, + "step": 7381 + }, + { + "epoch": 0.58, + "learning_rate": 7.757282387839842e-06, + "loss": 0.3313, + "step": 7382 + }, + { + "epoch": 0.58, + "learning_rate": 7.75478179541153e-06, + "loss": 0.3758, + "step": 7383 + }, + { + "epoch": 0.58, + "learning_rate": 7.752281350820037e-06, + "loss": 0.4423, + "step": 7384 + }, + { + "epoch": 0.59, + "learning_rate": 7.749781054229998e-06, + "loss": 0.3802, + "step": 7385 + }, + { + "epoch": 0.59, + "learning_rate": 7.747280905806051e-06, + "loss": 0.4238, + "step": 7386 + }, + { + "epoch": 0.59, + "learning_rate": 7.744780905712818e-06, + "loss": 0.3198, + "step": 7387 + }, + { + "epoch": 0.59, + "learning_rate": 7.742281054114909e-06, + "loss": 0.311, + "step": 7388 + }, + { + "epoch": 0.59, + "learning_rate": 7.73978135117693e-06, + "loss": 0.3378, + "step": 7389 + }, + { + "epoch": 0.59, + "learning_rate": 7.737281797063473e-06, + "loss": 0.4018, + "step": 7390 + }, + { + "epoch": 0.59, + "learning_rate": 7.734782391939123e-06, + "loss": 0.3682, + "step": 7391 + }, + { + "epoch": 0.59, + "learning_rate": 7.732283135968452e-06, + "loss": 0.2485, + "step": 7392 + }, + { + "epoch": 0.59, + "learning_rate": 7.729784029316025e-06, + "loss": 0.2688, + "step": 7393 + }, + { + "epoch": 0.59, + "learning_rate": 7.7272850721464e-06, + "loss": 0.3605, + "step": 7394 + }, + { + "epoch": 0.59, + "learning_rate": 7.724786264624112e-06, + "loss": 0.4822, + "step": 7395 + }, + { + "epoch": 0.59, + "learning_rate": 7.722287606913703e-06, + "loss": 0.2969, + "step": 7396 + }, + { + "epoch": 0.59, + "learning_rate": 7.719789099179696e-06, + "loss": 0.2425, + "step": 7397 + }, + { + "epoch": 0.59, + "learning_rate": 7.717290741586602e-06, + "loss": 0.3379, + "step": 7398 + }, + { + "epoch": 0.59, + "learning_rate": 7.714792534298934e-06, + "loss": 0.4032, + "step": 7399 + }, + { + "epoch": 0.59, + "learning_rate": 7.712294477481177e-06, + "loss": 0.5683, + "step": 7400 + }, + { + "epoch": 0.59, + "learning_rate": 7.709796571297823e-06, + "loss": 0.2873, + "step": 7401 + }, + { + "epoch": 0.59, + "learning_rate": 7.707298815913346e-06, + "loss": 0.3573, + "step": 7402 + }, + { + "epoch": 0.59, + "learning_rate": 7.70480121149221e-06, + "loss": 0.4885, + "step": 7403 + }, + { + "epoch": 0.59, + "learning_rate": 7.702303758198868e-06, + "loss": 0.3213, + "step": 7404 + }, + { + "epoch": 0.59, + "learning_rate": 7.699806456197771e-06, + "loss": 0.3215, + "step": 7405 + }, + { + "epoch": 0.59, + "learning_rate": 7.697309305653348e-06, + "loss": 0.4929, + "step": 7406 + }, + { + "epoch": 0.59, + "learning_rate": 7.694812306730031e-06, + "loss": 0.309, + "step": 7407 + }, + { + "epoch": 0.59, + "learning_rate": 7.69231545959223e-06, + "loss": 0.4076, + "step": 7408 + }, + { + "epoch": 0.59, + "learning_rate": 7.689818764404351e-06, + "loss": 0.2729, + "step": 7409 + }, + { + "epoch": 0.59, + "learning_rate": 7.687322221330794e-06, + "loss": 0.3062, + "step": 7410 + }, + { + "epoch": 0.59, + "learning_rate": 7.684825830535935e-06, + "loss": 0.3646, + "step": 7411 + }, + { + "epoch": 0.59, + "learning_rate": 7.682329592184158e-06, + "loss": 0.4177, + "step": 7412 + }, + { + "epoch": 0.59, + "learning_rate": 7.679833506439826e-06, + "loss": 0.3665, + "step": 7413 + }, + { + "epoch": 0.59, + "learning_rate": 7.677337573467294e-06, + "loss": 0.3134, + "step": 7414 + }, + { + "epoch": 0.59, + "learning_rate": 7.674841793430907e-06, + "loss": 0.3856, + "step": 7415 + }, + { + "epoch": 0.59, + "learning_rate": 7.672346166494999e-06, + "loss": 0.412, + "step": 7416 + }, + { + "epoch": 0.59, + "learning_rate": 7.669850692823895e-06, + "loss": 0.4298, + "step": 7417 + }, + { + "epoch": 0.59, + "learning_rate": 7.667355372581913e-06, + "loss": 0.3131, + "step": 7418 + }, + { + "epoch": 0.59, + "learning_rate": 7.664860205933356e-06, + "loss": 0.4035, + "step": 7419 + }, + { + "epoch": 0.59, + "learning_rate": 7.662365193042516e-06, + "loss": 0.3018, + "step": 7420 + }, + { + "epoch": 0.59, + "learning_rate": 7.659870334073683e-06, + "loss": 0.3244, + "step": 7421 + }, + { + "epoch": 0.59, + "learning_rate": 7.657375629191126e-06, + "loss": 0.3422, + "step": 7422 + }, + { + "epoch": 0.59, + "learning_rate": 7.654881078559112e-06, + "loss": 0.3817, + "step": 7423 + }, + { + "epoch": 0.59, + "learning_rate": 7.652386682341895e-06, + "loss": 0.4707, + "step": 7424 + }, + { + "epoch": 0.59, + "learning_rate": 7.64989244070372e-06, + "loss": 0.3059, + "step": 7425 + }, + { + "epoch": 0.59, + "learning_rate": 7.647398353808822e-06, + "loss": 0.3029, + "step": 7426 + }, + { + "epoch": 0.59, + "learning_rate": 7.644904421821418e-06, + "loss": 0.2413, + "step": 7427 + }, + { + "epoch": 0.59, + "learning_rate": 7.642410644905726e-06, + "loss": 0.3813, + "step": 7428 + }, + { + "epoch": 0.59, + "learning_rate": 7.639917023225953e-06, + "loss": 0.2833, + "step": 7429 + }, + { + "epoch": 0.59, + "learning_rate": 7.637423556946284e-06, + "loss": 0.3123, + "step": 7430 + }, + { + "epoch": 0.59, + "learning_rate": 7.63493024623091e-06, + "loss": 0.314, + "step": 7431 + }, + { + "epoch": 0.59, + "learning_rate": 7.632437091243996e-06, + "loss": 0.337, + "step": 7432 + }, + { + "epoch": 0.59, + "learning_rate": 7.629944092149707e-06, + "loss": 0.3634, + "step": 7433 + }, + { + "epoch": 0.59, + "learning_rate": 7.627451249112199e-06, + "loss": 0.2322, + "step": 7434 + }, + { + "epoch": 0.59, + "learning_rate": 7.624958562295607e-06, + "loss": 0.3416, + "step": 7435 + }, + { + "epoch": 0.59, + "learning_rate": 7.622466031864066e-06, + "loss": 0.2126, + "step": 7436 + }, + { + "epoch": 0.59, + "learning_rate": 7.6199736579817005e-06, + "loss": 0.2701, + "step": 7437 + }, + { + "epoch": 0.59, + "learning_rate": 7.617481440812617e-06, + "loss": 0.3908, + "step": 7438 + }, + { + "epoch": 0.59, + "learning_rate": 7.614989380520914e-06, + "loss": 0.2898, + "step": 7439 + }, + { + "epoch": 0.59, + "learning_rate": 7.612497477270686e-06, + "loss": 0.2927, + "step": 7440 + }, + { + "epoch": 0.59, + "learning_rate": 7.610005731226009e-06, + "loss": 0.3782, + "step": 7441 + }, + { + "epoch": 0.59, + "learning_rate": 7.607514142550955e-06, + "loss": 0.4588, + "step": 7442 + }, + { + "epoch": 0.59, + "learning_rate": 7.605022711409585e-06, + "loss": 0.2895, + "step": 7443 + }, + { + "epoch": 0.59, + "learning_rate": 7.602531437965943e-06, + "loss": 0.3413, + "step": 7444 + }, + { + "epoch": 0.59, + "learning_rate": 7.6000403223840714e-06, + "loss": 0.3617, + "step": 7445 + }, + { + "epoch": 0.59, + "learning_rate": 7.597549364827997e-06, + "loss": 0.2503, + "step": 7446 + }, + { + "epoch": 0.59, + "learning_rate": 7.595058565461736e-06, + "loss": 0.2678, + "step": 7447 + }, + { + "epoch": 0.59, + "learning_rate": 7.5925679244492985e-06, + "loss": 0.4074, + "step": 7448 + }, + { + "epoch": 0.59, + "learning_rate": 7.5900774419546775e-06, + "loss": 0.409, + "step": 7449 + }, + { + "epoch": 0.59, + "learning_rate": 7.58758711814186e-06, + "loss": 0.2405, + "step": 7450 + }, + { + "epoch": 0.59, + "learning_rate": 7.585096953174827e-06, + "loss": 0.4104, + "step": 7451 + }, + { + "epoch": 0.59, + "learning_rate": 7.582606947217537e-06, + "loss": 0.3655, + "step": 7452 + }, + { + "epoch": 0.59, + "learning_rate": 7.580117100433947e-06, + "loss": 0.5192, + "step": 7453 + }, + { + "epoch": 0.59, + "learning_rate": 7.577627412988005e-06, + "loss": 0.3253, + "step": 7454 + }, + { + "epoch": 0.59, + "learning_rate": 7.57513788504364e-06, + "loss": 0.4485, + "step": 7455 + }, + { + "epoch": 0.59, + "learning_rate": 7.572648516764778e-06, + "loss": 0.398, + "step": 7456 + }, + { + "epoch": 0.59, + "learning_rate": 7.570159308315331e-06, + "loss": 0.3747, + "step": 7457 + }, + { + "epoch": 0.59, + "learning_rate": 7.5676702598592025e-06, + "loss": 0.4273, + "step": 7458 + }, + { + "epoch": 0.59, + "learning_rate": 7.5651813715602855e-06, + "loss": 0.328, + "step": 7459 + }, + { + "epoch": 0.59, + "learning_rate": 7.562692643582456e-06, + "loss": 0.2772, + "step": 7460 + }, + { + "epoch": 0.59, + "learning_rate": 7.56020407608959e-06, + "loss": 0.3776, + "step": 7461 + }, + { + "epoch": 0.59, + "learning_rate": 7.557715669245547e-06, + "loss": 0.3624, + "step": 7462 + }, + { + "epoch": 0.59, + "learning_rate": 7.555227423214174e-06, + "loss": 0.3788, + "step": 7463 + }, + { + "epoch": 0.59, + "learning_rate": 7.552739338159314e-06, + "loss": 0.2622, + "step": 7464 + }, + { + "epoch": 0.59, + "learning_rate": 7.550251414244791e-06, + "loss": 0.2522, + "step": 7465 + }, + { + "epoch": 0.59, + "learning_rate": 7.5477636516344255e-06, + "loss": 0.3382, + "step": 7466 + }, + { + "epoch": 0.59, + "learning_rate": 7.545276050492025e-06, + "loss": 0.2943, + "step": 7467 + }, + { + "epoch": 0.59, + "learning_rate": 7.542788610981384e-06, + "loss": 0.4444, + "step": 7468 + }, + { + "epoch": 0.59, + "learning_rate": 7.540301333266289e-06, + "loss": 0.4076, + "step": 7469 + }, + { + "epoch": 0.59, + "learning_rate": 7.537814217510518e-06, + "loss": 0.2957, + "step": 7470 + }, + { + "epoch": 0.59, + "learning_rate": 7.535327263877832e-06, + "loss": 0.3021, + "step": 7471 + }, + { + "epoch": 0.59, + "learning_rate": 7.532840472531988e-06, + "loss": 0.3518, + "step": 7472 + }, + { + "epoch": 0.59, + "learning_rate": 7.530353843636726e-06, + "loss": 0.391, + "step": 7473 + }, + { + "epoch": 0.59, + "learning_rate": 7.52786737735578e-06, + "loss": 0.329, + "step": 7474 + }, + { + "epoch": 0.59, + "learning_rate": 7.525381073852874e-06, + "loss": 0.2802, + "step": 7475 + }, + { + "epoch": 0.59, + "learning_rate": 7.522894933291715e-06, + "loss": 0.3617, + "step": 7476 + }, + { + "epoch": 0.59, + "learning_rate": 7.5204089558360076e-06, + "loss": 0.3749, + "step": 7477 + }, + { + "epoch": 0.59, + "learning_rate": 7.517923141649439e-06, + "loss": 0.3088, + "step": 7478 + }, + { + "epoch": 0.59, + "learning_rate": 7.515437490895688e-06, + "loss": 0.4254, + "step": 7479 + }, + { + "epoch": 0.59, + "learning_rate": 7.5129520037384225e-06, + "loss": 0.3632, + "step": 7480 + }, + { + "epoch": 0.59, + "learning_rate": 7.5104666803413015e-06, + "loss": 0.3577, + "step": 7481 + }, + { + "epoch": 0.59, + "learning_rate": 7.50798152086797e-06, + "loss": 0.3488, + "step": 7482 + }, + { + "epoch": 0.59, + "learning_rate": 7.505496525482066e-06, + "loss": 0.3283, + "step": 7483 + }, + { + "epoch": 0.59, + "learning_rate": 7.503011694347212e-06, + "loss": 0.326, + "step": 7484 + }, + { + "epoch": 0.59, + "learning_rate": 7.500527027627025e-06, + "loss": 0.416, + "step": 7485 + }, + { + "epoch": 0.59, + "learning_rate": 7.4980425254851034e-06, + "loss": 0.3614, + "step": 7486 + }, + { + "epoch": 0.59, + "learning_rate": 7.495558188085044e-06, + "loss": 0.2861, + "step": 7487 + }, + { + "epoch": 0.59, + "learning_rate": 7.493074015590429e-06, + "loss": 0.3255, + "step": 7488 + }, + { + "epoch": 0.59, + "learning_rate": 7.490590008164824e-06, + "loss": 0.3227, + "step": 7489 + }, + { + "epoch": 0.59, + "learning_rate": 7.488106165971795e-06, + "loss": 0.3785, + "step": 7490 + }, + { + "epoch": 0.59, + "learning_rate": 7.485622489174888e-06, + "loss": 0.2639, + "step": 7491 + }, + { + "epoch": 0.59, + "learning_rate": 7.483138977937643e-06, + "loss": 0.3158, + "step": 7492 + }, + { + "epoch": 0.59, + "learning_rate": 7.480655632423586e-06, + "loss": 0.2409, + "step": 7493 + }, + { + "epoch": 0.59, + "learning_rate": 7.478172452796231e-06, + "loss": 0.3812, + "step": 7494 + }, + { + "epoch": 0.59, + "learning_rate": 7.475689439219085e-06, + "loss": 0.2962, + "step": 7495 + }, + { + "epoch": 0.59, + "learning_rate": 7.473206591855646e-06, + "loss": 0.384, + "step": 7496 + }, + { + "epoch": 0.59, + "learning_rate": 7.470723910869393e-06, + "loss": 0.4051, + "step": 7497 + }, + { + "epoch": 0.59, + "learning_rate": 7.468241396423801e-06, + "loss": 0.3795, + "step": 7498 + }, + { + "epoch": 0.59, + "learning_rate": 7.465759048682333e-06, + "loss": 0.3426, + "step": 7499 + }, + { + "epoch": 0.59, + "learning_rate": 7.463276867808435e-06, + "loss": 0.2859, + "step": 7500 + }, + { + "epoch": 0.59, + "learning_rate": 7.46079485396555e-06, + "loss": 0.3332, + "step": 7501 + }, + { + "epoch": 0.59, + "learning_rate": 7.458313007317106e-06, + "loss": 0.3876, + "step": 7502 + }, + { + "epoch": 0.59, + "learning_rate": 7.45583132802652e-06, + "loss": 0.2889, + "step": 7503 + }, + { + "epoch": 0.59, + "learning_rate": 7.4533498162572004e-06, + "loss": 0.3924, + "step": 7504 + }, + { + "epoch": 0.59, + "learning_rate": 7.450868472172541e-06, + "loss": 0.3565, + "step": 7505 + }, + { + "epoch": 0.59, + "learning_rate": 7.448387295935926e-06, + "loss": 0.318, + "step": 7506 + }, + { + "epoch": 0.59, + "learning_rate": 7.445906287710733e-06, + "loss": 0.4613, + "step": 7507 + }, + { + "epoch": 0.59, + "learning_rate": 7.443425447660319e-06, + "loss": 0.3025, + "step": 7508 + }, + { + "epoch": 0.59, + "learning_rate": 7.4409447759480404e-06, + "loss": 0.2991, + "step": 7509 + }, + { + "epoch": 0.59, + "learning_rate": 7.438464272737232e-06, + "loss": 0.2861, + "step": 7510 + }, + { + "epoch": 0.6, + "learning_rate": 7.435983938191227e-06, + "loss": 0.3642, + "step": 7511 + }, + { + "epoch": 0.6, + "learning_rate": 7.433503772473343e-06, + "loss": 0.4153, + "step": 7512 + }, + { + "epoch": 0.6, + "learning_rate": 7.431023775746886e-06, + "loss": 0.3493, + "step": 7513 + }, + { + "epoch": 0.6, + "learning_rate": 7.428543948175151e-06, + "loss": 0.3659, + "step": 7514 + }, + { + "epoch": 0.6, + "learning_rate": 7.426064289921429e-06, + "loss": 0.2806, + "step": 7515 + }, + { + "epoch": 0.6, + "learning_rate": 7.423584801148985e-06, + "loss": 0.3645, + "step": 7516 + }, + { + "epoch": 0.6, + "learning_rate": 7.421105482021084e-06, + "loss": 0.375, + "step": 7517 + }, + { + "epoch": 0.6, + "learning_rate": 7.41862633270098e-06, + "loss": 0.199, + "step": 7518 + }, + { + "epoch": 0.6, + "learning_rate": 7.416147353351909e-06, + "loss": 0.3575, + "step": 7519 + }, + { + "epoch": 0.6, + "learning_rate": 7.4136685441371025e-06, + "loss": 0.382, + "step": 7520 + }, + { + "epoch": 0.6, + "learning_rate": 7.41118990521978e-06, + "loss": 0.3609, + "step": 7521 + }, + { + "epoch": 0.6, + "learning_rate": 7.408711436763143e-06, + "loss": 0.3683, + "step": 7522 + }, + { + "epoch": 0.6, + "learning_rate": 7.406233138930389e-06, + "loss": 0.387, + "step": 7523 + }, + { + "epoch": 0.6, + "learning_rate": 7.4037550118847044e-06, + "loss": 0.2606, + "step": 7524 + }, + { + "epoch": 0.6, + "learning_rate": 7.401277055789259e-06, + "loss": 0.3977, + "step": 7525 + }, + { + "epoch": 0.6, + "learning_rate": 7.398799270807217e-06, + "loss": 0.3981, + "step": 7526 + }, + { + "epoch": 0.6, + "learning_rate": 7.3963216571017235e-06, + "loss": 0.3192, + "step": 7527 + }, + { + "epoch": 0.6, + "learning_rate": 7.3938442148359215e-06, + "loss": 0.3319, + "step": 7528 + }, + { + "epoch": 0.6, + "learning_rate": 7.391366944172941e-06, + "loss": 0.3146, + "step": 7529 + }, + { + "epoch": 0.6, + "learning_rate": 7.388889845275893e-06, + "loss": 0.3917, + "step": 7530 + }, + { + "epoch": 0.6, + "learning_rate": 7.3864129183078835e-06, + "loss": 0.4387, + "step": 7531 + }, + { + "epoch": 0.6, + "learning_rate": 7.38393616343201e-06, + "loss": 0.416, + "step": 7532 + }, + { + "epoch": 0.6, + "learning_rate": 7.381459580811352e-06, + "loss": 0.3097, + "step": 7533 + }, + { + "epoch": 0.6, + "learning_rate": 7.378983170608982e-06, + "loss": 0.4106, + "step": 7534 + }, + { + "epoch": 0.6, + "learning_rate": 7.376506932987956e-06, + "loss": 0.3435, + "step": 7535 + }, + { + "epoch": 0.6, + "learning_rate": 7.374030868111326e-06, + "loss": 0.3198, + "step": 7536 + }, + { + "epoch": 0.6, + "learning_rate": 7.371554976142128e-06, + "loss": 0.3507, + "step": 7537 + }, + { + "epoch": 0.6, + "learning_rate": 7.369079257243388e-06, + "loss": 0.3311, + "step": 7538 + }, + { + "epoch": 0.6, + "learning_rate": 7.366603711578119e-06, + "loss": 0.3723, + "step": 7539 + }, + { + "epoch": 0.6, + "learning_rate": 7.364128339309326e-06, + "loss": 0.267, + "step": 7540 + }, + { + "epoch": 0.6, + "learning_rate": 7.361653140599997e-06, + "loss": 0.361, + "step": 7541 + }, + { + "epoch": 0.6, + "learning_rate": 7.359178115613116e-06, + "loss": 0.3075, + "step": 7542 + }, + { + "epoch": 0.6, + "learning_rate": 7.356703264511646e-06, + "loss": 0.4445, + "step": 7543 + }, + { + "epoch": 0.6, + "learning_rate": 7.354228587458549e-06, + "loss": 0.3673, + "step": 7544 + }, + { + "epoch": 0.6, + "learning_rate": 7.351754084616771e-06, + "loss": 0.3688, + "step": 7545 + }, + { + "epoch": 0.6, + "learning_rate": 7.349279756149241e-06, + "loss": 0.352, + "step": 7546 + }, + { + "epoch": 0.6, + "learning_rate": 7.346805602218885e-06, + "loss": 0.3929, + "step": 7547 + }, + { + "epoch": 0.6, + "learning_rate": 7.344331622988616e-06, + "loss": 0.2424, + "step": 7548 + }, + { + "epoch": 0.6, + "learning_rate": 7.341857818621328e-06, + "loss": 0.3309, + "step": 7549 + }, + { + "epoch": 0.6, + "learning_rate": 7.339384189279917e-06, + "loss": 0.2448, + "step": 7550 + }, + { + "epoch": 0.6, + "learning_rate": 7.33691073512725e-06, + "loss": 0.3962, + "step": 7551 + }, + { + "epoch": 0.6, + "learning_rate": 7.3344374563262e-06, + "loss": 0.2951, + "step": 7552 + }, + { + "epoch": 0.6, + "learning_rate": 7.3319643530396175e-06, + "loss": 0.302, + "step": 7553 + }, + { + "epoch": 0.6, + "learning_rate": 7.329491425430344e-06, + "loss": 0.3916, + "step": 7554 + }, + { + "epoch": 0.6, + "learning_rate": 7.327018673661209e-06, + "loss": 0.4095, + "step": 7555 + }, + { + "epoch": 0.6, + "learning_rate": 7.324546097895036e-06, + "loss": 0.3351, + "step": 7556 + }, + { + "epoch": 0.6, + "learning_rate": 7.3220736982946275e-06, + "loss": 0.263, + "step": 7557 + }, + { + "epoch": 0.6, + "learning_rate": 7.3196014750227815e-06, + "loss": 0.3953, + "step": 7558 + }, + { + "epoch": 0.6, + "learning_rate": 7.317129428242279e-06, + "loss": 0.2326, + "step": 7559 + }, + { + "epoch": 0.6, + "learning_rate": 7.3146575581158945e-06, + "loss": 0.2704, + "step": 7560 + }, + { + "epoch": 0.6, + "learning_rate": 7.312185864806391e-06, + "loss": 0.3208, + "step": 7561 + }, + { + "epoch": 0.6, + "learning_rate": 7.309714348476513e-06, + "loss": 0.4249, + "step": 7562 + }, + { + "epoch": 0.6, + "learning_rate": 7.307243009289005e-06, + "loss": 0.2149, + "step": 7563 + }, + { + "epoch": 0.6, + "learning_rate": 7.304771847406582e-06, + "loss": 0.3455, + "step": 7564 + }, + { + "epoch": 0.6, + "learning_rate": 7.3023008629919665e-06, + "loss": 0.2928, + "step": 7565 + }, + { + "epoch": 0.6, + "learning_rate": 7.299830056207861e-06, + "loss": 0.2759, + "step": 7566 + }, + { + "epoch": 0.6, + "learning_rate": 7.29735942721695e-06, + "loss": 0.3782, + "step": 7567 + }, + { + "epoch": 0.6, + "learning_rate": 7.294888976181919e-06, + "loss": 0.3988, + "step": 7568 + }, + { + "epoch": 0.6, + "learning_rate": 7.2924187032654335e-06, + "loss": 0.422, + "step": 7569 + }, + { + "epoch": 0.6, + "learning_rate": 7.289948608630146e-06, + "loss": 0.3079, + "step": 7570 + }, + { + "epoch": 0.6, + "learning_rate": 7.287478692438705e-06, + "loss": 0.3822, + "step": 7571 + }, + { + "epoch": 0.6, + "learning_rate": 7.285008954853739e-06, + "loss": 0.3625, + "step": 7572 + }, + { + "epoch": 0.6, + "learning_rate": 7.282539396037868e-06, + "loss": 0.295, + "step": 7573 + }, + { + "epoch": 0.6, + "learning_rate": 7.280070016153706e-06, + "loss": 0.4557, + "step": 7574 + }, + { + "epoch": 0.6, + "learning_rate": 7.277600815363842e-06, + "loss": 0.2525, + "step": 7575 + }, + { + "epoch": 0.6, + "learning_rate": 7.275131793830865e-06, + "loss": 0.3198, + "step": 7576 + }, + { + "epoch": 0.6, + "learning_rate": 7.272662951717352e-06, + "loss": 0.3684, + "step": 7577 + }, + { + "epoch": 0.6, + "learning_rate": 7.270194289185858e-06, + "loss": 0.3093, + "step": 7578 + }, + { + "epoch": 0.6, + "learning_rate": 7.267725806398936e-06, + "loss": 0.2313, + "step": 7579 + }, + { + "epoch": 0.6, + "learning_rate": 7.265257503519122e-06, + "loss": 0.3652, + "step": 7580 + }, + { + "epoch": 0.6, + "learning_rate": 7.262789380708942e-06, + "loss": 0.4071, + "step": 7581 + }, + { + "epoch": 0.6, + "learning_rate": 7.260321438130913e-06, + "loss": 0.354, + "step": 7582 + }, + { + "epoch": 0.6, + "learning_rate": 7.257853675947533e-06, + "loss": 0.3523, + "step": 7583 + }, + { + "epoch": 0.6, + "learning_rate": 7.255386094321293e-06, + "loss": 0.3579, + "step": 7584 + }, + { + "epoch": 0.6, + "learning_rate": 7.2529186934146756e-06, + "loss": 0.301, + "step": 7585 + }, + { + "epoch": 0.6, + "learning_rate": 7.250451473390141e-06, + "loss": 0.304, + "step": 7586 + }, + { + "epoch": 0.6, + "learning_rate": 7.24798443441015e-06, + "loss": 0.317, + "step": 7587 + }, + { + "epoch": 0.6, + "learning_rate": 7.24551757663714e-06, + "loss": 0.2865, + "step": 7588 + }, + { + "epoch": 0.6, + "learning_rate": 7.2430509002335434e-06, + "loss": 0.3868, + "step": 7589 + }, + { + "epoch": 0.6, + "learning_rate": 7.240584405361781e-06, + "loss": 0.3596, + "step": 7590 + }, + { + "epoch": 0.6, + "learning_rate": 7.238118092184256e-06, + "loss": 0.29, + "step": 7591 + }, + { + "epoch": 0.6, + "learning_rate": 7.2356519608633665e-06, + "loss": 0.3772, + "step": 7592 + }, + { + "epoch": 0.6, + "learning_rate": 7.233186011561498e-06, + "loss": 0.4378, + "step": 7593 + }, + { + "epoch": 0.6, + "learning_rate": 7.230720244441016e-06, + "loss": 0.312, + "step": 7594 + }, + { + "epoch": 0.6, + "learning_rate": 7.228254659664278e-06, + "loss": 0.4384, + "step": 7595 + }, + { + "epoch": 0.6, + "learning_rate": 7.225789257393636e-06, + "loss": 0.3077, + "step": 7596 + }, + { + "epoch": 0.6, + "learning_rate": 7.223324037791421e-06, + "loss": 0.4311, + "step": 7597 + }, + { + "epoch": 0.6, + "learning_rate": 7.220859001019957e-06, + "loss": 0.3574, + "step": 7598 + }, + { + "epoch": 0.6, + "learning_rate": 7.218394147241559e-06, + "loss": 0.4179, + "step": 7599 + }, + { + "epoch": 0.6, + "learning_rate": 7.2159294766185174e-06, + "loss": 0.3403, + "step": 7600 + }, + { + "epoch": 0.6, + "learning_rate": 7.213464989313126e-06, + "loss": 0.3207, + "step": 7601 + }, + { + "epoch": 0.6, + "learning_rate": 7.211000685487658e-06, + "loss": 0.359, + "step": 7602 + }, + { + "epoch": 0.6, + "learning_rate": 7.208536565304374e-06, + "loss": 0.352, + "step": 7603 + }, + { + "epoch": 0.6, + "learning_rate": 7.206072628925526e-06, + "loss": 0.2731, + "step": 7604 + }, + { + "epoch": 0.6, + "learning_rate": 7.203608876513351e-06, + "loss": 0.3694, + "step": 7605 + }, + { + "epoch": 0.6, + "learning_rate": 7.201145308230075e-06, + "loss": 0.3187, + "step": 7606 + }, + { + "epoch": 0.6, + "learning_rate": 7.198681924237918e-06, + "loss": 0.3239, + "step": 7607 + }, + { + "epoch": 0.6, + "learning_rate": 7.196218724699072e-06, + "loss": 0.3872, + "step": 7608 + }, + { + "epoch": 0.6, + "learning_rate": 7.193755709775734e-06, + "loss": 0.3524, + "step": 7609 + }, + { + "epoch": 0.6, + "learning_rate": 7.191292879630081e-06, + "loss": 0.3939, + "step": 7610 + }, + { + "epoch": 0.6, + "learning_rate": 7.188830234424275e-06, + "loss": 0.2585, + "step": 7611 + }, + { + "epoch": 0.6, + "learning_rate": 7.186367774320474e-06, + "loss": 0.4309, + "step": 7612 + }, + { + "epoch": 0.6, + "learning_rate": 7.1839054994808145e-06, + "loss": 0.4054, + "step": 7613 + }, + { + "epoch": 0.6, + "learning_rate": 7.181443410067428e-06, + "loss": 0.3492, + "step": 7614 + }, + { + "epoch": 0.6, + "learning_rate": 7.1789815062424325e-06, + "loss": 0.296, + "step": 7615 + }, + { + "epoch": 0.6, + "learning_rate": 7.176519788167929e-06, + "loss": 0.327, + "step": 7616 + }, + { + "epoch": 0.6, + "learning_rate": 7.174058256006012e-06, + "loss": 0.3463, + "step": 7617 + }, + { + "epoch": 0.6, + "learning_rate": 7.171596909918763e-06, + "loss": 0.3061, + "step": 7618 + }, + { + "epoch": 0.6, + "learning_rate": 7.169135750068247e-06, + "loss": 0.3924, + "step": 7619 + }, + { + "epoch": 0.6, + "learning_rate": 7.1666747766165226e-06, + "loss": 0.3811, + "step": 7620 + }, + { + "epoch": 0.6, + "learning_rate": 7.164213989725628e-06, + "loss": 0.2452, + "step": 7621 + }, + { + "epoch": 0.6, + "learning_rate": 7.1617533895575975e-06, + "loss": 0.3285, + "step": 7622 + }, + { + "epoch": 0.6, + "learning_rate": 7.1592929762744515e-06, + "loss": 0.3695, + "step": 7623 + }, + { + "epoch": 0.6, + "learning_rate": 7.156832750038192e-06, + "loss": 0.4496, + "step": 7624 + }, + { + "epoch": 0.6, + "learning_rate": 7.154372711010815e-06, + "loss": 0.3449, + "step": 7625 + }, + { + "epoch": 0.6, + "learning_rate": 7.1519128593543065e-06, + "loss": 0.2397, + "step": 7626 + }, + { + "epoch": 0.6, + "learning_rate": 7.149453195230629e-06, + "loss": 0.4152, + "step": 7627 + }, + { + "epoch": 0.6, + "learning_rate": 7.1469937188017444e-06, + "loss": 0.4741, + "step": 7628 + }, + { + "epoch": 0.6, + "learning_rate": 7.144534430229595e-06, + "loss": 0.2853, + "step": 7629 + }, + { + "epoch": 0.6, + "learning_rate": 7.142075329676112e-06, + "loss": 0.3386, + "step": 7630 + }, + { + "epoch": 0.6, + "learning_rate": 7.139616417303221e-06, + "loss": 0.4842, + "step": 7631 + }, + { + "epoch": 0.6, + "learning_rate": 7.137157693272822e-06, + "loss": 0.4426, + "step": 7632 + }, + { + "epoch": 0.6, + "learning_rate": 7.1346991577468136e-06, + "loss": 0.3428, + "step": 7633 + }, + { + "epoch": 0.6, + "learning_rate": 7.132240810887083e-06, + "loss": 0.43, + "step": 7634 + }, + { + "epoch": 0.6, + "learning_rate": 7.129782652855492e-06, + "loss": 0.4275, + "step": 7635 + }, + { + "epoch": 0.6, + "learning_rate": 7.127324683813906e-06, + "loss": 0.2957, + "step": 7636 + }, + { + "epoch": 0.61, + "learning_rate": 7.124866903924164e-06, + "loss": 0.3439, + "step": 7637 + }, + { + "epoch": 0.61, + "learning_rate": 7.122409313348102e-06, + "loss": 0.2323, + "step": 7638 + }, + { + "epoch": 0.61, + "learning_rate": 7.119951912247545e-06, + "loss": 0.3369, + "step": 7639 + }, + { + "epoch": 0.61, + "learning_rate": 7.117494700784292e-06, + "loss": 0.2991, + "step": 7640 + }, + { + "epoch": 0.61, + "learning_rate": 7.115037679120147e-06, + "loss": 0.3308, + "step": 7641 + }, + { + "epoch": 0.61, + "learning_rate": 7.112580847416886e-06, + "loss": 0.3065, + "step": 7642 + }, + { + "epoch": 0.61, + "learning_rate": 7.110124205836283e-06, + "loss": 0.359, + "step": 7643 + }, + { + "epoch": 0.61, + "learning_rate": 7.107667754540097e-06, + "loss": 0.2298, + "step": 7644 + }, + { + "epoch": 0.61, + "learning_rate": 7.105211493690073e-06, + "loss": 0.3417, + "step": 7645 + }, + { + "epoch": 0.61, + "learning_rate": 7.102755423447941e-06, + "loss": 0.3943, + "step": 7646 + }, + { + "epoch": 0.61, + "learning_rate": 7.100299543975426e-06, + "loss": 0.3769, + "step": 7647 + }, + { + "epoch": 0.61, + "learning_rate": 7.097843855434232e-06, + "loss": 0.2535, + "step": 7648 + }, + { + "epoch": 0.61, + "learning_rate": 7.09538835798606e-06, + "loss": 0.3045, + "step": 7649 + }, + { + "epoch": 0.61, + "learning_rate": 7.092933051792583e-06, + "loss": 0.4748, + "step": 7650 + }, + { + "epoch": 0.61, + "learning_rate": 7.090477937015479e-06, + "loss": 0.3508, + "step": 7651 + }, + { + "epoch": 0.61, + "learning_rate": 7.088023013816403e-06, + "loss": 0.3074, + "step": 7652 + }, + { + "epoch": 0.61, + "learning_rate": 7.085568282357e-06, + "loss": 0.3065, + "step": 7653 + }, + { + "epoch": 0.61, + "learning_rate": 7.083113742798901e-06, + "loss": 0.3168, + "step": 7654 + }, + { + "epoch": 0.61, + "learning_rate": 7.080659395303729e-06, + "loss": 0.3828, + "step": 7655 + }, + { + "epoch": 0.61, + "learning_rate": 7.078205240033087e-06, + "loss": 0.3776, + "step": 7656 + }, + { + "epoch": 0.61, + "learning_rate": 7.075751277148574e-06, + "loss": 0.4229, + "step": 7657 + }, + { + "epoch": 0.61, + "learning_rate": 7.073297506811766e-06, + "loss": 0.3307, + "step": 7658 + }, + { + "epoch": 0.61, + "learning_rate": 7.0708439291842345e-06, + "loss": 0.3901, + "step": 7659 + }, + { + "epoch": 0.61, + "learning_rate": 7.068390544427539e-06, + "loss": 0.3911, + "step": 7660 + }, + { + "epoch": 0.61, + "learning_rate": 7.065937352703218e-06, + "loss": 0.2396, + "step": 7661 + }, + { + "epoch": 0.61, + "learning_rate": 7.063484354172804e-06, + "loss": 0.4418, + "step": 7662 + }, + { + "epoch": 0.61, + "learning_rate": 7.061031548997818e-06, + "loss": 0.379, + "step": 7663 + }, + { + "epoch": 0.61, + "learning_rate": 7.058578937339759e-06, + "loss": 0.3545, + "step": 7664 + }, + { + "epoch": 0.61, + "learning_rate": 7.056126519360129e-06, + "loss": 0.3656, + "step": 7665 + }, + { + "epoch": 0.61, + "learning_rate": 7.053674295220399e-06, + "loss": 0.3715, + "step": 7666 + }, + { + "epoch": 0.61, + "learning_rate": 7.05122226508204e-06, + "loss": 0.3065, + "step": 7667 + }, + { + "epoch": 0.61, + "learning_rate": 7.048770429106509e-06, + "loss": 0.3357, + "step": 7668 + }, + { + "epoch": 0.61, + "learning_rate": 7.0463187874552415e-06, + "loss": 0.2966, + "step": 7669 + }, + { + "epoch": 0.61, + "learning_rate": 7.043867340289672e-06, + "loss": 0.3027, + "step": 7670 + }, + { + "epoch": 0.61, + "learning_rate": 7.0414160877712155e-06, + "loss": 0.4176, + "step": 7671 + }, + { + "epoch": 0.61, + "learning_rate": 7.038965030061273e-06, + "loss": 0.4299, + "step": 7672 + }, + { + "epoch": 0.61, + "learning_rate": 7.0365141673212336e-06, + "loss": 0.3625, + "step": 7673 + }, + { + "epoch": 0.61, + "learning_rate": 7.034063499712479e-06, + "loss": 0.3303, + "step": 7674 + }, + { + "epoch": 0.61, + "learning_rate": 7.031613027396369e-06, + "loss": 0.345, + "step": 7675 + }, + { + "epoch": 0.61, + "learning_rate": 7.029162750534259e-06, + "loss": 0.2563, + "step": 7676 + }, + { + "epoch": 0.61, + "learning_rate": 7.02671266928749e-06, + "loss": 0.3363, + "step": 7677 + }, + { + "epoch": 0.61, + "learning_rate": 7.024262783817382e-06, + "loss": 0.3343, + "step": 7678 + }, + { + "epoch": 0.61, + "learning_rate": 7.02181309428525e-06, + "loss": 0.3209, + "step": 7679 + }, + { + "epoch": 0.61, + "learning_rate": 7.0193636008524e-06, + "loss": 0.2662, + "step": 7680 + }, + { + "epoch": 0.61, + "learning_rate": 7.016914303680111e-06, + "loss": 0.3873, + "step": 7681 + }, + { + "epoch": 0.61, + "learning_rate": 7.014465202929665e-06, + "loss": 0.3582, + "step": 7682 + }, + { + "epoch": 0.61, + "learning_rate": 7.012016298762317e-06, + "loss": 0.3401, + "step": 7683 + }, + { + "epoch": 0.61, + "learning_rate": 7.009567591339319e-06, + "loss": 0.2734, + "step": 7684 + }, + { + "epoch": 0.61, + "learning_rate": 7.007119080821908e-06, + "loss": 0.2687, + "step": 7685 + }, + { + "epoch": 0.61, + "learning_rate": 7.004670767371302e-06, + "loss": 0.3103, + "step": 7686 + }, + { + "epoch": 0.61, + "learning_rate": 7.002222651148714e-06, + "loss": 0.3726, + "step": 7687 + }, + { + "epoch": 0.61, + "learning_rate": 6.999774732315343e-06, + "loss": 0.3272, + "step": 7688 + }, + { + "epoch": 0.61, + "learning_rate": 6.9973270110323666e-06, + "loss": 0.3645, + "step": 7689 + }, + { + "epoch": 0.61, + "learning_rate": 6.994879487460961e-06, + "loss": 0.3124, + "step": 7690 + }, + { + "epoch": 0.61, + "learning_rate": 6.992432161762278e-06, + "loss": 0.242, + "step": 7691 + }, + { + "epoch": 0.61, + "learning_rate": 6.989985034097466e-06, + "loss": 0.4322, + "step": 7692 + }, + { + "epoch": 0.61, + "learning_rate": 6.9875381046276605e-06, + "loss": 0.2689, + "step": 7693 + }, + { + "epoch": 0.61, + "learning_rate": 6.985091373513972e-06, + "loss": 0.3234, + "step": 7694 + }, + { + "epoch": 0.61, + "learning_rate": 6.982644840917509e-06, + "loss": 0.3159, + "step": 7695 + }, + { + "epoch": 0.61, + "learning_rate": 6.980198506999368e-06, + "loss": 0.2797, + "step": 7696 + }, + { + "epoch": 0.61, + "learning_rate": 6.977752371920623e-06, + "loss": 0.4026, + "step": 7697 + }, + { + "epoch": 0.61, + "learning_rate": 6.975306435842344e-06, + "loss": 0.3232, + "step": 7698 + }, + { + "epoch": 0.61, + "learning_rate": 6.97286069892558e-06, + "loss": 0.4122, + "step": 7699 + }, + { + "epoch": 0.61, + "learning_rate": 6.970415161331373e-06, + "loss": 0.3836, + "step": 7700 + }, + { + "epoch": 0.61, + "learning_rate": 6.967969823220752e-06, + "loss": 0.3981, + "step": 7701 + }, + { + "epoch": 0.61, + "learning_rate": 6.965524684754729e-06, + "loss": 0.3348, + "step": 7702 + }, + { + "epoch": 0.61, + "learning_rate": 6.963079746094302e-06, + "loss": 0.3273, + "step": 7703 + }, + { + "epoch": 0.61, + "learning_rate": 6.960635007400465e-06, + "loss": 0.3237, + "step": 7704 + }, + { + "epoch": 0.61, + "learning_rate": 6.9581904688341854e-06, + "loss": 0.291, + "step": 7705 + }, + { + "epoch": 0.61, + "learning_rate": 6.955746130556429e-06, + "loss": 0.328, + "step": 7706 + }, + { + "epoch": 0.61, + "learning_rate": 6.95330199272814e-06, + "loss": 0.3584, + "step": 7707 + }, + { + "epoch": 0.61, + "learning_rate": 6.950858055510254e-06, + "loss": 0.3557, + "step": 7708 + }, + { + "epoch": 0.61, + "learning_rate": 6.948414319063696e-06, + "loss": 0.3067, + "step": 7709 + }, + { + "epoch": 0.61, + "learning_rate": 6.945970783549372e-06, + "loss": 0.2107, + "step": 7710 + }, + { + "epoch": 0.61, + "learning_rate": 6.943527449128174e-06, + "loss": 0.3001, + "step": 7711 + }, + { + "epoch": 0.61, + "learning_rate": 6.9410843159609905e-06, + "loss": 0.4279, + "step": 7712 + }, + { + "epoch": 0.61, + "learning_rate": 6.9386413842086845e-06, + "loss": 0.4386, + "step": 7713 + }, + { + "epoch": 0.61, + "learning_rate": 6.936198654032114e-06, + "loss": 0.3037, + "step": 7714 + }, + { + "epoch": 0.61, + "learning_rate": 6.933756125592117e-06, + "loss": 0.3159, + "step": 7715 + }, + { + "epoch": 0.61, + "learning_rate": 6.931313799049526e-06, + "loss": 0.2938, + "step": 7716 + }, + { + "epoch": 0.61, + "learning_rate": 6.928871674565158e-06, + "loss": 0.3575, + "step": 7717 + }, + { + "epoch": 0.61, + "learning_rate": 6.926429752299812e-06, + "loss": 0.4435, + "step": 7718 + }, + { + "epoch": 0.61, + "learning_rate": 6.923988032414277e-06, + "loss": 0.3811, + "step": 7719 + }, + { + "epoch": 0.61, + "learning_rate": 6.9215465150693305e-06, + "loss": 0.307, + "step": 7720 + }, + { + "epoch": 0.61, + "learning_rate": 6.919105200425733e-06, + "loss": 0.3457, + "step": 7721 + }, + { + "epoch": 0.61, + "learning_rate": 6.916664088644234e-06, + "loss": 0.3072, + "step": 7722 + }, + { + "epoch": 0.61, + "learning_rate": 6.914223179885567e-06, + "loss": 0.3468, + "step": 7723 + }, + { + "epoch": 0.61, + "learning_rate": 6.911782474310456e-06, + "loss": 0.3119, + "step": 7724 + }, + { + "epoch": 0.61, + "learning_rate": 6.909341972079613e-06, + "loss": 0.3993, + "step": 7725 + }, + { + "epoch": 0.61, + "learning_rate": 6.9069016733537255e-06, + "loss": 0.3599, + "step": 7726 + }, + { + "epoch": 0.61, + "learning_rate": 6.904461578293483e-06, + "loss": 0.3957, + "step": 7727 + }, + { + "epoch": 0.61, + "learning_rate": 6.902021687059549e-06, + "loss": 0.2853, + "step": 7728 + }, + { + "epoch": 0.61, + "learning_rate": 6.89958199981258e-06, + "loss": 0.4272, + "step": 7729 + }, + { + "epoch": 0.61, + "learning_rate": 6.89714251671322e-06, + "loss": 0.3684, + "step": 7730 + }, + { + "epoch": 0.61, + "learning_rate": 6.894703237922094e-06, + "loss": 0.4019, + "step": 7731 + }, + { + "epoch": 0.61, + "learning_rate": 6.892264163599817e-06, + "loss": 0.4827, + "step": 7732 + }, + { + "epoch": 0.61, + "learning_rate": 6.889825293906993e-06, + "loss": 0.3207, + "step": 7733 + }, + { + "epoch": 0.61, + "learning_rate": 6.887386629004207e-06, + "loss": 0.3448, + "step": 7734 + }, + { + "epoch": 0.61, + "learning_rate": 6.884948169052037e-06, + "loss": 0.3707, + "step": 7735 + }, + { + "epoch": 0.61, + "learning_rate": 6.88250991421104e-06, + "loss": 0.354, + "step": 7736 + }, + { + "epoch": 0.61, + "learning_rate": 6.880071864641762e-06, + "loss": 0.3223, + "step": 7737 + }, + { + "epoch": 0.61, + "learning_rate": 6.8776340205047446e-06, + "loss": 0.2998, + "step": 7738 + }, + { + "epoch": 0.61, + "learning_rate": 6.875196381960498e-06, + "loss": 0.3262, + "step": 7739 + }, + { + "epoch": 0.61, + "learning_rate": 6.872758949169536e-06, + "loss": 0.2507, + "step": 7740 + }, + { + "epoch": 0.61, + "learning_rate": 6.8703217222923525e-06, + "loss": 0.2645, + "step": 7741 + }, + { + "epoch": 0.61, + "learning_rate": 6.867884701489421e-06, + "loss": 0.261, + "step": 7742 + }, + { + "epoch": 0.61, + "learning_rate": 6.865447886921215e-06, + "loss": 0.245, + "step": 7743 + }, + { + "epoch": 0.61, + "learning_rate": 6.86301127874818e-06, + "loss": 0.3373, + "step": 7744 + }, + { + "epoch": 0.61, + "learning_rate": 6.860574877130757e-06, + "loss": 0.3432, + "step": 7745 + }, + { + "epoch": 0.61, + "learning_rate": 6.8581386822293765e-06, + "loss": 0.3448, + "step": 7746 + }, + { + "epoch": 0.61, + "learning_rate": 6.8557026942044425e-06, + "loss": 0.3786, + "step": 7747 + }, + { + "epoch": 0.61, + "learning_rate": 6.853266913216357e-06, + "loss": 0.2224, + "step": 7748 + }, + { + "epoch": 0.61, + "learning_rate": 6.850831339425508e-06, + "loss": 0.3711, + "step": 7749 + }, + { + "epoch": 0.61, + "learning_rate": 6.848395972992261e-06, + "loss": 0.3239, + "step": 7750 + }, + { + "epoch": 0.61, + "learning_rate": 6.845960814076973e-06, + "loss": 0.3953, + "step": 7751 + }, + { + "epoch": 0.61, + "learning_rate": 6.8435258628399905e-06, + "loss": 0.3532, + "step": 7752 + }, + { + "epoch": 0.61, + "learning_rate": 6.841091119441639e-06, + "loss": 0.4014, + "step": 7753 + }, + { + "epoch": 0.61, + "learning_rate": 6.8386565840422385e-06, + "loss": 0.3798, + "step": 7754 + }, + { + "epoch": 0.61, + "learning_rate": 6.836222256802093e-06, + "loss": 0.2251, + "step": 7755 + }, + { + "epoch": 0.61, + "learning_rate": 6.833788137881486e-06, + "loss": 0.4497, + "step": 7756 + }, + { + "epoch": 0.61, + "learning_rate": 6.8313542274406964e-06, + "loss": 0.3404, + "step": 7757 + }, + { + "epoch": 0.61, + "learning_rate": 6.828920525639985e-06, + "loss": 0.382, + "step": 7758 + }, + { + "epoch": 0.61, + "learning_rate": 6.826487032639597e-06, + "loss": 0.3331, + "step": 7759 + }, + { + "epoch": 0.61, + "learning_rate": 6.8240537485997704e-06, + "loss": 0.3948, + "step": 7760 + }, + { + "epoch": 0.61, + "learning_rate": 6.821620673680721e-06, + "loss": 0.3212, + "step": 7761 + }, + { + "epoch": 0.61, + "learning_rate": 6.819187808042656e-06, + "loss": 0.4018, + "step": 7762 + }, + { + "epoch": 0.62, + "learning_rate": 6.816755151845771e-06, + "loss": 0.4438, + "step": 7763 + }, + { + "epoch": 0.62, + "learning_rate": 6.814322705250241e-06, + "loss": 0.4798, + "step": 7764 + }, + { + "epoch": 0.62, + "learning_rate": 6.8118904684162325e-06, + "loss": 0.3938, + "step": 7765 + }, + { + "epoch": 0.62, + "learning_rate": 6.8094584415038975e-06, + "loss": 0.4787, + "step": 7766 + }, + { + "epoch": 0.62, + "learning_rate": 6.807026624673372e-06, + "loss": 0.3264, + "step": 7767 + }, + { + "epoch": 0.62, + "learning_rate": 6.80459501808478e-06, + "loss": 0.3049, + "step": 7768 + }, + { + "epoch": 0.62, + "learning_rate": 6.8021636218982275e-06, + "loss": 0.2655, + "step": 7769 + }, + { + "epoch": 0.62, + "learning_rate": 6.799732436273816e-06, + "loss": 0.2711, + "step": 7770 + }, + { + "epoch": 0.62, + "learning_rate": 6.797301461371626e-06, + "loss": 0.2382, + "step": 7771 + }, + { + "epoch": 0.62, + "learning_rate": 6.7948706973517235e-06, + "loss": 0.3334, + "step": 7772 + }, + { + "epoch": 0.62, + "learning_rate": 6.792440144374162e-06, + "loss": 0.4053, + "step": 7773 + }, + { + "epoch": 0.62, + "learning_rate": 6.790009802598984e-06, + "loss": 0.2849, + "step": 7774 + }, + { + "epoch": 0.62, + "learning_rate": 6.787579672186215e-06, + "loss": 0.3887, + "step": 7775 + }, + { + "epoch": 0.62, + "learning_rate": 6.78514975329587e-06, + "loss": 0.2588, + "step": 7776 + }, + { + "epoch": 0.62, + "learning_rate": 6.78272004608794e-06, + "loss": 0.2827, + "step": 7777 + }, + { + "epoch": 0.62, + "learning_rate": 6.780290550722417e-06, + "loss": 0.5048, + "step": 7778 + }, + { + "epoch": 0.62, + "learning_rate": 6.777861267359272e-06, + "loss": 0.3241, + "step": 7779 + }, + { + "epoch": 0.62, + "learning_rate": 6.7754321961584535e-06, + "loss": 0.3172, + "step": 7780 + }, + { + "epoch": 0.62, + "learning_rate": 6.773003337279911e-06, + "loss": 0.292, + "step": 7781 + }, + { + "epoch": 0.62, + "learning_rate": 6.7705746908835734e-06, + "loss": 0.3524, + "step": 7782 + }, + { + "epoch": 0.62, + "learning_rate": 6.768146257129351e-06, + "loss": 0.2986, + "step": 7783 + }, + { + "epoch": 0.62, + "learning_rate": 6.765718036177148e-06, + "loss": 0.5189, + "step": 7784 + }, + { + "epoch": 0.62, + "learning_rate": 6.763290028186849e-06, + "loss": 0.4112, + "step": 7785 + }, + { + "epoch": 0.62, + "learning_rate": 6.760862233318327e-06, + "loss": 0.4514, + "step": 7786 + }, + { + "epoch": 0.62, + "learning_rate": 6.758434651731445e-06, + "loss": 0.4456, + "step": 7787 + }, + { + "epoch": 0.62, + "learning_rate": 6.756007283586039e-06, + "loss": 0.3722, + "step": 7788 + }, + { + "epoch": 0.62, + "learning_rate": 6.753580129041945e-06, + "loss": 0.3285, + "step": 7789 + }, + { + "epoch": 0.62, + "learning_rate": 6.751153188258983e-06, + "loss": 0.2642, + "step": 7790 + }, + { + "epoch": 0.62, + "learning_rate": 6.748726461396946e-06, + "loss": 0.3507, + "step": 7791 + }, + { + "epoch": 0.62, + "learning_rate": 6.7462999486156315e-06, + "loss": 0.2818, + "step": 7792 + }, + { + "epoch": 0.62, + "learning_rate": 6.743873650074807e-06, + "loss": 0.3146, + "step": 7793 + }, + { + "epoch": 0.62, + "learning_rate": 6.741447565934236e-06, + "loss": 0.2505, + "step": 7794 + }, + { + "epoch": 0.62, + "learning_rate": 6.739021696353665e-06, + "loss": 0.2778, + "step": 7795 + }, + { + "epoch": 0.62, + "learning_rate": 6.736596041492821e-06, + "loss": 0.4685, + "step": 7796 + }, + { + "epoch": 0.62, + "learning_rate": 6.734170601511427e-06, + "loss": 0.4349, + "step": 7797 + }, + { + "epoch": 0.62, + "learning_rate": 6.7317453765691855e-06, + "loss": 0.3445, + "step": 7798 + }, + { + "epoch": 0.62, + "learning_rate": 6.729320366825785e-06, + "loss": 0.2368, + "step": 7799 + }, + { + "epoch": 0.62, + "learning_rate": 6.726895572440901e-06, + "loss": 0.3513, + "step": 7800 + }, + { + "epoch": 0.62, + "learning_rate": 6.7244709935741925e-06, + "loss": 0.2876, + "step": 7801 + }, + { + "epoch": 0.62, + "learning_rate": 6.722046630385309e-06, + "loss": 0.3433, + "step": 7802 + }, + { + "epoch": 0.62, + "learning_rate": 6.719622483033883e-06, + "loss": 0.4325, + "step": 7803 + }, + { + "epoch": 0.62, + "learning_rate": 6.7171985516795315e-06, + "loss": 0.2914, + "step": 7804 + }, + { + "epoch": 0.62, + "learning_rate": 6.714774836481862e-06, + "loss": 0.2881, + "step": 7805 + }, + { + "epoch": 0.62, + "learning_rate": 6.71235133760046e-06, + "loss": 0.2964, + "step": 7806 + }, + { + "epoch": 0.62, + "learning_rate": 6.709928055194902e-06, + "loss": 0.408, + "step": 7807 + }, + { + "epoch": 0.62, + "learning_rate": 6.707504989424753e-06, + "loss": 0.4628, + "step": 7808 + }, + { + "epoch": 0.62, + "learning_rate": 6.705082140449557e-06, + "loss": 0.3848, + "step": 7809 + }, + { + "epoch": 0.62, + "learning_rate": 6.702659508428847e-06, + "loss": 0.3888, + "step": 7810 + }, + { + "epoch": 0.62, + "learning_rate": 6.7002370935221454e-06, + "loss": 0.3319, + "step": 7811 + }, + { + "epoch": 0.62, + "learning_rate": 6.697814895888951e-06, + "loss": 0.3724, + "step": 7812 + }, + { + "epoch": 0.62, + "learning_rate": 6.695392915688759e-06, + "loss": 0.3115, + "step": 7813 + }, + { + "epoch": 0.62, + "learning_rate": 6.692971153081041e-06, + "loss": 0.3914, + "step": 7814 + }, + { + "epoch": 0.62, + "learning_rate": 6.690549608225258e-06, + "loss": 0.363, + "step": 7815 + }, + { + "epoch": 0.62, + "learning_rate": 6.688128281280863e-06, + "loss": 0.3415, + "step": 7816 + }, + { + "epoch": 0.62, + "learning_rate": 6.685707172407284e-06, + "loss": 0.2496, + "step": 7817 + }, + { + "epoch": 0.62, + "learning_rate": 6.683286281763939e-06, + "loss": 0.3549, + "step": 7818 + }, + { + "epoch": 0.62, + "learning_rate": 6.6808656095102365e-06, + "loss": 0.3822, + "step": 7819 + }, + { + "epoch": 0.62, + "learning_rate": 6.6784451558055596e-06, + "loss": 0.3122, + "step": 7820 + }, + { + "epoch": 0.62, + "learning_rate": 6.67602492080929e-06, + "loss": 0.3329, + "step": 7821 + }, + { + "epoch": 0.62, + "learning_rate": 6.6736049046807815e-06, + "loss": 0.3225, + "step": 7822 + }, + { + "epoch": 0.62, + "learning_rate": 6.671185107579387e-06, + "loss": 0.3048, + "step": 7823 + }, + { + "epoch": 0.62, + "learning_rate": 6.668765529664436e-06, + "loss": 0.2782, + "step": 7824 + }, + { + "epoch": 0.62, + "learning_rate": 6.6663461710952445e-06, + "loss": 0.2535, + "step": 7825 + }, + { + "epoch": 0.62, + "learning_rate": 6.663927032031118e-06, + "loss": 0.3522, + "step": 7826 + }, + { + "epoch": 0.62, + "learning_rate": 6.661508112631347e-06, + "loss": 0.2886, + "step": 7827 + }, + { + "epoch": 0.62, + "learning_rate": 6.659089413055202e-06, + "loss": 0.4699, + "step": 7828 + }, + { + "epoch": 0.62, + "learning_rate": 6.656670933461942e-06, + "loss": 0.3908, + "step": 7829 + }, + { + "epoch": 0.62, + "learning_rate": 6.654252674010815e-06, + "loss": 0.2806, + "step": 7830 + }, + { + "epoch": 0.62, + "learning_rate": 6.6518346348610484e-06, + "loss": 0.2442, + "step": 7831 + }, + { + "epoch": 0.62, + "learning_rate": 6.649416816171861e-06, + "loss": 0.3621, + "step": 7832 + }, + { + "epoch": 0.62, + "learning_rate": 6.646999218102457e-06, + "loss": 0.4064, + "step": 7833 + }, + { + "epoch": 0.62, + "learning_rate": 6.644581840812019e-06, + "loss": 0.4103, + "step": 7834 + }, + { + "epoch": 0.62, + "learning_rate": 6.64216468445972e-06, + "loss": 0.5081, + "step": 7835 + }, + { + "epoch": 0.62, + "learning_rate": 6.639747749204723e-06, + "loss": 0.3751, + "step": 7836 + }, + { + "epoch": 0.62, + "learning_rate": 6.637331035206166e-06, + "loss": 0.288, + "step": 7837 + }, + { + "epoch": 0.62, + "learning_rate": 6.634914542623182e-06, + "loss": 0.4635, + "step": 7838 + }, + { + "epoch": 0.62, + "learning_rate": 6.632498271614882e-06, + "loss": 0.3489, + "step": 7839 + }, + { + "epoch": 0.62, + "learning_rate": 6.630082222340366e-06, + "loss": 0.2869, + "step": 7840 + }, + { + "epoch": 0.62, + "learning_rate": 6.627666394958725e-06, + "loss": 0.4222, + "step": 7841 + }, + { + "epoch": 0.62, + "learning_rate": 6.625250789629021e-06, + "loss": 0.296, + "step": 7842 + }, + { + "epoch": 0.62, + "learning_rate": 6.622835406510315e-06, + "loss": 0.3379, + "step": 7843 + }, + { + "epoch": 0.62, + "learning_rate": 6.620420245761651e-06, + "loss": 0.3078, + "step": 7844 + }, + { + "epoch": 0.62, + "learning_rate": 6.6180053075420484e-06, + "loss": 0.3523, + "step": 7845 + }, + { + "epoch": 0.62, + "learning_rate": 6.615590592010526e-06, + "loss": 0.4334, + "step": 7846 + }, + { + "epoch": 0.62, + "learning_rate": 6.613176099326077e-06, + "loss": 0.3344, + "step": 7847 + }, + { + "epoch": 0.62, + "learning_rate": 6.610761829647685e-06, + "loss": 0.2783, + "step": 7848 + }, + { + "epoch": 0.62, + "learning_rate": 6.608347783134319e-06, + "loss": 0.3024, + "step": 7849 + }, + { + "epoch": 0.62, + "learning_rate": 6.605933959944933e-06, + "loss": 0.3721, + "step": 7850 + }, + { + "epoch": 0.62, + "learning_rate": 6.603520360238462e-06, + "loss": 0.3082, + "step": 7851 + }, + { + "epoch": 0.62, + "learning_rate": 6.601106984173835e-06, + "loss": 0.3844, + "step": 7852 + }, + { + "epoch": 0.62, + "learning_rate": 6.598693831909957e-06, + "loss": 0.3045, + "step": 7853 + }, + { + "epoch": 0.62, + "learning_rate": 6.596280903605725e-06, + "loss": 0.4874, + "step": 7854 + }, + { + "epoch": 0.62, + "learning_rate": 6.593868199420017e-06, + "loss": 0.3101, + "step": 7855 + }, + { + "epoch": 0.62, + "learning_rate": 6.591455719511699e-06, + "loss": 0.3642, + "step": 7856 + }, + { + "epoch": 0.62, + "learning_rate": 6.589043464039624e-06, + "loss": 0.3995, + "step": 7857 + }, + { + "epoch": 0.62, + "learning_rate": 6.58663143316262e-06, + "loss": 0.4694, + "step": 7858 + }, + { + "epoch": 0.62, + "learning_rate": 6.584219627039513e-06, + "loss": 0.4834, + "step": 7859 + }, + { + "epoch": 0.62, + "learning_rate": 6.58180804582911e-06, + "loss": 0.4195, + "step": 7860 + }, + { + "epoch": 0.62, + "learning_rate": 6.579396689690198e-06, + "loss": 0.31, + "step": 7861 + }, + { + "epoch": 0.62, + "learning_rate": 6.576985558781557e-06, + "loss": 0.3168, + "step": 7862 + }, + { + "epoch": 0.62, + "learning_rate": 6.574574653261945e-06, + "loss": 0.4429, + "step": 7863 + }, + { + "epoch": 0.62, + "learning_rate": 6.572163973290109e-06, + "loss": 0.3201, + "step": 7864 + }, + { + "epoch": 0.62, + "learning_rate": 6.569753519024784e-06, + "loss": 0.355, + "step": 7865 + }, + { + "epoch": 0.62, + "learning_rate": 6.567343290624683e-06, + "loss": 0.3406, + "step": 7866 + }, + { + "epoch": 0.62, + "learning_rate": 6.564933288248509e-06, + "loss": 0.329, + "step": 7867 + }, + { + "epoch": 0.62, + "learning_rate": 6.562523512054951e-06, + "loss": 0.2871, + "step": 7868 + }, + { + "epoch": 0.62, + "learning_rate": 6.560113962202679e-06, + "loss": 0.3148, + "step": 7869 + }, + { + "epoch": 0.62, + "learning_rate": 6.557704638850352e-06, + "loss": 0.3478, + "step": 7870 + }, + { + "epoch": 0.62, + "learning_rate": 6.555295542156609e-06, + "loss": 0.3704, + "step": 7871 + }, + { + "epoch": 0.62, + "learning_rate": 6.55288667228008e-06, + "loss": 0.3879, + "step": 7872 + }, + { + "epoch": 0.62, + "learning_rate": 6.550478029379379e-06, + "loss": 0.4282, + "step": 7873 + }, + { + "epoch": 0.62, + "learning_rate": 6.548069613613099e-06, + "loss": 0.3442, + "step": 7874 + }, + { + "epoch": 0.62, + "learning_rate": 6.545661425139827e-06, + "loss": 0.3125, + "step": 7875 + }, + { + "epoch": 0.62, + "learning_rate": 6.543253464118131e-06, + "loss": 0.2569, + "step": 7876 + }, + { + "epoch": 0.62, + "learning_rate": 6.540845730706557e-06, + "loss": 0.3331, + "step": 7877 + }, + { + "epoch": 0.62, + "learning_rate": 6.538438225063653e-06, + "loss": 0.3733, + "step": 7878 + }, + { + "epoch": 0.62, + "learning_rate": 6.536030947347931e-06, + "loss": 0.3356, + "step": 7879 + }, + { + "epoch": 0.62, + "learning_rate": 6.533623897717905e-06, + "loss": 0.3423, + "step": 7880 + }, + { + "epoch": 0.62, + "learning_rate": 6.531217076332068e-06, + "loss": 0.426, + "step": 7881 + }, + { + "epoch": 0.62, + "learning_rate": 6.528810483348893e-06, + "loss": 0.4252, + "step": 7882 + }, + { + "epoch": 0.62, + "learning_rate": 6.526404118926848e-06, + "loss": 0.3501, + "step": 7883 + }, + { + "epoch": 0.62, + "learning_rate": 6.523997983224375e-06, + "loss": 0.2776, + "step": 7884 + }, + { + "epoch": 0.62, + "learning_rate": 6.52159207639991e-06, + "loss": 0.3806, + "step": 7885 + }, + { + "epoch": 0.62, + "learning_rate": 6.519186398611872e-06, + "loss": 0.4001, + "step": 7886 + }, + { + "epoch": 0.62, + "learning_rate": 6.51678095001866e-06, + "loss": 0.3026, + "step": 7887 + }, + { + "epoch": 0.62, + "learning_rate": 6.51437573077866e-06, + "loss": 0.1833, + "step": 7888 + }, + { + "epoch": 0.62, + "learning_rate": 6.5119707410502495e-06, + "loss": 0.2696, + "step": 7889 + }, + { + "epoch": 0.63, + "learning_rate": 6.509565980991781e-06, + "loss": 0.3754, + "step": 7890 + }, + { + "epoch": 0.63, + "learning_rate": 6.5071614507615985e-06, + "loss": 0.3232, + "step": 7891 + }, + { + "epoch": 0.63, + "learning_rate": 6.5047571505180265e-06, + "loss": 0.3131, + "step": 7892 + }, + { + "epoch": 0.63, + "learning_rate": 6.502353080419379e-06, + "loss": 0.4579, + "step": 7893 + }, + { + "epoch": 0.63, + "learning_rate": 6.4999492406239525e-06, + "loss": 0.372, + "step": 7894 + }, + { + "epoch": 0.63, + "learning_rate": 6.497545631290025e-06, + "loss": 0.3202, + "step": 7895 + }, + { + "epoch": 0.63, + "learning_rate": 6.495142252575866e-06, + "loss": 0.4075, + "step": 7896 + }, + { + "epoch": 0.63, + "learning_rate": 6.492739104639727e-06, + "loss": 0.3094, + "step": 7897 + }, + { + "epoch": 0.63, + "learning_rate": 6.490336187639841e-06, + "loss": 0.3701, + "step": 7898 + }, + { + "epoch": 0.63, + "learning_rate": 6.487933501734429e-06, + "loss": 0.3718, + "step": 7899 + }, + { + "epoch": 0.63, + "learning_rate": 6.485531047081697e-06, + "loss": 0.3146, + "step": 7900 + }, + { + "epoch": 0.63, + "learning_rate": 6.483128823839835e-06, + "loss": 0.3876, + "step": 7901 + }, + { + "epoch": 0.63, + "learning_rate": 6.480726832167019e-06, + "loss": 0.4053, + "step": 7902 + }, + { + "epoch": 0.63, + "learning_rate": 6.4783250722214066e-06, + "loss": 0.3428, + "step": 7903 + }, + { + "epoch": 0.63, + "learning_rate": 6.475923544161142e-06, + "loss": 0.3595, + "step": 7904 + }, + { + "epoch": 0.63, + "learning_rate": 6.473522248144359e-06, + "loss": 0.3422, + "step": 7905 + }, + { + "epoch": 0.63, + "learning_rate": 6.471121184329167e-06, + "loss": 0.2789, + "step": 7906 + }, + { + "epoch": 0.63, + "learning_rate": 6.468720352873662e-06, + "loss": 0.3752, + "step": 7907 + }, + { + "epoch": 0.63, + "learning_rate": 6.466319753935933e-06, + "loss": 0.3271, + "step": 7908 + }, + { + "epoch": 0.63, + "learning_rate": 6.463919387674043e-06, + "loss": 0.3359, + "step": 7909 + }, + { + "epoch": 0.63, + "learning_rate": 6.461519254246046e-06, + "loss": 0.4647, + "step": 7910 + }, + { + "epoch": 0.63, + "learning_rate": 6.459119353809982e-06, + "loss": 0.389, + "step": 7911 + }, + { + "epoch": 0.63, + "learning_rate": 6.45671968652387e-06, + "loss": 0.4379, + "step": 7912 + }, + { + "epoch": 0.63, + "learning_rate": 6.4543202525457175e-06, + "loss": 0.3153, + "step": 7913 + }, + { + "epoch": 0.63, + "learning_rate": 6.451921052033516e-06, + "loss": 0.413, + "step": 7914 + }, + { + "epoch": 0.63, + "learning_rate": 6.449522085145241e-06, + "loss": 0.4584, + "step": 7915 + }, + { + "epoch": 0.63, + "learning_rate": 6.447123352038853e-06, + "loss": 0.316, + "step": 7916 + }, + { + "epoch": 0.63, + "learning_rate": 6.444724852872297e-06, + "loss": 0.3415, + "step": 7917 + }, + { + "epoch": 0.63, + "learning_rate": 6.4423265878035015e-06, + "loss": 0.3394, + "step": 7918 + }, + { + "epoch": 0.63, + "learning_rate": 6.439928556990382e-06, + "loss": 0.3413, + "step": 7919 + }, + { + "epoch": 0.63, + "learning_rate": 6.437530760590838e-06, + "loss": 0.5316, + "step": 7920 + }, + { + "epoch": 0.63, + "learning_rate": 6.435133198762751e-06, + "loss": 0.2748, + "step": 7921 + }, + { + "epoch": 0.63, + "learning_rate": 6.432735871663991e-06, + "loss": 0.3198, + "step": 7922 + }, + { + "epoch": 0.63, + "learning_rate": 6.430338779452407e-06, + "loss": 0.331, + "step": 7923 + }, + { + "epoch": 0.63, + "learning_rate": 6.4279419222858416e-06, + "loss": 0.3909, + "step": 7924 + }, + { + "epoch": 0.63, + "learning_rate": 6.4255453003221115e-06, + "loss": 0.356, + "step": 7925 + }, + { + "epoch": 0.63, + "learning_rate": 6.423148913719022e-06, + "loss": 0.3057, + "step": 7926 + }, + { + "epoch": 0.63, + "learning_rate": 6.420752762634369e-06, + "loss": 0.41, + "step": 7927 + }, + { + "epoch": 0.63, + "learning_rate": 6.4183568472259216e-06, + "loss": 0.3904, + "step": 7928 + }, + { + "epoch": 0.63, + "learning_rate": 6.415961167651443e-06, + "loss": 0.2604, + "step": 7929 + }, + { + "epoch": 0.63, + "learning_rate": 6.413565724068678e-06, + "loss": 0.3516, + "step": 7930 + }, + { + "epoch": 0.63, + "learning_rate": 6.4111705166353525e-06, + "loss": 0.4779, + "step": 7931 + }, + { + "epoch": 0.63, + "learning_rate": 6.40877554550918e-06, + "loss": 0.4303, + "step": 7932 + }, + { + "epoch": 0.63, + "learning_rate": 6.406380810847856e-06, + "loss": 0.2881, + "step": 7933 + }, + { + "epoch": 0.63, + "learning_rate": 6.403986312809065e-06, + "loss": 0.4669, + "step": 7934 + }, + { + "epoch": 0.63, + "learning_rate": 6.401592051550475e-06, + "loss": 0.3424, + "step": 7935 + }, + { + "epoch": 0.63, + "learning_rate": 6.399198027229732e-06, + "loss": 0.3378, + "step": 7936 + }, + { + "epoch": 0.63, + "learning_rate": 6.39680424000447e-06, + "loss": 0.3397, + "step": 7937 + }, + { + "epoch": 0.63, + "learning_rate": 6.3944106900323174e-06, + "loss": 0.3157, + "step": 7938 + }, + { + "epoch": 0.63, + "learning_rate": 6.392017377470867e-06, + "loss": 0.454, + "step": 7939 + }, + { + "epoch": 0.63, + "learning_rate": 6.389624302477715e-06, + "loss": 0.4076, + "step": 7940 + }, + { + "epoch": 0.63, + "learning_rate": 6.387231465210428e-06, + "loss": 0.3527, + "step": 7941 + }, + { + "epoch": 0.63, + "learning_rate": 6.384838865826567e-06, + "loss": 0.4315, + "step": 7942 + }, + { + "epoch": 0.63, + "learning_rate": 6.382446504483672e-06, + "loss": 0.2867, + "step": 7943 + }, + { + "epoch": 0.63, + "learning_rate": 6.380054381339267e-06, + "loss": 0.3589, + "step": 7944 + }, + { + "epoch": 0.63, + "learning_rate": 6.377662496550863e-06, + "loss": 0.3698, + "step": 7945 + }, + { + "epoch": 0.63, + "learning_rate": 6.375270850275956e-06, + "loss": 0.4272, + "step": 7946 + }, + { + "epoch": 0.63, + "learning_rate": 6.37287944267202e-06, + "loss": 0.2453, + "step": 7947 + }, + { + "epoch": 0.63, + "learning_rate": 6.370488273896522e-06, + "loss": 0.3335, + "step": 7948 + }, + { + "epoch": 0.63, + "learning_rate": 6.368097344106905e-06, + "loss": 0.2937, + "step": 7949 + }, + { + "epoch": 0.63, + "learning_rate": 6.365706653460602e-06, + "loss": 0.3494, + "step": 7950 + }, + { + "epoch": 0.63, + "learning_rate": 6.363316202115033e-06, + "loss": 0.3021, + "step": 7951 + }, + { + "epoch": 0.63, + "learning_rate": 6.3609259902275884e-06, + "loss": 0.2684, + "step": 7952 + }, + { + "epoch": 0.63, + "learning_rate": 6.358536017955659e-06, + "loss": 0.3982, + "step": 7953 + }, + { + "epoch": 0.63, + "learning_rate": 6.3561462854566135e-06, + "loss": 0.2843, + "step": 7954 + }, + { + "epoch": 0.63, + "learning_rate": 6.3537567928878e-06, + "loss": 0.431, + "step": 7955 + }, + { + "epoch": 0.63, + "learning_rate": 6.3513675404065575e-06, + "loss": 0.2424, + "step": 7956 + }, + { + "epoch": 0.63, + "learning_rate": 6.348978528170205e-06, + "loss": 0.3845, + "step": 7957 + }, + { + "epoch": 0.63, + "learning_rate": 6.34658975633605e-06, + "loss": 0.324, + "step": 7958 + }, + { + "epoch": 0.63, + "learning_rate": 6.344201225061382e-06, + "loss": 0.3891, + "step": 7959 + }, + { + "epoch": 0.63, + "learning_rate": 6.341812934503469e-06, + "loss": 0.3833, + "step": 7960 + }, + { + "epoch": 0.63, + "learning_rate": 6.339424884819574e-06, + "loss": 0.3962, + "step": 7961 + }, + { + "epoch": 0.63, + "learning_rate": 6.337037076166939e-06, + "loss": 0.3365, + "step": 7962 + }, + { + "epoch": 0.63, + "learning_rate": 6.334649508702784e-06, + "loss": 0.4058, + "step": 7963 + }, + { + "epoch": 0.63, + "learning_rate": 6.332262182584325e-06, + "loss": 0.2587, + "step": 7964 + }, + { + "epoch": 0.63, + "learning_rate": 6.3298750979687515e-06, + "loss": 0.3169, + "step": 7965 + }, + { + "epoch": 0.63, + "learning_rate": 6.327488255013244e-06, + "loss": 0.2583, + "step": 7966 + }, + { + "epoch": 0.63, + "learning_rate": 6.325101653874965e-06, + "loss": 0.4265, + "step": 7967 + }, + { + "epoch": 0.63, + "learning_rate": 6.322715294711057e-06, + "loss": 0.3392, + "step": 7968 + }, + { + "epoch": 0.63, + "learning_rate": 6.320329177678656e-06, + "loss": 0.28, + "step": 7969 + }, + { + "epoch": 0.63, + "learning_rate": 6.31794330293487e-06, + "loss": 0.3849, + "step": 7970 + }, + { + "epoch": 0.63, + "learning_rate": 6.315557670636803e-06, + "loss": 0.3915, + "step": 7971 + }, + { + "epoch": 0.63, + "learning_rate": 6.313172280941534e-06, + "loss": 0.4249, + "step": 7972 + }, + { + "epoch": 0.63, + "learning_rate": 6.31078713400613e-06, + "loss": 0.3541, + "step": 7973 + }, + { + "epoch": 0.63, + "learning_rate": 6.308402229987641e-06, + "loss": 0.2755, + "step": 7974 + }, + { + "epoch": 0.63, + "learning_rate": 6.3060175690431055e-06, + "loss": 0.2805, + "step": 7975 + }, + { + "epoch": 0.63, + "learning_rate": 6.303633151329535e-06, + "loss": 0.2176, + "step": 7976 + }, + { + "epoch": 0.63, + "learning_rate": 6.3012489770039396e-06, + "loss": 0.2858, + "step": 7977 + }, + { + "epoch": 0.63, + "learning_rate": 6.2988650462232995e-06, + "loss": 0.3643, + "step": 7978 + }, + { + "epoch": 0.63, + "learning_rate": 6.296481359144587e-06, + "loss": 0.3028, + "step": 7979 + }, + { + "epoch": 0.63, + "learning_rate": 6.29409791592476e-06, + "loss": 0.4966, + "step": 7980 + }, + { + "epoch": 0.63, + "learning_rate": 6.2917147167207495e-06, + "loss": 0.2834, + "step": 7981 + }, + { + "epoch": 0.63, + "learning_rate": 6.289331761689482e-06, + "loss": 0.2956, + "step": 7982 + }, + { + "epoch": 0.63, + "learning_rate": 6.286949050987868e-06, + "loss": 0.397, + "step": 7983 + }, + { + "epoch": 0.63, + "learning_rate": 6.284566584772791e-06, + "loss": 0.3436, + "step": 7984 + }, + { + "epoch": 0.63, + "learning_rate": 6.2821843632011245e-06, + "loss": 0.2808, + "step": 7985 + }, + { + "epoch": 0.63, + "learning_rate": 6.2798023864297315e-06, + "loss": 0.3119, + "step": 7986 + }, + { + "epoch": 0.63, + "learning_rate": 6.277420654615449e-06, + "loss": 0.2875, + "step": 7987 + }, + { + "epoch": 0.63, + "learning_rate": 6.275039167915103e-06, + "loss": 0.271, + "step": 7988 + }, + { + "epoch": 0.63, + "learning_rate": 6.2726579264855084e-06, + "loss": 0.2851, + "step": 7989 + }, + { + "epoch": 0.63, + "learning_rate": 6.270276930483451e-06, + "loss": 0.3978, + "step": 7990 + }, + { + "epoch": 0.63, + "learning_rate": 6.267896180065711e-06, + "loss": 0.3018, + "step": 7991 + }, + { + "epoch": 0.63, + "learning_rate": 6.265515675389053e-06, + "loss": 0.3438, + "step": 7992 + }, + { + "epoch": 0.63, + "learning_rate": 6.263135416610217e-06, + "loss": 0.3443, + "step": 7993 + }, + { + "epoch": 0.63, + "learning_rate": 6.260755403885934e-06, + "loss": 0.406, + "step": 7994 + }, + { + "epoch": 0.63, + "learning_rate": 6.258375637372914e-06, + "loss": 0.3436, + "step": 7995 + }, + { + "epoch": 0.63, + "learning_rate": 6.2559961172278545e-06, + "loss": 0.3208, + "step": 7996 + }, + { + "epoch": 0.63, + "learning_rate": 6.253616843607439e-06, + "loss": 0.3874, + "step": 7997 + }, + { + "epoch": 0.63, + "learning_rate": 6.251237816668324e-06, + "loss": 0.3, + "step": 7998 + }, + { + "epoch": 0.63, + "learning_rate": 6.248859036567162e-06, + "loss": 0.2984, + "step": 7999 + }, + { + "epoch": 0.63, + "learning_rate": 6.246480503460585e-06, + "loss": 0.3689, + "step": 8000 + }, + { + "epoch": 0.63, + "learning_rate": 6.2441022175052034e-06, + "loss": 0.4676, + "step": 8001 + }, + { + "epoch": 0.63, + "learning_rate": 6.241724178857621e-06, + "loss": 0.2348, + "step": 8002 + }, + { + "epoch": 0.63, + "learning_rate": 6.2393463876744165e-06, + "loss": 0.2929, + "step": 8003 + }, + { + "epoch": 0.63, + "learning_rate": 6.236968844112157e-06, + "loss": 0.3362, + "step": 8004 + }, + { + "epoch": 0.63, + "learning_rate": 6.234591548327393e-06, + "loss": 0.4639, + "step": 8005 + }, + { + "epoch": 0.63, + "learning_rate": 6.232214500476657e-06, + "loss": 0.3088, + "step": 8006 + }, + { + "epoch": 0.63, + "learning_rate": 6.229837700716465e-06, + "loss": 0.3561, + "step": 8007 + }, + { + "epoch": 0.63, + "learning_rate": 6.227461149203324e-06, + "loss": 0.2945, + "step": 8008 + }, + { + "epoch": 0.63, + "learning_rate": 6.225084846093711e-06, + "loss": 0.2933, + "step": 8009 + }, + { + "epoch": 0.63, + "learning_rate": 6.222708791544098e-06, + "loss": 0.3418, + "step": 8010 + }, + { + "epoch": 0.63, + "learning_rate": 6.220332985710936e-06, + "loss": 0.3698, + "step": 8011 + }, + { + "epoch": 0.63, + "learning_rate": 6.21795742875066e-06, + "loss": 0.4253, + "step": 8012 + }, + { + "epoch": 0.63, + "learning_rate": 6.21558212081969e-06, + "loss": 0.2896, + "step": 8013 + }, + { + "epoch": 0.63, + "learning_rate": 6.213207062074427e-06, + "loss": 0.2923, + "step": 8014 + }, + { + "epoch": 0.63, + "learning_rate": 6.210832252671257e-06, + "loss": 0.306, + "step": 8015 + }, + { + "epoch": 0.64, + "learning_rate": 6.208457692766554e-06, + "loss": 0.3934, + "step": 8016 + }, + { + "epoch": 0.64, + "learning_rate": 6.206083382516665e-06, + "loss": 0.2546, + "step": 8017 + }, + { + "epoch": 0.64, + "learning_rate": 6.203709322077933e-06, + "loss": 0.3311, + "step": 8018 + }, + { + "epoch": 0.64, + "learning_rate": 6.201335511606673e-06, + "loss": 0.3493, + "step": 8019 + }, + { + "epoch": 0.64, + "learning_rate": 6.198961951259193e-06, + "loss": 0.3162, + "step": 8020 + }, + { + "epoch": 0.64, + "learning_rate": 6.196588641191778e-06, + "loss": 0.3759, + "step": 8021 + }, + { + "epoch": 0.64, + "learning_rate": 6.194215581560701e-06, + "loss": 0.4077, + "step": 8022 + }, + { + "epoch": 0.64, + "learning_rate": 6.191842772522214e-06, + "loss": 0.3149, + "step": 8023 + }, + { + "epoch": 0.64, + "learning_rate": 6.18947021423256e-06, + "loss": 0.5153, + "step": 8024 + }, + { + "epoch": 0.64, + "learning_rate": 6.187097906847954e-06, + "loss": 0.3367, + "step": 8025 + }, + { + "epoch": 0.64, + "learning_rate": 6.184725850524608e-06, + "loss": 0.3177, + "step": 8026 + }, + { + "epoch": 0.64, + "learning_rate": 6.182354045418704e-06, + "loss": 0.396, + "step": 8027 + }, + { + "epoch": 0.64, + "learning_rate": 6.179982491686416e-06, + "loss": 0.2387, + "step": 8028 + }, + { + "epoch": 0.64, + "learning_rate": 6.177611189483903e-06, + "loss": 0.2904, + "step": 8029 + }, + { + "epoch": 0.64, + "learning_rate": 6.175240138967299e-06, + "loss": 0.3752, + "step": 8030 + }, + { + "epoch": 0.64, + "learning_rate": 6.172869340292729e-06, + "loss": 0.3522, + "step": 8031 + }, + { + "epoch": 0.64, + "learning_rate": 6.170498793616298e-06, + "loss": 0.3184, + "step": 8032 + }, + { + "epoch": 0.64, + "learning_rate": 6.168128499094095e-06, + "loss": 0.3109, + "step": 8033 + }, + { + "epoch": 0.64, + "learning_rate": 6.165758456882193e-06, + "loss": 0.3027, + "step": 8034 + }, + { + "epoch": 0.64, + "learning_rate": 6.163388667136646e-06, + "loss": 0.3406, + "step": 8035 + }, + { + "epoch": 0.64, + "learning_rate": 6.161019130013495e-06, + "loss": 0.3729, + "step": 8036 + }, + { + "epoch": 0.64, + "learning_rate": 6.158649845668764e-06, + "loss": 0.3221, + "step": 8037 + }, + { + "epoch": 0.64, + "learning_rate": 6.156280814258455e-06, + "loss": 0.3228, + "step": 8038 + }, + { + "epoch": 0.64, + "learning_rate": 6.153912035938559e-06, + "loss": 0.2705, + "step": 8039 + }, + { + "epoch": 0.64, + "learning_rate": 6.151543510865053e-06, + "loss": 0.2426, + "step": 8040 + }, + { + "epoch": 0.64, + "learning_rate": 6.149175239193887e-06, + "loss": 0.3932, + "step": 8041 + }, + { + "epoch": 0.64, + "learning_rate": 6.1468072210810035e-06, + "loss": 0.2593, + "step": 8042 + }, + { + "epoch": 0.64, + "learning_rate": 6.144439456682323e-06, + "loss": 0.3584, + "step": 8043 + }, + { + "epoch": 0.64, + "learning_rate": 6.142071946153751e-06, + "loss": 0.3137, + "step": 8044 + }, + { + "epoch": 0.64, + "learning_rate": 6.139704689651181e-06, + "loss": 0.3567, + "step": 8045 + }, + { + "epoch": 0.64, + "learning_rate": 6.1373376873304814e-06, + "loss": 0.2475, + "step": 8046 + }, + { + "epoch": 0.64, + "learning_rate": 6.134970939347511e-06, + "loss": 0.2448, + "step": 8047 + }, + { + "epoch": 0.64, + "learning_rate": 6.132604445858104e-06, + "loss": 0.2603, + "step": 8048 + }, + { + "epoch": 0.64, + "learning_rate": 6.130238207018085e-06, + "loss": 0.2485, + "step": 8049 + }, + { + "epoch": 0.64, + "learning_rate": 6.127872222983264e-06, + "loss": 0.2632, + "step": 8050 + }, + { + "epoch": 0.64, + "learning_rate": 6.125506493909422e-06, + "loss": 0.331, + "step": 8051 + }, + { + "epoch": 0.64, + "learning_rate": 6.123141019952334e-06, + "loss": 0.3611, + "step": 8052 + }, + { + "epoch": 0.64, + "learning_rate": 6.1207758012677595e-06, + "loss": 0.3765, + "step": 8053 + }, + { + "epoch": 0.64, + "learning_rate": 6.11841083801143e-06, + "loss": 0.3564, + "step": 8054 + }, + { + "epoch": 0.64, + "learning_rate": 6.116046130339073e-06, + "loss": 0.3714, + "step": 8055 + }, + { + "epoch": 0.64, + "learning_rate": 6.1136816784063855e-06, + "loss": 0.3709, + "step": 8056 + }, + { + "epoch": 0.64, + "learning_rate": 6.1113174823690615e-06, + "loss": 0.2888, + "step": 8057 + }, + { + "epoch": 0.64, + "learning_rate": 6.108953542382771e-06, + "loss": 0.361, + "step": 8058 + }, + { + "epoch": 0.64, + "learning_rate": 6.106589858603167e-06, + "loss": 0.3222, + "step": 8059 + }, + { + "epoch": 0.64, + "learning_rate": 6.1042264311858845e-06, + "loss": 0.3484, + "step": 8060 + }, + { + "epoch": 0.64, + "learning_rate": 6.101863260286551e-06, + "loss": 0.421, + "step": 8061 + }, + { + "epoch": 0.64, + "learning_rate": 6.099500346060765e-06, + "loss": 0.323, + "step": 8062 + }, + { + "epoch": 0.64, + "learning_rate": 6.09713768866411e-06, + "loss": 0.3116, + "step": 8063 + }, + { + "epoch": 0.64, + "learning_rate": 6.094775288252157e-06, + "loss": 0.2446, + "step": 8064 + }, + { + "epoch": 0.64, + "learning_rate": 6.092413144980465e-06, + "loss": 0.3233, + "step": 8065 + }, + { + "epoch": 0.64, + "learning_rate": 6.090051259004563e-06, + "loss": 0.2778, + "step": 8066 + }, + { + "epoch": 0.64, + "learning_rate": 6.087689630479974e-06, + "loss": 0.3709, + "step": 8067 + }, + { + "epoch": 0.64, + "learning_rate": 6.085328259562195e-06, + "loss": 0.4323, + "step": 8068 + }, + { + "epoch": 0.64, + "learning_rate": 6.082967146406714e-06, + "loss": 0.3475, + "step": 8069 + }, + { + "epoch": 0.64, + "learning_rate": 6.0806062911690025e-06, + "loss": 0.3043, + "step": 8070 + }, + { + "epoch": 0.64, + "learning_rate": 6.078245694004503e-06, + "loss": 0.2943, + "step": 8071 + }, + { + "epoch": 0.64, + "learning_rate": 6.075885355068658e-06, + "loss": 0.3601, + "step": 8072 + }, + { + "epoch": 0.64, + "learning_rate": 6.073525274516879e-06, + "loss": 0.3117, + "step": 8073 + }, + { + "epoch": 0.64, + "learning_rate": 6.071165452504568e-06, + "loss": 0.3015, + "step": 8074 + }, + { + "epoch": 0.64, + "learning_rate": 6.068805889187109e-06, + "loss": 0.3208, + "step": 8075 + }, + { + "epoch": 0.64, + "learning_rate": 6.066446584719864e-06, + "loss": 0.4404, + "step": 8076 + }, + { + "epoch": 0.64, + "learning_rate": 6.064087539258186e-06, + "loss": 0.361, + "step": 8077 + }, + { + "epoch": 0.64, + "learning_rate": 6.061728752957406e-06, + "loss": 0.3359, + "step": 8078 + }, + { + "epoch": 0.64, + "learning_rate": 6.059370225972834e-06, + "loss": 0.3688, + "step": 8079 + }, + { + "epoch": 0.64, + "learning_rate": 6.057011958459776e-06, + "loss": 0.3006, + "step": 8080 + }, + { + "epoch": 0.64, + "learning_rate": 6.0546539505735055e-06, + "loss": 0.3053, + "step": 8081 + }, + { + "epoch": 0.64, + "learning_rate": 6.052296202469288e-06, + "loss": 0.4418, + "step": 8082 + }, + { + "epoch": 0.64, + "learning_rate": 6.049938714302372e-06, + "loss": 0.4857, + "step": 8083 + }, + { + "epoch": 0.64, + "learning_rate": 6.047581486227984e-06, + "loss": 0.3086, + "step": 8084 + }, + { + "epoch": 0.64, + "learning_rate": 6.045224518401338e-06, + "loss": 0.2856, + "step": 8085 + }, + { + "epoch": 0.64, + "learning_rate": 6.04286781097763e-06, + "loss": 0.4181, + "step": 8086 + }, + { + "epoch": 0.64, + "learning_rate": 6.040511364112034e-06, + "loss": 0.3249, + "step": 8087 + }, + { + "epoch": 0.64, + "learning_rate": 6.038155177959715e-06, + "loss": 0.3436, + "step": 8088 + }, + { + "epoch": 0.64, + "learning_rate": 6.035799252675811e-06, + "loss": 0.2591, + "step": 8089 + }, + { + "epoch": 0.64, + "learning_rate": 6.0334435884154526e-06, + "loss": 0.2998, + "step": 8090 + }, + { + "epoch": 0.64, + "learning_rate": 6.031088185333751e-06, + "loss": 0.3963, + "step": 8091 + }, + { + "epoch": 0.64, + "learning_rate": 6.028733043585793e-06, + "loss": 0.3247, + "step": 8092 + }, + { + "epoch": 0.64, + "learning_rate": 6.026378163326654e-06, + "loss": 0.363, + "step": 8093 + }, + { + "epoch": 0.64, + "learning_rate": 6.024023544711396e-06, + "loss": 0.2751, + "step": 8094 + }, + { + "epoch": 0.64, + "learning_rate": 6.021669187895054e-06, + "loss": 0.399, + "step": 8095 + }, + { + "epoch": 0.64, + "learning_rate": 6.019315093032656e-06, + "loss": 0.3769, + "step": 8096 + }, + { + "epoch": 0.64, + "learning_rate": 6.016961260279204e-06, + "loss": 0.3575, + "step": 8097 + }, + { + "epoch": 0.64, + "learning_rate": 6.0146076897896865e-06, + "loss": 0.3929, + "step": 8098 + }, + { + "epoch": 0.64, + "learning_rate": 6.012254381719078e-06, + "loss": 0.3205, + "step": 8099 + }, + { + "epoch": 0.64, + "learning_rate": 6.0099013362223305e-06, + "loss": 0.4255, + "step": 8100 + }, + { + "epoch": 0.64, + "learning_rate": 6.007548553454379e-06, + "loss": 0.383, + "step": 8101 + }, + { + "epoch": 0.64, + "learning_rate": 6.005196033570147e-06, + "loss": 0.3743, + "step": 8102 + }, + { + "epoch": 0.64, + "learning_rate": 6.002843776724534e-06, + "loss": 0.4146, + "step": 8103 + }, + { + "epoch": 0.64, + "learning_rate": 6.000491783072426e-06, + "loss": 0.3891, + "step": 8104 + }, + { + "epoch": 0.64, + "learning_rate": 5.998140052768687e-06, + "loss": 0.3099, + "step": 8105 + }, + { + "epoch": 0.64, + "learning_rate": 5.995788585968171e-06, + "loss": 0.3568, + "step": 8106 + }, + { + "epoch": 0.64, + "learning_rate": 5.993437382825711e-06, + "loss": 0.3543, + "step": 8107 + }, + { + "epoch": 0.64, + "learning_rate": 5.991086443496119e-06, + "loss": 0.407, + "step": 8108 + }, + { + "epoch": 0.64, + "learning_rate": 5.9887357681341955e-06, + "loss": 0.2954, + "step": 8109 + }, + { + "epoch": 0.64, + "learning_rate": 5.9863853568947215e-06, + "loss": 0.3991, + "step": 8110 + }, + { + "epoch": 0.64, + "learning_rate": 5.9840352099324595e-06, + "loss": 0.2431, + "step": 8111 + }, + { + "epoch": 0.64, + "learning_rate": 5.981685327402156e-06, + "loss": 0.3056, + "step": 8112 + }, + { + "epoch": 0.64, + "learning_rate": 5.9793357094585365e-06, + "loss": 0.359, + "step": 8113 + }, + { + "epoch": 0.64, + "learning_rate": 5.976986356256316e-06, + "loss": 0.3282, + "step": 8114 + }, + { + "epoch": 0.64, + "learning_rate": 5.974637267950187e-06, + "loss": 0.3071, + "step": 8115 + }, + { + "epoch": 0.64, + "learning_rate": 5.972288444694822e-06, + "loss": 0.3422, + "step": 8116 + }, + { + "epoch": 0.64, + "learning_rate": 5.9699398866448846e-06, + "loss": 0.4117, + "step": 8117 + }, + { + "epoch": 0.64, + "learning_rate": 5.967591593955016e-06, + "loss": 0.3289, + "step": 8118 + }, + { + "epoch": 0.64, + "learning_rate": 5.965243566779837e-06, + "loss": 0.3314, + "step": 8119 + }, + { + "epoch": 0.64, + "learning_rate": 5.962895805273956e-06, + "loss": 0.3795, + "step": 8120 + }, + { + "epoch": 0.64, + "learning_rate": 5.960548309591958e-06, + "loss": 0.2891, + "step": 8121 + }, + { + "epoch": 0.64, + "learning_rate": 5.958201079888419e-06, + "loss": 0.3303, + "step": 8122 + }, + { + "epoch": 0.64, + "learning_rate": 5.9558541163178915e-06, + "loss": 0.4236, + "step": 8123 + }, + { + "epoch": 0.64, + "learning_rate": 5.953507419034911e-06, + "loss": 0.4395, + "step": 8124 + }, + { + "epoch": 0.64, + "learning_rate": 5.951160988193998e-06, + "loss": 0.4021, + "step": 8125 + }, + { + "epoch": 0.64, + "learning_rate": 5.948814823949649e-06, + "loss": 0.346, + "step": 8126 + }, + { + "epoch": 0.64, + "learning_rate": 5.946468926456352e-06, + "loss": 0.2706, + "step": 8127 + }, + { + "epoch": 0.64, + "learning_rate": 5.944123295868574e-06, + "loss": 0.2943, + "step": 8128 + }, + { + "epoch": 0.64, + "learning_rate": 5.9417779323407576e-06, + "loss": 0.3401, + "step": 8129 + }, + { + "epoch": 0.64, + "learning_rate": 5.939432836027339e-06, + "loss": 0.3218, + "step": 8130 + }, + { + "epoch": 0.64, + "learning_rate": 5.937088007082731e-06, + "loss": 0.3368, + "step": 8131 + }, + { + "epoch": 0.64, + "learning_rate": 5.934743445661326e-06, + "loss": 0.3475, + "step": 8132 + }, + { + "epoch": 0.64, + "learning_rate": 5.932399151917507e-06, + "loss": 0.3339, + "step": 8133 + }, + { + "epoch": 0.64, + "learning_rate": 5.93005512600563e-06, + "loss": 0.4249, + "step": 8134 + }, + { + "epoch": 0.64, + "learning_rate": 5.92771136808004e-06, + "loss": 0.3406, + "step": 8135 + }, + { + "epoch": 0.64, + "learning_rate": 5.925367878295063e-06, + "loss": 0.3043, + "step": 8136 + }, + { + "epoch": 0.64, + "learning_rate": 5.9230246568050035e-06, + "loss": 0.3272, + "step": 8137 + }, + { + "epoch": 0.64, + "learning_rate": 5.920681703764153e-06, + "loss": 0.3181, + "step": 8138 + }, + { + "epoch": 0.64, + "learning_rate": 5.918339019326789e-06, + "loss": 0.276, + "step": 8139 + }, + { + "epoch": 0.64, + "learning_rate": 5.915996603647157e-06, + "loss": 0.3367, + "step": 8140 + }, + { + "epoch": 0.64, + "learning_rate": 5.913654456879496e-06, + "loss": 0.4092, + "step": 8141 + }, + { + "epoch": 0.65, + "learning_rate": 5.911312579178028e-06, + "loss": 0.3814, + "step": 8142 + }, + { + "epoch": 0.65, + "learning_rate": 5.908970970696955e-06, + "loss": 0.3061, + "step": 8143 + }, + { + "epoch": 0.65, + "learning_rate": 5.906629631590457e-06, + "loss": 0.2723, + "step": 8144 + }, + { + "epoch": 0.65, + "learning_rate": 5.904288562012703e-06, + "loss": 0.282, + "step": 8145 + }, + { + "epoch": 0.65, + "learning_rate": 5.901947762117838e-06, + "loss": 0.3745, + "step": 8146 + }, + { + "epoch": 0.65, + "learning_rate": 5.899607232059994e-06, + "loss": 0.3344, + "step": 8147 + }, + { + "epoch": 0.65, + "learning_rate": 5.897266971993286e-06, + "loss": 0.4199, + "step": 8148 + }, + { + "epoch": 0.65, + "learning_rate": 5.894926982071805e-06, + "loss": 0.3536, + "step": 8149 + }, + { + "epoch": 0.65, + "learning_rate": 5.892587262449631e-06, + "loss": 0.3413, + "step": 8150 + }, + { + "epoch": 0.65, + "learning_rate": 5.890247813280822e-06, + "loss": 0.3719, + "step": 8151 + }, + { + "epoch": 0.65, + "learning_rate": 5.8879086347194196e-06, + "loss": 0.3512, + "step": 8152 + }, + { + "epoch": 0.65, + "learning_rate": 5.885569726919449e-06, + "loss": 0.4041, + "step": 8153 + }, + { + "epoch": 0.65, + "learning_rate": 5.883231090034911e-06, + "loss": 0.2719, + "step": 8154 + }, + { + "epoch": 0.65, + "learning_rate": 5.8808927242197984e-06, + "loss": 0.535, + "step": 8155 + }, + { + "epoch": 0.65, + "learning_rate": 5.878554629628081e-06, + "loss": 0.4265, + "step": 8156 + }, + { + "epoch": 0.65, + "learning_rate": 5.87621680641371e-06, + "loss": 0.3837, + "step": 8157 + }, + { + "epoch": 0.65, + "learning_rate": 5.873879254730621e-06, + "loss": 0.2418, + "step": 8158 + }, + { + "epoch": 0.65, + "learning_rate": 5.871541974732727e-06, + "loss": 0.2378, + "step": 8159 + }, + { + "epoch": 0.65, + "learning_rate": 5.869204966573929e-06, + "loss": 0.2475, + "step": 8160 + }, + { + "epoch": 0.65, + "learning_rate": 5.866868230408111e-06, + "loss": 0.3424, + "step": 8161 + }, + { + "epoch": 0.65, + "learning_rate": 5.86453176638913e-06, + "loss": 0.4144, + "step": 8162 + }, + { + "epoch": 0.65, + "learning_rate": 5.862195574670834e-06, + "loss": 0.2705, + "step": 8163 + }, + { + "epoch": 0.65, + "learning_rate": 5.85985965540705e-06, + "loss": 0.3949, + "step": 8164 + }, + { + "epoch": 0.65, + "learning_rate": 5.857524008751586e-06, + "loss": 0.2307, + "step": 8165 + }, + { + "epoch": 0.65, + "learning_rate": 5.855188634858235e-06, + "loss": 0.3801, + "step": 8166 + }, + { + "epoch": 0.65, + "learning_rate": 5.852853533880768e-06, + "loss": 0.3116, + "step": 8167 + }, + { + "epoch": 0.65, + "learning_rate": 5.850518705972941e-06, + "loss": 0.4472, + "step": 8168 + }, + { + "epoch": 0.65, + "learning_rate": 5.848184151288492e-06, + "loss": 0.2909, + "step": 8169 + }, + { + "epoch": 0.65, + "learning_rate": 5.845849869981137e-06, + "loss": 0.2879, + "step": 8170 + }, + { + "epoch": 0.65, + "learning_rate": 5.843515862204581e-06, + "loss": 0.3577, + "step": 8171 + }, + { + "epoch": 0.65, + "learning_rate": 5.841182128112506e-06, + "loss": 0.2408, + "step": 8172 + }, + { + "epoch": 0.65, + "learning_rate": 5.838848667858577e-06, + "loss": 0.3905, + "step": 8173 + }, + { + "epoch": 0.65, + "learning_rate": 5.83651548159644e-06, + "loss": 0.3319, + "step": 8174 + }, + { + "epoch": 0.65, + "learning_rate": 5.834182569479727e-06, + "loss": 0.3855, + "step": 8175 + }, + { + "epoch": 0.65, + "learning_rate": 5.831849931662047e-06, + "loss": 0.2192, + "step": 8176 + }, + { + "epoch": 0.65, + "learning_rate": 5.829517568296989e-06, + "loss": 0.3303, + "step": 8177 + }, + { + "epoch": 0.65, + "learning_rate": 5.827185479538138e-06, + "loss": 0.3799, + "step": 8178 + }, + { + "epoch": 0.65, + "learning_rate": 5.824853665539043e-06, + "loss": 0.3039, + "step": 8179 + }, + { + "epoch": 0.65, + "learning_rate": 5.82252212645324e-06, + "loss": 0.2601, + "step": 8180 + }, + { + "epoch": 0.65, + "learning_rate": 5.820190862434259e-06, + "loss": 0.2921, + "step": 8181 + }, + { + "epoch": 0.65, + "learning_rate": 5.8178598736355985e-06, + "loss": 0.2905, + "step": 8182 + }, + { + "epoch": 0.65, + "learning_rate": 5.815529160210738e-06, + "loss": 0.365, + "step": 8183 + }, + { + "epoch": 0.65, + "learning_rate": 5.813198722313151e-06, + "loss": 0.3302, + "step": 8184 + }, + { + "epoch": 0.65, + "learning_rate": 5.810868560096283e-06, + "loss": 0.3648, + "step": 8185 + }, + { + "epoch": 0.65, + "learning_rate": 5.808538673713564e-06, + "loss": 0.289, + "step": 8186 + }, + { + "epoch": 0.65, + "learning_rate": 5.8062090633184e-06, + "loss": 0.3849, + "step": 8187 + }, + { + "epoch": 0.65, + "learning_rate": 5.803879729064195e-06, + "loss": 0.2071, + "step": 8188 + }, + { + "epoch": 0.65, + "learning_rate": 5.801550671104319e-06, + "loss": 0.4312, + "step": 8189 + }, + { + "epoch": 0.65, + "learning_rate": 5.7992218895921256e-06, + "loss": 0.3021, + "step": 8190 + }, + { + "epoch": 0.65, + "learning_rate": 5.796893384680964e-06, + "loss": 0.3682, + "step": 8191 + }, + { + "epoch": 0.65, + "learning_rate": 5.7945651565241455e-06, + "loss": 0.2449, + "step": 8192 + }, + { + "epoch": 0.65, + "learning_rate": 5.792237205274974e-06, + "loss": 0.293, + "step": 8193 + }, + { + "epoch": 0.65, + "learning_rate": 5.789909531086741e-06, + "loss": 0.4216, + "step": 8194 + }, + { + "epoch": 0.65, + "learning_rate": 5.787582134112706e-06, + "loss": 0.3188, + "step": 8195 + }, + { + "epoch": 0.65, + "learning_rate": 5.785255014506115e-06, + "loss": 0.3255, + "step": 8196 + }, + { + "epoch": 0.65, + "learning_rate": 5.782928172420206e-06, + "loss": 0.356, + "step": 8197 + }, + { + "epoch": 0.65, + "learning_rate": 5.780601608008185e-06, + "loss": 0.3971, + "step": 8198 + }, + { + "epoch": 0.65, + "learning_rate": 5.778275321423241e-06, + "loss": 0.4135, + "step": 8199 + }, + { + "epoch": 0.65, + "learning_rate": 5.7759493128185584e-06, + "loss": 0.4206, + "step": 8200 + }, + { + "epoch": 0.65, + "learning_rate": 5.773623582347289e-06, + "loss": 0.4514, + "step": 8201 + }, + { + "epoch": 0.65, + "learning_rate": 5.77129813016257e-06, + "loss": 0.3645, + "step": 8202 + }, + { + "epoch": 0.65, + "learning_rate": 5.768972956417518e-06, + "loss": 0.3226, + "step": 8203 + }, + { + "epoch": 0.65, + "learning_rate": 5.766648061265242e-06, + "loss": 0.3095, + "step": 8204 + }, + { + "epoch": 0.65, + "learning_rate": 5.764323444858823e-06, + "loss": 0.3218, + "step": 8205 + }, + { + "epoch": 0.65, + "learning_rate": 5.761999107351319e-06, + "loss": 0.4112, + "step": 8206 + }, + { + "epoch": 0.65, + "learning_rate": 5.759675048895785e-06, + "loss": 0.3569, + "step": 8207 + }, + { + "epoch": 0.65, + "learning_rate": 5.757351269645248e-06, + "loss": 0.462, + "step": 8208 + }, + { + "epoch": 0.65, + "learning_rate": 5.75502776975271e-06, + "loss": 0.3204, + "step": 8209 + }, + { + "epoch": 0.65, + "learning_rate": 5.752704549371173e-06, + "loss": 0.4037, + "step": 8210 + }, + { + "epoch": 0.65, + "learning_rate": 5.750381608653605e-06, + "loss": 0.3194, + "step": 8211 + }, + { + "epoch": 0.65, + "learning_rate": 5.748058947752955e-06, + "loss": 0.2283, + "step": 8212 + }, + { + "epoch": 0.65, + "learning_rate": 5.745736566822169e-06, + "loss": 0.2117, + "step": 8213 + }, + { + "epoch": 0.65, + "learning_rate": 5.743414466014159e-06, + "loss": 0.3658, + "step": 8214 + }, + { + "epoch": 0.65, + "learning_rate": 5.7410926454818265e-06, + "loss": 0.4171, + "step": 8215 + }, + { + "epoch": 0.65, + "learning_rate": 5.738771105378046e-06, + "loss": 0.3921, + "step": 8216 + }, + { + "epoch": 0.65, + "learning_rate": 5.7364498458556914e-06, + "loss": 0.3397, + "step": 8217 + }, + { + "epoch": 0.65, + "learning_rate": 5.734128867067593e-06, + "loss": 0.2827, + "step": 8218 + }, + { + "epoch": 0.65, + "learning_rate": 5.731808169166586e-06, + "loss": 0.2803, + "step": 8219 + }, + { + "epoch": 0.65, + "learning_rate": 5.7294877523054735e-06, + "loss": 0.2903, + "step": 8220 + }, + { + "epoch": 0.65, + "learning_rate": 5.727167616637042e-06, + "loss": 0.3474, + "step": 8221 + }, + { + "epoch": 0.65, + "learning_rate": 5.7248477623140655e-06, + "loss": 0.3745, + "step": 8222 + }, + { + "epoch": 0.65, + "learning_rate": 5.722528189489294e-06, + "loss": 0.3129, + "step": 8223 + }, + { + "epoch": 0.65, + "learning_rate": 5.720208898315454e-06, + "loss": 0.4547, + "step": 8224 + }, + { + "epoch": 0.65, + "learning_rate": 5.717889888945271e-06, + "loss": 0.4779, + "step": 8225 + }, + { + "epoch": 0.65, + "learning_rate": 5.715571161531433e-06, + "loss": 0.307, + "step": 8226 + }, + { + "epoch": 0.65, + "learning_rate": 5.7132527162266194e-06, + "loss": 0.4065, + "step": 8227 + }, + { + "epoch": 0.65, + "learning_rate": 5.710934553183484e-06, + "loss": 0.363, + "step": 8228 + }, + { + "epoch": 0.65, + "learning_rate": 5.708616672554675e-06, + "loss": 0.3712, + "step": 8229 + }, + { + "epoch": 0.65, + "learning_rate": 5.7062990744928086e-06, + "loss": 0.4556, + "step": 8230 + }, + { + "epoch": 0.65, + "learning_rate": 5.703981759150483e-06, + "loss": 0.2737, + "step": 8231 + }, + { + "epoch": 0.65, + "learning_rate": 5.701664726680294e-06, + "loss": 0.3499, + "step": 8232 + }, + { + "epoch": 0.65, + "learning_rate": 5.699347977234799e-06, + "loss": 0.4099, + "step": 8233 + }, + { + "epoch": 0.65, + "learning_rate": 5.697031510966542e-06, + "loss": 0.3303, + "step": 8234 + }, + { + "epoch": 0.65, + "learning_rate": 5.69471532802806e-06, + "loss": 0.3832, + "step": 8235 + }, + { + "epoch": 0.65, + "learning_rate": 5.692399428571857e-06, + "loss": 0.3451, + "step": 8236 + }, + { + "epoch": 0.65, + "learning_rate": 5.690083812750422e-06, + "loss": 0.2957, + "step": 8237 + }, + { + "epoch": 0.65, + "learning_rate": 5.687768480716233e-06, + "loss": 0.2884, + "step": 8238 + }, + { + "epoch": 0.65, + "learning_rate": 5.685453432621741e-06, + "loss": 0.2308, + "step": 8239 + }, + { + "epoch": 0.65, + "learning_rate": 5.683138668619381e-06, + "loss": 0.4064, + "step": 8240 + }, + { + "epoch": 0.65, + "learning_rate": 5.680824188861564e-06, + "loss": 0.304, + "step": 8241 + }, + { + "epoch": 0.65, + "learning_rate": 5.678509993500695e-06, + "loss": 0.2687, + "step": 8242 + }, + { + "epoch": 0.65, + "learning_rate": 5.676196082689149e-06, + "loss": 0.356, + "step": 8243 + }, + { + "epoch": 0.65, + "learning_rate": 5.673882456579282e-06, + "loss": 0.2964, + "step": 8244 + }, + { + "epoch": 0.65, + "learning_rate": 5.6715691153234445e-06, + "loss": 0.3304, + "step": 8245 + }, + { + "epoch": 0.65, + "learning_rate": 5.669256059073953e-06, + "loss": 0.26, + "step": 8246 + }, + { + "epoch": 0.65, + "learning_rate": 5.666943287983106e-06, + "loss": 0.4296, + "step": 8247 + }, + { + "epoch": 0.65, + "learning_rate": 5.664630802203201e-06, + "loss": 0.4923, + "step": 8248 + }, + { + "epoch": 0.65, + "learning_rate": 5.662318601886496e-06, + "loss": 0.4228, + "step": 8249 + }, + { + "epoch": 0.65, + "learning_rate": 5.660006687185235e-06, + "loss": 0.3261, + "step": 8250 + }, + { + "epoch": 0.65, + "learning_rate": 5.657695058251656e-06, + "loss": 0.4724, + "step": 8251 + }, + { + "epoch": 0.65, + "learning_rate": 5.655383715237963e-06, + "loss": 0.3097, + "step": 8252 + }, + { + "epoch": 0.65, + "learning_rate": 5.653072658296344e-06, + "loss": 0.2581, + "step": 8253 + }, + { + "epoch": 0.65, + "learning_rate": 5.650761887578977e-06, + "loss": 0.3821, + "step": 8254 + }, + { + "epoch": 0.65, + "learning_rate": 5.648451403238013e-06, + "loss": 0.3726, + "step": 8255 + }, + { + "epoch": 0.65, + "learning_rate": 5.646141205425586e-06, + "loss": 0.378, + "step": 8256 + }, + { + "epoch": 0.65, + "learning_rate": 5.643831294293808e-06, + "loss": 0.3742, + "step": 8257 + }, + { + "epoch": 0.65, + "learning_rate": 5.641521669994782e-06, + "loss": 0.3538, + "step": 8258 + }, + { + "epoch": 0.65, + "learning_rate": 5.639212332680581e-06, + "loss": 0.354, + "step": 8259 + }, + { + "epoch": 0.65, + "learning_rate": 5.636903282503263e-06, + "loss": 0.3169, + "step": 8260 + }, + { + "epoch": 0.65, + "learning_rate": 5.6345945196148734e-06, + "loss": 0.4596, + "step": 8261 + }, + { + "epoch": 0.65, + "learning_rate": 5.63228604416743e-06, + "loss": 0.284, + "step": 8262 + }, + { + "epoch": 0.65, + "learning_rate": 5.62997785631293e-06, + "loss": 0.3064, + "step": 8263 + }, + { + "epoch": 0.65, + "learning_rate": 5.627669956203365e-06, + "loss": 0.2525, + "step": 8264 + }, + { + "epoch": 0.65, + "learning_rate": 5.6253623439906955e-06, + "loss": 0.4597, + "step": 8265 + }, + { + "epoch": 0.65, + "learning_rate": 5.623055019826862e-06, + "loss": 0.3798, + "step": 8266 + }, + { + "epoch": 0.65, + "learning_rate": 5.6207479838637995e-06, + "loss": 0.3675, + "step": 8267 + }, + { + "epoch": 0.66, + "learning_rate": 5.618441236253411e-06, + "loss": 0.3148, + "step": 8268 + }, + { + "epoch": 0.66, + "learning_rate": 5.616134777147578e-06, + "loss": 0.3883, + "step": 8269 + }, + { + "epoch": 0.66, + "learning_rate": 5.6138286066981815e-06, + "loss": 0.3526, + "step": 8270 + }, + { + "epoch": 0.66, + "learning_rate": 5.611522725057067e-06, + "loss": 0.3313, + "step": 8271 + }, + { + "epoch": 0.66, + "learning_rate": 5.6092171323760635e-06, + "loss": 0.3563, + "step": 8272 + }, + { + "epoch": 0.66, + "learning_rate": 5.6069118288069824e-06, + "loss": 0.3396, + "step": 8273 + }, + { + "epoch": 0.66, + "learning_rate": 5.604606814501623e-06, + "loss": 0.3705, + "step": 8274 + }, + { + "epoch": 0.66, + "learning_rate": 5.602302089611755e-06, + "loss": 0.2405, + "step": 8275 + }, + { + "epoch": 0.66, + "learning_rate": 5.599997654289129e-06, + "loss": 0.375, + "step": 8276 + }, + { + "epoch": 0.66, + "learning_rate": 5.5976935086854914e-06, + "loss": 0.4806, + "step": 8277 + }, + { + "epoch": 0.66, + "learning_rate": 5.595389652952555e-06, + "loss": 0.3571, + "step": 8278 + }, + { + "epoch": 0.66, + "learning_rate": 5.59308608724201e-06, + "loss": 0.2861, + "step": 8279 + }, + { + "epoch": 0.66, + "learning_rate": 5.590782811705547e-06, + "loss": 0.3316, + "step": 8280 + }, + { + "epoch": 0.66, + "learning_rate": 5.588479826494817e-06, + "loss": 0.4197, + "step": 8281 + }, + { + "epoch": 0.66, + "learning_rate": 5.5861771317614624e-06, + "loss": 0.4047, + "step": 8282 + }, + { + "epoch": 0.66, + "learning_rate": 5.583874727657109e-06, + "loss": 0.2768, + "step": 8283 + }, + { + "epoch": 0.66, + "learning_rate": 5.581572614333356e-06, + "loss": 0.3595, + "step": 8284 + }, + { + "epoch": 0.66, + "learning_rate": 5.579270791941787e-06, + "loss": 0.2795, + "step": 8285 + }, + { + "epoch": 0.66, + "learning_rate": 5.5769692606339584e-06, + "loss": 0.3905, + "step": 8286 + }, + { + "epoch": 0.66, + "learning_rate": 5.574668020561428e-06, + "loss": 0.2968, + "step": 8287 + }, + { + "epoch": 0.66, + "learning_rate": 5.572367071875715e-06, + "loss": 0.3577, + "step": 8288 + }, + { + "epoch": 0.66, + "learning_rate": 5.570066414728321e-06, + "loss": 0.4365, + "step": 8289 + }, + { + "epoch": 0.66, + "learning_rate": 5.567766049270742e-06, + "loss": 0.2423, + "step": 8290 + }, + { + "epoch": 0.66, + "learning_rate": 5.5654659756544425e-06, + "loss": 0.322, + "step": 8291 + }, + { + "epoch": 0.66, + "learning_rate": 5.563166194030868e-06, + "loss": 0.4519, + "step": 8292 + }, + { + "epoch": 0.66, + "learning_rate": 5.560866704551454e-06, + "loss": 0.3872, + "step": 8293 + }, + { + "epoch": 0.66, + "learning_rate": 5.5585675073676085e-06, + "loss": 0.1819, + "step": 8294 + }, + { + "epoch": 0.66, + "learning_rate": 5.556268602630721e-06, + "loss": 0.3302, + "step": 8295 + }, + { + "epoch": 0.66, + "learning_rate": 5.553969990492164e-06, + "loss": 0.2926, + "step": 8296 + }, + { + "epoch": 0.66, + "learning_rate": 5.5516716711032906e-06, + "loss": 0.3395, + "step": 8297 + }, + { + "epoch": 0.66, + "learning_rate": 5.54937364461543e-06, + "loss": 0.3596, + "step": 8298 + }, + { + "epoch": 0.66, + "learning_rate": 5.547075911179902e-06, + "loss": 0.3006, + "step": 8299 + }, + { + "epoch": 0.66, + "learning_rate": 5.544778470948001e-06, + "loss": 0.3302, + "step": 8300 + }, + { + "epoch": 0.66, + "learning_rate": 5.542481324070996e-06, + "loss": 0.4151, + "step": 8301 + }, + { + "epoch": 0.66, + "learning_rate": 5.540184470700152e-06, + "loss": 0.3273, + "step": 8302 + }, + { + "epoch": 0.66, + "learning_rate": 5.537887910986701e-06, + "loss": 0.3805, + "step": 8303 + }, + { + "epoch": 0.66, + "learning_rate": 5.535591645081857e-06, + "loss": 0.3837, + "step": 8304 + }, + { + "epoch": 0.66, + "learning_rate": 5.5332956731368245e-06, + "loss": 0.2539, + "step": 8305 + }, + { + "epoch": 0.66, + "learning_rate": 5.530999995302781e-06, + "loss": 0.3032, + "step": 8306 + }, + { + "epoch": 0.66, + "learning_rate": 5.528704611730879e-06, + "loss": 0.3216, + "step": 8307 + }, + { + "epoch": 0.66, + "learning_rate": 5.5264095225722705e-06, + "loss": 0.3868, + "step": 8308 + }, + { + "epoch": 0.66, + "learning_rate": 5.524114727978067e-06, + "loss": 0.3373, + "step": 8309 + }, + { + "epoch": 0.66, + "learning_rate": 5.5218202280993725e-06, + "loss": 0.2123, + "step": 8310 + }, + { + "epoch": 0.66, + "learning_rate": 5.519526023087265e-06, + "loss": 0.2521, + "step": 8311 + }, + { + "epoch": 0.66, + "learning_rate": 5.517232113092814e-06, + "loss": 0.3235, + "step": 8312 + }, + { + "epoch": 0.66, + "learning_rate": 5.5149384982670585e-06, + "loss": 0.3687, + "step": 8313 + }, + { + "epoch": 0.66, + "learning_rate": 5.512645178761018e-06, + "loss": 0.3719, + "step": 8314 + }, + { + "epoch": 0.66, + "learning_rate": 5.5103521547257045e-06, + "loss": 0.3595, + "step": 8315 + }, + { + "epoch": 0.66, + "learning_rate": 5.508059426312099e-06, + "loss": 0.2824, + "step": 8316 + }, + { + "epoch": 0.66, + "learning_rate": 5.5057669936711625e-06, + "loss": 0.3335, + "step": 8317 + }, + { + "epoch": 0.66, + "learning_rate": 5.503474856953849e-06, + "loss": 0.3837, + "step": 8318 + }, + { + "epoch": 0.66, + "learning_rate": 5.50118301631108e-06, + "loss": 0.3261, + "step": 8319 + }, + { + "epoch": 0.66, + "learning_rate": 5.498891471893758e-06, + "loss": 0.3999, + "step": 8320 + }, + { + "epoch": 0.66, + "learning_rate": 5.49660022385278e-06, + "loss": 0.309, + "step": 8321 + }, + { + "epoch": 0.66, + "learning_rate": 5.494309272339007e-06, + "loss": 0.3751, + "step": 8322 + }, + { + "epoch": 0.66, + "learning_rate": 5.492018617503284e-06, + "loss": 0.1932, + "step": 8323 + }, + { + "epoch": 0.66, + "learning_rate": 5.48972825949645e-06, + "loss": 0.3247, + "step": 8324 + }, + { + "epoch": 0.66, + "learning_rate": 5.487438198469306e-06, + "loss": 0.4312, + "step": 8325 + }, + { + "epoch": 0.66, + "learning_rate": 5.485148434572645e-06, + "loss": 0.3768, + "step": 8326 + }, + { + "epoch": 0.66, + "learning_rate": 5.48285896795723e-06, + "loss": 0.5103, + "step": 8327 + }, + { + "epoch": 0.66, + "learning_rate": 5.480569798773822e-06, + "loss": 0.5049, + "step": 8328 + }, + { + "epoch": 0.66, + "learning_rate": 5.478280927173145e-06, + "loss": 0.3098, + "step": 8329 + }, + { + "epoch": 0.66, + "learning_rate": 5.4759923533059105e-06, + "loss": 0.4137, + "step": 8330 + }, + { + "epoch": 0.66, + "learning_rate": 5.473704077322814e-06, + "loss": 0.3154, + "step": 8331 + }, + { + "epoch": 0.66, + "learning_rate": 5.471416099374525e-06, + "loss": 0.3231, + "step": 8332 + }, + { + "epoch": 0.66, + "learning_rate": 5.469128419611691e-06, + "loss": 0.2755, + "step": 8333 + }, + { + "epoch": 0.66, + "learning_rate": 5.466841038184954e-06, + "loss": 0.3029, + "step": 8334 + }, + { + "epoch": 0.66, + "learning_rate": 5.464553955244922e-06, + "loss": 0.2691, + "step": 8335 + }, + { + "epoch": 0.66, + "learning_rate": 5.4622671709421856e-06, + "loss": 0.3516, + "step": 8336 + }, + { + "epoch": 0.66, + "learning_rate": 5.459980685427326e-06, + "loss": 0.3281, + "step": 8337 + }, + { + "epoch": 0.66, + "learning_rate": 5.457694498850892e-06, + "loss": 0.3295, + "step": 8338 + }, + { + "epoch": 0.66, + "learning_rate": 5.455408611363416e-06, + "loss": 0.3825, + "step": 8339 + }, + { + "epoch": 0.66, + "learning_rate": 5.45312302311542e-06, + "loss": 0.4009, + "step": 8340 + }, + { + "epoch": 0.66, + "learning_rate": 5.450837734257395e-06, + "loss": 0.3609, + "step": 8341 + }, + { + "epoch": 0.66, + "learning_rate": 5.448552744939815e-06, + "loss": 0.3594, + "step": 8342 + }, + { + "epoch": 0.66, + "learning_rate": 5.446268055313132e-06, + "loss": 0.2846, + "step": 8343 + }, + { + "epoch": 0.66, + "learning_rate": 5.443983665527792e-06, + "loss": 0.2616, + "step": 8344 + }, + { + "epoch": 0.66, + "learning_rate": 5.441699575734204e-06, + "loss": 0.3321, + "step": 8345 + }, + { + "epoch": 0.66, + "learning_rate": 5.439415786082762e-06, + "loss": 0.4022, + "step": 8346 + }, + { + "epoch": 0.66, + "learning_rate": 5.437132296723852e-06, + "loss": 0.2323, + "step": 8347 + }, + { + "epoch": 0.66, + "learning_rate": 5.434849107807823e-06, + "loss": 0.3858, + "step": 8348 + }, + { + "epoch": 0.66, + "learning_rate": 5.432566219485012e-06, + "loss": 0.334, + "step": 8349 + }, + { + "epoch": 0.66, + "learning_rate": 5.430283631905742e-06, + "loss": 0.3351, + "step": 8350 + }, + { + "epoch": 0.66, + "learning_rate": 5.428001345220306e-06, + "loss": 0.3075, + "step": 8351 + }, + { + "epoch": 0.66, + "learning_rate": 5.425719359578978e-06, + "loss": 0.3136, + "step": 8352 + }, + { + "epoch": 0.66, + "learning_rate": 5.423437675132025e-06, + "loss": 0.4623, + "step": 8353 + }, + { + "epoch": 0.66, + "learning_rate": 5.42115629202968e-06, + "loss": 0.404, + "step": 8354 + }, + { + "epoch": 0.66, + "learning_rate": 5.4188752104221565e-06, + "loss": 0.362, + "step": 8355 + }, + { + "epoch": 0.66, + "learning_rate": 5.416594430459663e-06, + "loss": 0.3819, + "step": 8356 + }, + { + "epoch": 0.66, + "learning_rate": 5.41431395229237e-06, + "loss": 0.3781, + "step": 8357 + }, + { + "epoch": 0.66, + "learning_rate": 5.41203377607044e-06, + "loss": 0.3507, + "step": 8358 + }, + { + "epoch": 0.66, + "learning_rate": 5.409753901944006e-06, + "loss": 0.3253, + "step": 8359 + }, + { + "epoch": 0.66, + "learning_rate": 5.407474330063194e-06, + "loss": 0.3502, + "step": 8360 + }, + { + "epoch": 0.66, + "learning_rate": 5.4051950605781e-06, + "loss": 0.4, + "step": 8361 + }, + { + "epoch": 0.66, + "learning_rate": 5.402916093638798e-06, + "loss": 0.3792, + "step": 8362 + }, + { + "epoch": 0.66, + "learning_rate": 5.400637429395357e-06, + "loss": 0.3672, + "step": 8363 + }, + { + "epoch": 0.66, + "learning_rate": 5.398359067997808e-06, + "loss": 0.3805, + "step": 8364 + }, + { + "epoch": 0.66, + "learning_rate": 5.3960810095961705e-06, + "loss": 0.3388, + "step": 8365 + }, + { + "epoch": 0.66, + "learning_rate": 5.39380325434045e-06, + "loss": 0.3208, + "step": 8366 + }, + { + "epoch": 0.66, + "learning_rate": 5.3915258023806195e-06, + "loss": 0.3451, + "step": 8367 + }, + { + "epoch": 0.66, + "learning_rate": 5.3892486538666386e-06, + "loss": 0.2988, + "step": 8368 + }, + { + "epoch": 0.66, + "learning_rate": 5.386971808948451e-06, + "loss": 0.3274, + "step": 8369 + }, + { + "epoch": 0.66, + "learning_rate": 5.384695267775975e-06, + "loss": 0.4039, + "step": 8370 + }, + { + "epoch": 0.66, + "learning_rate": 5.382419030499107e-06, + "loss": 0.2763, + "step": 8371 + }, + { + "epoch": 0.66, + "learning_rate": 5.380143097267723e-06, + "loss": 0.3146, + "step": 8372 + }, + { + "epoch": 0.66, + "learning_rate": 5.377867468231695e-06, + "loss": 0.3703, + "step": 8373 + }, + { + "epoch": 0.66, + "learning_rate": 5.3755921435408464e-06, + "loss": 0.2538, + "step": 8374 + }, + { + "epoch": 0.66, + "learning_rate": 5.373317123345008e-06, + "loss": 0.34, + "step": 8375 + }, + { + "epoch": 0.66, + "learning_rate": 5.371042407793974e-06, + "loss": 0.3193, + "step": 8376 + }, + { + "epoch": 0.66, + "learning_rate": 5.368767997037521e-06, + "loss": 0.4734, + "step": 8377 + }, + { + "epoch": 0.66, + "learning_rate": 5.366493891225415e-06, + "loss": 0.2457, + "step": 8378 + }, + { + "epoch": 0.66, + "learning_rate": 5.3642200905073914e-06, + "loss": 0.2579, + "step": 8379 + }, + { + "epoch": 0.66, + "learning_rate": 5.361946595033165e-06, + "loss": 0.3571, + "step": 8380 + }, + { + "epoch": 0.66, + "learning_rate": 5.359673404952442e-06, + "loss": 0.3401, + "step": 8381 + }, + { + "epoch": 0.66, + "learning_rate": 5.357400520414898e-06, + "loss": 0.3806, + "step": 8382 + }, + { + "epoch": 0.66, + "learning_rate": 5.355127941570191e-06, + "loss": 0.3646, + "step": 8383 + }, + { + "epoch": 0.66, + "learning_rate": 5.352855668567956e-06, + "loss": 0.2728, + "step": 8384 + }, + { + "epoch": 0.66, + "learning_rate": 5.350583701557816e-06, + "loss": 0.4264, + "step": 8385 + }, + { + "epoch": 0.66, + "learning_rate": 5.348312040689369e-06, + "loss": 0.2461, + "step": 8386 + }, + { + "epoch": 0.66, + "learning_rate": 5.346040686112189e-06, + "loss": 0.3328, + "step": 8387 + }, + { + "epoch": 0.66, + "learning_rate": 5.34376963797584e-06, + "loss": 0.3584, + "step": 8388 + }, + { + "epoch": 0.66, + "learning_rate": 5.3414988964298555e-06, + "loss": 0.308, + "step": 8389 + }, + { + "epoch": 0.66, + "learning_rate": 5.3392284616237486e-06, + "loss": 0.2983, + "step": 8390 + }, + { + "epoch": 0.66, + "learning_rate": 5.336958333707026e-06, + "loss": 0.3054, + "step": 8391 + }, + { + "epoch": 0.66, + "learning_rate": 5.33468851282916e-06, + "loss": 0.3273, + "step": 8392 + }, + { + "epoch": 0.66, + "learning_rate": 5.332418999139604e-06, + "loss": 0.4073, + "step": 8393 + }, + { + "epoch": 0.67, + "learning_rate": 5.330149792787801e-06, + "loss": 0.3553, + "step": 8394 + }, + { + "epoch": 0.67, + "learning_rate": 5.3278808939231654e-06, + "loss": 0.472, + "step": 8395 + }, + { + "epoch": 0.67, + "learning_rate": 5.32561230269509e-06, + "loss": 0.3474, + "step": 8396 + }, + { + "epoch": 0.67, + "learning_rate": 5.32334401925295e-06, + "loss": 0.3281, + "step": 8397 + }, + { + "epoch": 0.67, + "learning_rate": 5.321076043746108e-06, + "loss": 0.4564, + "step": 8398 + }, + { + "epoch": 0.67, + "learning_rate": 5.318808376323895e-06, + "loss": 0.3553, + "step": 8399 + }, + { + "epoch": 0.67, + "learning_rate": 5.316541017135622e-06, + "loss": 0.3678, + "step": 8400 + }, + { + "epoch": 0.67, + "learning_rate": 5.314273966330591e-06, + "loss": 0.4128, + "step": 8401 + }, + { + "epoch": 0.67, + "learning_rate": 5.3120072240580735e-06, + "loss": 0.4899, + "step": 8402 + }, + { + "epoch": 0.67, + "learning_rate": 5.309740790467319e-06, + "loss": 0.3757, + "step": 8403 + }, + { + "epoch": 0.67, + "learning_rate": 5.307474665707569e-06, + "loss": 0.3052, + "step": 8404 + }, + { + "epoch": 0.67, + "learning_rate": 5.305208849928034e-06, + "loss": 0.2589, + "step": 8405 + }, + { + "epoch": 0.67, + "learning_rate": 5.302943343277902e-06, + "loss": 0.3981, + "step": 8406 + }, + { + "epoch": 0.67, + "learning_rate": 5.300678145906354e-06, + "loss": 0.4549, + "step": 8407 + }, + { + "epoch": 0.67, + "learning_rate": 5.298413257962538e-06, + "loss": 0.4773, + "step": 8408 + }, + { + "epoch": 0.67, + "learning_rate": 5.296148679595583e-06, + "loss": 0.2993, + "step": 8409 + }, + { + "epoch": 0.67, + "learning_rate": 5.293884410954608e-06, + "loss": 0.3433, + "step": 8410 + }, + { + "epoch": 0.67, + "learning_rate": 5.291620452188699e-06, + "loss": 0.331, + "step": 8411 + }, + { + "epoch": 0.67, + "learning_rate": 5.28935680344693e-06, + "loss": 0.2596, + "step": 8412 + }, + { + "epoch": 0.67, + "learning_rate": 5.287093464878343e-06, + "loss": 0.3207, + "step": 8413 + }, + { + "epoch": 0.67, + "learning_rate": 5.28483043663198e-06, + "loss": 0.3818, + "step": 8414 + }, + { + "epoch": 0.67, + "learning_rate": 5.282567718856845e-06, + "loss": 0.2782, + "step": 8415 + }, + { + "epoch": 0.67, + "learning_rate": 5.280305311701921e-06, + "loss": 0.3766, + "step": 8416 + }, + { + "epoch": 0.67, + "learning_rate": 5.278043215316189e-06, + "loss": 0.4211, + "step": 8417 + }, + { + "epoch": 0.67, + "learning_rate": 5.275781429848589e-06, + "loss": 0.4446, + "step": 8418 + }, + { + "epoch": 0.67, + "learning_rate": 5.273519955448047e-06, + "loss": 0.2886, + "step": 8419 + }, + { + "epoch": 0.67, + "learning_rate": 5.271258792263476e-06, + "loss": 0.2133, + "step": 8420 + }, + { + "epoch": 0.67, + "learning_rate": 5.268997940443762e-06, + "loss": 0.3058, + "step": 8421 + }, + { + "epoch": 0.67, + "learning_rate": 5.266737400137765e-06, + "loss": 0.3063, + "step": 8422 + }, + { + "epoch": 0.67, + "learning_rate": 5.26447717149434e-06, + "loss": 0.4532, + "step": 8423 + }, + { + "epoch": 0.67, + "learning_rate": 5.2622172546623055e-06, + "loss": 0.4175, + "step": 8424 + }, + { + "epoch": 0.67, + "learning_rate": 5.259957649790466e-06, + "loss": 0.3401, + "step": 8425 + }, + { + "epoch": 0.67, + "learning_rate": 5.257698357027609e-06, + "loss": 0.3774, + "step": 8426 + }, + { + "epoch": 0.67, + "learning_rate": 5.2554393765225e-06, + "loss": 0.3027, + "step": 8427 + }, + { + "epoch": 0.67, + "learning_rate": 5.253180708423877e-06, + "loss": 0.2585, + "step": 8428 + }, + { + "epoch": 0.67, + "learning_rate": 5.25092235288046e-06, + "loss": 0.3667, + "step": 8429 + }, + { + "epoch": 0.67, + "learning_rate": 5.248664310040958e-06, + "loss": 0.3928, + "step": 8430 + }, + { + "epoch": 0.67, + "learning_rate": 5.246406580054051e-06, + "loss": 0.4622, + "step": 8431 + }, + { + "epoch": 0.67, + "learning_rate": 5.244149163068394e-06, + "loss": 0.3479, + "step": 8432 + }, + { + "epoch": 0.67, + "learning_rate": 5.241892059232634e-06, + "loss": 0.4028, + "step": 8433 + }, + { + "epoch": 0.67, + "learning_rate": 5.239635268695386e-06, + "loss": 0.4869, + "step": 8434 + }, + { + "epoch": 0.67, + "learning_rate": 5.237378791605249e-06, + "loss": 0.2607, + "step": 8435 + }, + { + "epoch": 0.67, + "learning_rate": 5.235122628110805e-06, + "loss": 0.3397, + "step": 8436 + }, + { + "epoch": 0.67, + "learning_rate": 5.232866778360608e-06, + "loss": 0.2961, + "step": 8437 + }, + { + "epoch": 0.67, + "learning_rate": 5.230611242503193e-06, + "loss": 0.447, + "step": 8438 + }, + { + "epoch": 0.67, + "learning_rate": 5.228356020687082e-06, + "loss": 0.2943, + "step": 8439 + }, + { + "epoch": 0.67, + "learning_rate": 5.226101113060769e-06, + "loss": 0.4684, + "step": 8440 + }, + { + "epoch": 0.67, + "learning_rate": 5.223846519772722e-06, + "loss": 0.2466, + "step": 8441 + }, + { + "epoch": 0.67, + "learning_rate": 5.221592240971403e-06, + "loss": 0.268, + "step": 8442 + }, + { + "epoch": 0.67, + "learning_rate": 5.219338276805243e-06, + "loss": 0.3941, + "step": 8443 + }, + { + "epoch": 0.67, + "learning_rate": 5.217084627422656e-06, + "loss": 0.3054, + "step": 8444 + }, + { + "epoch": 0.67, + "learning_rate": 5.214831292972027e-06, + "loss": 0.405, + "step": 8445 + }, + { + "epoch": 0.67, + "learning_rate": 5.212578273601738e-06, + "loss": 0.3351, + "step": 8446 + }, + { + "epoch": 0.67, + "learning_rate": 5.210325569460133e-06, + "loss": 0.2263, + "step": 8447 + }, + { + "epoch": 0.67, + "learning_rate": 5.208073180695538e-06, + "loss": 0.4156, + "step": 8448 + }, + { + "epoch": 0.67, + "learning_rate": 5.205821107456273e-06, + "loss": 0.3713, + "step": 8449 + }, + { + "epoch": 0.67, + "learning_rate": 5.203569349890618e-06, + "loss": 0.3272, + "step": 8450 + }, + { + "epoch": 0.67, + "learning_rate": 5.201317908146843e-06, + "loss": 0.4154, + "step": 8451 + }, + { + "epoch": 0.67, + "learning_rate": 5.199066782373194e-06, + "loss": 0.2781, + "step": 8452 + }, + { + "epoch": 0.67, + "learning_rate": 5.196815972717897e-06, + "loss": 0.3432, + "step": 8453 + }, + { + "epoch": 0.67, + "learning_rate": 5.194565479329154e-06, + "loss": 0.3251, + "step": 8454 + }, + { + "epoch": 0.67, + "learning_rate": 5.192315302355153e-06, + "loss": 0.4063, + "step": 8455 + }, + { + "epoch": 0.67, + "learning_rate": 5.190065441944059e-06, + "loss": 0.3937, + "step": 8456 + }, + { + "epoch": 0.67, + "learning_rate": 5.187815898244006e-06, + "loss": 0.3223, + "step": 8457 + }, + { + "epoch": 0.67, + "learning_rate": 5.185566671403126e-06, + "loss": 0.4383, + "step": 8458 + }, + { + "epoch": 0.67, + "learning_rate": 5.183317761569515e-06, + "loss": 0.3899, + "step": 8459 + }, + { + "epoch": 0.67, + "learning_rate": 5.181069168891248e-06, + "loss": 0.2959, + "step": 8460 + }, + { + "epoch": 0.67, + "learning_rate": 5.178820893516394e-06, + "loss": 0.2379, + "step": 8461 + }, + { + "epoch": 0.67, + "learning_rate": 5.176572935592986e-06, + "loss": 0.3674, + "step": 8462 + }, + { + "epoch": 0.67, + "learning_rate": 5.1743252952690385e-06, + "loss": 0.4483, + "step": 8463 + }, + { + "epoch": 0.67, + "learning_rate": 5.172077972692553e-06, + "loss": 0.4111, + "step": 8464 + }, + { + "epoch": 0.67, + "learning_rate": 5.1698309680115024e-06, + "loss": 0.4129, + "step": 8465 + }, + { + "epoch": 0.67, + "learning_rate": 5.167584281373838e-06, + "loss": 0.5219, + "step": 8466 + }, + { + "epoch": 0.67, + "learning_rate": 5.165337912927502e-06, + "loss": 0.232, + "step": 8467 + }, + { + "epoch": 0.67, + "learning_rate": 5.1630918628204e-06, + "loss": 0.3013, + "step": 8468 + }, + { + "epoch": 0.67, + "learning_rate": 5.1608461312004245e-06, + "loss": 0.3707, + "step": 8469 + }, + { + "epoch": 0.67, + "learning_rate": 5.158600718215443e-06, + "loss": 0.3188, + "step": 8470 + }, + { + "epoch": 0.67, + "learning_rate": 5.156355624013314e-06, + "loss": 0.3035, + "step": 8471 + }, + { + "epoch": 0.67, + "learning_rate": 5.15411084874186e-06, + "loss": 0.3842, + "step": 8472 + }, + { + "epoch": 0.67, + "learning_rate": 5.151866392548886e-06, + "loss": 0.3588, + "step": 8473 + }, + { + "epoch": 0.67, + "learning_rate": 5.149622255582185e-06, + "loss": 0.4037, + "step": 8474 + }, + { + "epoch": 0.67, + "learning_rate": 5.147378437989522e-06, + "loss": 0.3125, + "step": 8475 + }, + { + "epoch": 0.67, + "learning_rate": 5.145134939918634e-06, + "loss": 0.3311, + "step": 8476 + }, + { + "epoch": 0.67, + "learning_rate": 5.1428917615172555e-06, + "loss": 0.4467, + "step": 8477 + }, + { + "epoch": 0.67, + "learning_rate": 5.140648902933083e-06, + "loss": 0.3685, + "step": 8478 + }, + { + "epoch": 0.67, + "learning_rate": 5.138406364313795e-06, + "loss": 0.3139, + "step": 8479 + }, + { + "epoch": 0.67, + "learning_rate": 5.136164145807059e-06, + "loss": 0.3319, + "step": 8480 + }, + { + "epoch": 0.67, + "learning_rate": 5.13392224756051e-06, + "loss": 0.4355, + "step": 8481 + }, + { + "epoch": 0.67, + "learning_rate": 5.131680669721768e-06, + "loss": 0.368, + "step": 8482 + }, + { + "epoch": 0.67, + "learning_rate": 5.129439412438424e-06, + "loss": 0.3861, + "step": 8483 + }, + { + "epoch": 0.67, + "learning_rate": 5.127198475858064e-06, + "loss": 0.4346, + "step": 8484 + }, + { + "epoch": 0.67, + "learning_rate": 5.124957860128237e-06, + "loss": 0.3076, + "step": 8485 + }, + { + "epoch": 0.67, + "learning_rate": 5.122717565396474e-06, + "loss": 0.399, + "step": 8486 + }, + { + "epoch": 0.67, + "learning_rate": 5.1204775918102955e-06, + "loss": 0.4051, + "step": 8487 + }, + { + "epoch": 0.67, + "learning_rate": 5.11823793951719e-06, + "loss": 0.3023, + "step": 8488 + }, + { + "epoch": 0.67, + "learning_rate": 5.115998608664621e-06, + "loss": 0.3812, + "step": 8489 + }, + { + "epoch": 0.67, + "learning_rate": 5.1137595994000475e-06, + "loss": 0.2618, + "step": 8490 + }, + { + "epoch": 0.67, + "learning_rate": 5.111520911870894e-06, + "loss": 0.2815, + "step": 8491 + }, + { + "epoch": 0.67, + "learning_rate": 5.109282546224563e-06, + "loss": 0.4053, + "step": 8492 + }, + { + "epoch": 0.67, + "learning_rate": 5.107044502608447e-06, + "loss": 0.4307, + "step": 8493 + }, + { + "epoch": 0.67, + "learning_rate": 5.104806781169906e-06, + "loss": 0.3451, + "step": 8494 + }, + { + "epoch": 0.67, + "learning_rate": 5.102569382056281e-06, + "loss": 0.4148, + "step": 8495 + }, + { + "epoch": 0.67, + "learning_rate": 5.100332305414902e-06, + "loss": 0.2126, + "step": 8496 + }, + { + "epoch": 0.67, + "learning_rate": 5.098095551393066e-06, + "loss": 0.4334, + "step": 8497 + }, + { + "epoch": 0.67, + "learning_rate": 5.095859120138049e-06, + "loss": 0.2991, + "step": 8498 + }, + { + "epoch": 0.67, + "learning_rate": 5.093623011797108e-06, + "loss": 0.2848, + "step": 8499 + }, + { + "epoch": 0.67, + "learning_rate": 5.091387226517489e-06, + "loss": 0.4375, + "step": 8500 + }, + { + "epoch": 0.67, + "learning_rate": 5.089151764446403e-06, + "loss": 0.2731, + "step": 8501 + }, + { + "epoch": 0.67, + "learning_rate": 5.086916625731038e-06, + "loss": 0.2512, + "step": 8502 + }, + { + "epoch": 0.67, + "learning_rate": 5.084681810518577e-06, + "loss": 0.301, + "step": 8503 + }, + { + "epoch": 0.67, + "learning_rate": 5.0824473189561695e-06, + "loss": 0.3084, + "step": 8504 + }, + { + "epoch": 0.67, + "learning_rate": 5.080213151190938e-06, + "loss": 0.2711, + "step": 8505 + }, + { + "epoch": 0.67, + "learning_rate": 5.077979307370004e-06, + "loss": 0.2909, + "step": 8506 + }, + { + "epoch": 0.67, + "learning_rate": 5.075745787640448e-06, + "loss": 0.4373, + "step": 8507 + }, + { + "epoch": 0.67, + "learning_rate": 5.073512592149334e-06, + "loss": 0.3263, + "step": 8508 + }, + { + "epoch": 0.67, + "learning_rate": 5.071279721043716e-06, + "loss": 0.257, + "step": 8509 + }, + { + "epoch": 0.67, + "learning_rate": 5.069047174470613e-06, + "loss": 0.4659, + "step": 8510 + }, + { + "epoch": 0.67, + "learning_rate": 5.066814952577021e-06, + "loss": 0.3662, + "step": 8511 + }, + { + "epoch": 0.67, + "learning_rate": 5.064583055509935e-06, + "loss": 0.4112, + "step": 8512 + }, + { + "epoch": 0.67, + "learning_rate": 5.062351483416304e-06, + "loss": 0.3267, + "step": 8513 + }, + { + "epoch": 0.67, + "learning_rate": 5.060120236443071e-06, + "loss": 0.3148, + "step": 8514 + }, + { + "epoch": 0.67, + "learning_rate": 5.057889314737148e-06, + "loss": 0.3743, + "step": 8515 + }, + { + "epoch": 0.67, + "learning_rate": 5.055658718445435e-06, + "loss": 0.3564, + "step": 8516 + }, + { + "epoch": 0.67, + "learning_rate": 5.053428447714806e-06, + "loss": 0.4191, + "step": 8517 + }, + { + "epoch": 0.67, + "learning_rate": 5.05119850269211e-06, + "loss": 0.3367, + "step": 8518 + }, + { + "epoch": 0.67, + "learning_rate": 5.048968883524182e-06, + "loss": 0.3209, + "step": 8519 + }, + { + "epoch": 0.67, + "learning_rate": 5.046739590357832e-06, + "loss": 0.3253, + "step": 8520 + }, + { + "epoch": 0.68, + "learning_rate": 5.044510623339842e-06, + "loss": 0.3663, + "step": 8521 + }, + { + "epoch": 0.68, + "learning_rate": 5.042281982616986e-06, + "loss": 0.3932, + "step": 8522 + }, + { + "epoch": 0.68, + "learning_rate": 5.0400536683360064e-06, + "loss": 0.3677, + "step": 8523 + }, + { + "epoch": 0.68, + "learning_rate": 5.037825680643624e-06, + "loss": 0.3333, + "step": 8524 + }, + { + "epoch": 0.68, + "learning_rate": 5.035598019686549e-06, + "loss": 0.3113, + "step": 8525 + }, + { + "epoch": 0.68, + "learning_rate": 5.033370685611456e-06, + "loss": 0.3857, + "step": 8526 + }, + { + "epoch": 0.68, + "learning_rate": 5.031143678565005e-06, + "loss": 0.3906, + "step": 8527 + }, + { + "epoch": 0.68, + "learning_rate": 5.028916998693831e-06, + "loss": 0.3165, + "step": 8528 + }, + { + "epoch": 0.68, + "learning_rate": 5.02669064614456e-06, + "loss": 0.3585, + "step": 8529 + }, + { + "epoch": 0.68, + "learning_rate": 5.024464621063773e-06, + "loss": 0.4815, + "step": 8530 + }, + { + "epoch": 0.68, + "learning_rate": 5.022238923598055e-06, + "loss": 0.2836, + "step": 8531 + }, + { + "epoch": 0.68, + "learning_rate": 5.020013553893952e-06, + "loss": 0.3653, + "step": 8532 + }, + { + "epoch": 0.68, + "learning_rate": 5.017788512097989e-06, + "loss": 0.3197, + "step": 8533 + }, + { + "epoch": 0.68, + "learning_rate": 5.015563798356684e-06, + "loss": 0.3328, + "step": 8534 + }, + { + "epoch": 0.68, + "learning_rate": 5.0133394128165204e-06, + "loss": 0.3374, + "step": 8535 + }, + { + "epoch": 0.68, + "learning_rate": 5.011115355623957e-06, + "loss": 0.3334, + "step": 8536 + }, + { + "epoch": 0.68, + "learning_rate": 5.008891626925447e-06, + "loss": 0.2946, + "step": 8537 + }, + { + "epoch": 0.68, + "learning_rate": 5.006668226867407e-06, + "loss": 0.2331, + "step": 8538 + }, + { + "epoch": 0.68, + "learning_rate": 5.004445155596238e-06, + "loss": 0.3653, + "step": 8539 + }, + { + "epoch": 0.68, + "learning_rate": 5.0022224132583154e-06, + "loss": 0.1861, + "step": 8540 + }, + { + "epoch": 0.68, + "learning_rate": 5.000000000000003e-06, + "loss": 0.2223, + "step": 8541 + }, + { + "epoch": 0.68, + "learning_rate": 4.997777915967631e-06, + "loss": 0.3561, + "step": 8542 + }, + { + "epoch": 0.68, + "learning_rate": 4.995556161307511e-06, + "loss": 0.3757, + "step": 8543 + }, + { + "epoch": 0.68, + "learning_rate": 4.993334736165941e-06, + "loss": 0.2599, + "step": 8544 + }, + { + "epoch": 0.68, + "learning_rate": 4.991113640689189e-06, + "loss": 0.2489, + "step": 8545 + }, + { + "epoch": 0.68, + "learning_rate": 4.988892875023499e-06, + "loss": 0.5149, + "step": 8546 + }, + { + "epoch": 0.68, + "learning_rate": 4.9866724393151044e-06, + "loss": 0.4494, + "step": 8547 + }, + { + "epoch": 0.68, + "learning_rate": 4.984452333710207e-06, + "loss": 0.2551, + "step": 8548 + }, + { + "epoch": 0.68, + "learning_rate": 4.982232558354986e-06, + "loss": 0.3241, + "step": 8549 + }, + { + "epoch": 0.68, + "learning_rate": 4.980013113395612e-06, + "loss": 0.2463, + "step": 8550 + }, + { + "epoch": 0.68, + "learning_rate": 4.9777939989782185e-06, + "loss": 0.3463, + "step": 8551 + }, + { + "epoch": 0.68, + "learning_rate": 4.975575215248926e-06, + "loss": 0.3286, + "step": 8552 + }, + { + "epoch": 0.68, + "learning_rate": 4.9733567623538245e-06, + "loss": 0.4202, + "step": 8553 + }, + { + "epoch": 0.68, + "learning_rate": 4.9711386404389995e-06, + "loss": 0.2571, + "step": 8554 + }, + { + "epoch": 0.68, + "learning_rate": 4.968920849650496e-06, + "loss": 0.3657, + "step": 8555 + }, + { + "epoch": 0.68, + "learning_rate": 4.966703390134343e-06, + "loss": 0.2954, + "step": 8556 + }, + { + "epoch": 0.68, + "learning_rate": 4.964486262036557e-06, + "loss": 0.2899, + "step": 8557 + }, + { + "epoch": 0.68, + "learning_rate": 4.962269465503121e-06, + "loss": 0.3942, + "step": 8558 + }, + { + "epoch": 0.68, + "learning_rate": 4.960053000679997e-06, + "loss": 0.4054, + "step": 8559 + }, + { + "epoch": 0.68, + "learning_rate": 4.957836867713138e-06, + "loss": 0.3036, + "step": 8560 + }, + { + "epoch": 0.68, + "learning_rate": 4.955621066748457e-06, + "loss": 0.2966, + "step": 8561 + }, + { + "epoch": 0.68, + "learning_rate": 4.953405597931854e-06, + "loss": 0.3632, + "step": 8562 + }, + { + "epoch": 0.68, + "learning_rate": 4.951190461409214e-06, + "loss": 0.4405, + "step": 8563 + }, + { + "epoch": 0.68, + "learning_rate": 4.948975657326388e-06, + "loss": 0.2373, + "step": 8564 + }, + { + "epoch": 0.68, + "learning_rate": 4.946761185829208e-06, + "loss": 0.4678, + "step": 8565 + }, + { + "epoch": 0.68, + "learning_rate": 4.944547047063493e-06, + "loss": 0.3794, + "step": 8566 + }, + { + "epoch": 0.68, + "learning_rate": 4.942333241175029e-06, + "loss": 0.333, + "step": 8567 + }, + { + "epoch": 0.68, + "learning_rate": 4.940119768309585e-06, + "loss": 0.3577, + "step": 8568 + }, + { + "epoch": 0.68, + "learning_rate": 4.937906628612905e-06, + "loss": 0.3972, + "step": 8569 + }, + { + "epoch": 0.68, + "learning_rate": 4.93569382223072e-06, + "loss": 0.356, + "step": 8570 + }, + { + "epoch": 0.68, + "learning_rate": 4.933481349308728e-06, + "loss": 0.2686, + "step": 8571 + }, + { + "epoch": 0.68, + "learning_rate": 4.931269209992607e-06, + "loss": 0.2635, + "step": 8572 + }, + { + "epoch": 0.68, + "learning_rate": 4.929057404428023e-06, + "loss": 0.3562, + "step": 8573 + }, + { + "epoch": 0.68, + "learning_rate": 4.926845932760609e-06, + "loss": 0.255, + "step": 8574 + }, + { + "epoch": 0.68, + "learning_rate": 4.924634795135976e-06, + "loss": 0.2946, + "step": 8575 + }, + { + "epoch": 0.68, + "learning_rate": 4.922423991699725e-06, + "loss": 0.3081, + "step": 8576 + }, + { + "epoch": 0.68, + "learning_rate": 4.920213522597422e-06, + "loss": 0.3238, + "step": 8577 + }, + { + "epoch": 0.68, + "learning_rate": 4.918003387974614e-06, + "loss": 0.3671, + "step": 8578 + }, + { + "epoch": 0.68, + "learning_rate": 4.915793587976832e-06, + "loss": 0.2945, + "step": 8579 + }, + { + "epoch": 0.68, + "learning_rate": 4.913584122749578e-06, + "loss": 0.4275, + "step": 8580 + }, + { + "epoch": 0.68, + "learning_rate": 4.911374992438334e-06, + "loss": 0.3187, + "step": 8581 + }, + { + "epoch": 0.68, + "learning_rate": 4.909166197188563e-06, + "loss": 0.2492, + "step": 8582 + }, + { + "epoch": 0.68, + "learning_rate": 4.906957737145703e-06, + "loss": 0.3142, + "step": 8583 + }, + { + "epoch": 0.68, + "learning_rate": 4.904749612455171e-06, + "loss": 0.3794, + "step": 8584 + }, + { + "epoch": 0.68, + "learning_rate": 4.902541823262356e-06, + "loss": 0.3594, + "step": 8585 + }, + { + "epoch": 0.68, + "learning_rate": 4.900334369712637e-06, + "loss": 0.324, + "step": 8586 + }, + { + "epoch": 0.68, + "learning_rate": 4.898127251951363e-06, + "loss": 0.4116, + "step": 8587 + }, + { + "epoch": 0.68, + "learning_rate": 4.895920470123857e-06, + "loss": 0.3144, + "step": 8588 + }, + { + "epoch": 0.68, + "learning_rate": 4.893714024375432e-06, + "loss": 0.4516, + "step": 8589 + }, + { + "epoch": 0.68, + "learning_rate": 4.89150791485137e-06, + "loss": 0.3444, + "step": 8590 + }, + { + "epoch": 0.68, + "learning_rate": 4.889302141696925e-06, + "loss": 0.3287, + "step": 8591 + }, + { + "epoch": 0.68, + "learning_rate": 4.88709670505735e-06, + "loss": 0.3211, + "step": 8592 + }, + { + "epoch": 0.68, + "learning_rate": 4.884891605077853e-06, + "loss": 0.3008, + "step": 8593 + }, + { + "epoch": 0.68, + "learning_rate": 4.882686841903627e-06, + "loss": 0.3979, + "step": 8594 + }, + { + "epoch": 0.68, + "learning_rate": 4.8804824156798544e-06, + "loss": 0.3046, + "step": 8595 + }, + { + "epoch": 0.68, + "learning_rate": 4.878278326551682e-06, + "loss": 0.3071, + "step": 8596 + }, + { + "epoch": 0.68, + "learning_rate": 4.876074574664232e-06, + "loss": 0.2671, + "step": 8597 + }, + { + "epoch": 0.68, + "learning_rate": 4.873871160162622e-06, + "loss": 0.3031, + "step": 8598 + }, + { + "epoch": 0.68, + "learning_rate": 4.871668083191931e-06, + "loss": 0.3542, + "step": 8599 + }, + { + "epoch": 0.68, + "learning_rate": 4.8694653438972195e-06, + "loss": 0.3023, + "step": 8600 + }, + { + "epoch": 0.68, + "learning_rate": 4.867262942423525e-06, + "loss": 0.3336, + "step": 8601 + }, + { + "epoch": 0.68, + "learning_rate": 4.865060878915873e-06, + "loss": 0.3482, + "step": 8602 + }, + { + "epoch": 0.68, + "learning_rate": 4.862859153519252e-06, + "loss": 0.4979, + "step": 8603 + }, + { + "epoch": 0.68, + "learning_rate": 4.860657766378637e-06, + "loss": 0.4289, + "step": 8604 + }, + { + "epoch": 0.68, + "learning_rate": 4.858456717638981e-06, + "loss": 0.2131, + "step": 8605 + }, + { + "epoch": 0.68, + "learning_rate": 4.856256007445211e-06, + "loss": 0.1931, + "step": 8606 + }, + { + "epoch": 0.68, + "learning_rate": 4.8540556359422335e-06, + "loss": 0.3515, + "step": 8607 + }, + { + "epoch": 0.68, + "learning_rate": 4.85185560327493e-06, + "loss": 0.2649, + "step": 8608 + }, + { + "epoch": 0.68, + "learning_rate": 4.849655909588165e-06, + "loss": 0.3549, + "step": 8609 + }, + { + "epoch": 0.68, + "learning_rate": 4.847456555026773e-06, + "loss": 0.3572, + "step": 8610 + }, + { + "epoch": 0.68, + "learning_rate": 4.845257539735577e-06, + "loss": 0.285, + "step": 8611 + }, + { + "epoch": 0.68, + "learning_rate": 4.843058863859369e-06, + "loss": 0.353, + "step": 8612 + }, + { + "epoch": 0.68, + "learning_rate": 4.840860527542919e-06, + "loss": 0.3043, + "step": 8613 + }, + { + "epoch": 0.68, + "learning_rate": 4.838662530930981e-06, + "loss": 0.2703, + "step": 8614 + }, + { + "epoch": 0.68, + "learning_rate": 4.836464874168282e-06, + "loss": 0.418, + "step": 8615 + }, + { + "epoch": 0.68, + "learning_rate": 4.834267557399521e-06, + "loss": 0.3369, + "step": 8616 + }, + { + "epoch": 0.68, + "learning_rate": 4.832070580769389e-06, + "loss": 0.333, + "step": 8617 + }, + { + "epoch": 0.68, + "learning_rate": 4.829873944422544e-06, + "loss": 0.3154, + "step": 8618 + }, + { + "epoch": 0.68, + "learning_rate": 4.8276776485036185e-06, + "loss": 0.3784, + "step": 8619 + }, + { + "epoch": 0.68, + "learning_rate": 4.825481693157235e-06, + "loss": 0.4263, + "step": 8620 + }, + { + "epoch": 0.68, + "learning_rate": 4.823286078527984e-06, + "loss": 0.3096, + "step": 8621 + }, + { + "epoch": 0.68, + "learning_rate": 4.8210908047604336e-06, + "loss": 0.3891, + "step": 8622 + }, + { + "epoch": 0.68, + "learning_rate": 4.818895871999136e-06, + "loss": 0.3114, + "step": 8623 + }, + { + "epoch": 0.68, + "learning_rate": 4.816701280388617e-06, + "loss": 0.2782, + "step": 8624 + }, + { + "epoch": 0.68, + "learning_rate": 4.814507030073377e-06, + "loss": 0.2934, + "step": 8625 + }, + { + "epoch": 0.68, + "learning_rate": 4.812313121197896e-06, + "loss": 0.3367, + "step": 8626 + }, + { + "epoch": 0.68, + "learning_rate": 4.810119553906637e-06, + "loss": 0.3617, + "step": 8627 + }, + { + "epoch": 0.68, + "learning_rate": 4.807926328344033e-06, + "loss": 0.3086, + "step": 8628 + }, + { + "epoch": 0.68, + "learning_rate": 4.805733444654496e-06, + "loss": 0.3131, + "step": 8629 + }, + { + "epoch": 0.68, + "learning_rate": 4.8035409029824195e-06, + "loss": 0.2467, + "step": 8630 + }, + { + "epoch": 0.68, + "learning_rate": 4.801348703472173e-06, + "loss": 0.3664, + "step": 8631 + }, + { + "epoch": 0.68, + "learning_rate": 4.7991568462680945e-06, + "loss": 0.3282, + "step": 8632 + }, + { + "epoch": 0.68, + "learning_rate": 4.796965331514517e-06, + "loss": 0.2674, + "step": 8633 + }, + { + "epoch": 0.68, + "learning_rate": 4.794774159355737e-06, + "loss": 0.263, + "step": 8634 + }, + { + "epoch": 0.68, + "learning_rate": 4.79258332993603e-06, + "loss": 0.4334, + "step": 8635 + }, + { + "epoch": 0.68, + "learning_rate": 4.7903928433996576e-06, + "loss": 0.2919, + "step": 8636 + }, + { + "epoch": 0.68, + "learning_rate": 4.788202699890848e-06, + "loss": 0.313, + "step": 8637 + }, + { + "epoch": 0.68, + "learning_rate": 4.786012899553815e-06, + "loss": 0.436, + "step": 8638 + }, + { + "epoch": 0.68, + "learning_rate": 4.783823442532739e-06, + "loss": 0.3719, + "step": 8639 + }, + { + "epoch": 0.68, + "learning_rate": 4.781634328971796e-06, + "loss": 0.4176, + "step": 8640 + }, + { + "epoch": 0.68, + "learning_rate": 4.779445559015122e-06, + "loss": 0.2888, + "step": 8641 + }, + { + "epoch": 0.68, + "learning_rate": 4.777257132806835e-06, + "loss": 0.2828, + "step": 8642 + }, + { + "epoch": 0.68, + "learning_rate": 4.775069050491039e-06, + "loss": 0.2151, + "step": 8643 + }, + { + "epoch": 0.68, + "learning_rate": 4.772881312211805e-06, + "loss": 0.3745, + "step": 8644 + }, + { + "epoch": 0.68, + "learning_rate": 4.770693918113183e-06, + "loss": 0.2559, + "step": 8645 + }, + { + "epoch": 0.68, + "learning_rate": 4.768506868339206e-06, + "loss": 0.3218, + "step": 8646 + }, + { + "epoch": 0.69, + "learning_rate": 4.766320163033882e-06, + "loss": 0.3135, + "step": 8647 + }, + { + "epoch": 0.69, + "learning_rate": 4.764133802341188e-06, + "loss": 0.3666, + "step": 8648 + }, + { + "epoch": 0.69, + "learning_rate": 4.761947786405092e-06, + "loss": 0.3688, + "step": 8649 + }, + { + "epoch": 0.69, + "learning_rate": 4.759762115369531e-06, + "loss": 0.3289, + "step": 8650 + }, + { + "epoch": 0.69, + "learning_rate": 4.7575767893784174e-06, + "loss": 0.2574, + "step": 8651 + }, + { + "epoch": 0.69, + "learning_rate": 4.755391808575651e-06, + "loss": 0.2979, + "step": 8652 + }, + { + "epoch": 0.69, + "learning_rate": 4.7532071731050975e-06, + "loss": 0.3916, + "step": 8653 + }, + { + "epoch": 0.69, + "learning_rate": 4.7510228831106064e-06, + "loss": 0.2908, + "step": 8654 + }, + { + "epoch": 0.69, + "learning_rate": 4.748838938735999e-06, + "loss": 0.4071, + "step": 8655 + }, + { + "epoch": 0.69, + "learning_rate": 4.746655340125082e-06, + "loss": 0.3016, + "step": 8656 + }, + { + "epoch": 0.69, + "learning_rate": 4.744472087421635e-06, + "loss": 0.2975, + "step": 8657 + }, + { + "epoch": 0.69, + "learning_rate": 4.74228918076941e-06, + "loss": 0.2487, + "step": 8658 + }, + { + "epoch": 0.69, + "learning_rate": 4.740106620312147e-06, + "loss": 0.3438, + "step": 8659 + }, + { + "epoch": 0.69, + "learning_rate": 4.737924406193554e-06, + "loss": 0.3609, + "step": 8660 + }, + { + "epoch": 0.69, + "learning_rate": 4.735742538557316e-06, + "loss": 0.2719, + "step": 8661 + }, + { + "epoch": 0.69, + "learning_rate": 4.733561017547104e-06, + "loss": 0.3542, + "step": 8662 + }, + { + "epoch": 0.69, + "learning_rate": 4.73137984330656e-06, + "loss": 0.3613, + "step": 8663 + }, + { + "epoch": 0.69, + "learning_rate": 4.729199015979298e-06, + "loss": 0.2209, + "step": 8664 + }, + { + "epoch": 0.69, + "learning_rate": 4.727018535708922e-06, + "loss": 0.2839, + "step": 8665 + }, + { + "epoch": 0.69, + "learning_rate": 4.724838402639006e-06, + "loss": 0.3774, + "step": 8666 + }, + { + "epoch": 0.69, + "learning_rate": 4.7226586169130925e-06, + "loss": 0.3578, + "step": 8667 + }, + { + "epoch": 0.69, + "learning_rate": 4.7204791786747215e-06, + "loss": 0.2793, + "step": 8668 + }, + { + "epoch": 0.69, + "learning_rate": 4.718300088067392e-06, + "loss": 0.3829, + "step": 8669 + }, + { + "epoch": 0.69, + "learning_rate": 4.716121345234589e-06, + "loss": 0.2884, + "step": 8670 + }, + { + "epoch": 0.69, + "learning_rate": 4.713942950319767e-06, + "loss": 0.3772, + "step": 8671 + }, + { + "epoch": 0.69, + "learning_rate": 4.71176490346637e-06, + "loss": 0.3755, + "step": 8672 + }, + { + "epoch": 0.69, + "learning_rate": 4.709587204817809e-06, + "loss": 0.2008, + "step": 8673 + }, + { + "epoch": 0.69, + "learning_rate": 4.707409854517471e-06, + "loss": 0.2868, + "step": 8674 + }, + { + "epoch": 0.69, + "learning_rate": 4.705232852708732e-06, + "loss": 0.4133, + "step": 8675 + }, + { + "epoch": 0.69, + "learning_rate": 4.703056199534933e-06, + "loss": 0.3785, + "step": 8676 + }, + { + "epoch": 0.69, + "learning_rate": 4.700879895139391e-06, + "loss": 0.2684, + "step": 8677 + }, + { + "epoch": 0.69, + "learning_rate": 4.698703939665414e-06, + "loss": 0.3368, + "step": 8678 + }, + { + "epoch": 0.69, + "learning_rate": 4.696528333256275e-06, + "loss": 0.3941, + "step": 8679 + }, + { + "epoch": 0.69, + "learning_rate": 4.694353076055222e-06, + "loss": 0.3322, + "step": 8680 + }, + { + "epoch": 0.69, + "learning_rate": 4.6921781682054954e-06, + "loss": 0.2126, + "step": 8681 + }, + { + "epoch": 0.69, + "learning_rate": 4.6900036098502956e-06, + "loss": 0.2907, + "step": 8682 + }, + { + "epoch": 0.69, + "learning_rate": 4.687829401132804e-06, + "loss": 0.3778, + "step": 8683 + }, + { + "epoch": 0.69, + "learning_rate": 4.685655542196194e-06, + "loss": 0.27, + "step": 8684 + }, + { + "epoch": 0.69, + "learning_rate": 4.6834820331835915e-06, + "loss": 0.4733, + "step": 8685 + }, + { + "epoch": 0.69, + "learning_rate": 4.681308874238112e-06, + "loss": 0.2395, + "step": 8686 + }, + { + "epoch": 0.69, + "learning_rate": 4.679136065502855e-06, + "loss": 0.3382, + "step": 8687 + }, + { + "epoch": 0.69, + "learning_rate": 4.676963607120886e-06, + "loss": 0.405, + "step": 8688 + }, + { + "epoch": 0.69, + "learning_rate": 4.674791499235246e-06, + "loss": 0.4409, + "step": 8689 + }, + { + "epoch": 0.69, + "learning_rate": 4.672619741988966e-06, + "loss": 0.2501, + "step": 8690 + }, + { + "epoch": 0.69, + "learning_rate": 4.670448335525043e-06, + "loss": 0.4708, + "step": 8691 + }, + { + "epoch": 0.69, + "learning_rate": 4.66827727998645e-06, + "loss": 0.2513, + "step": 8692 + }, + { + "epoch": 0.69, + "learning_rate": 4.666106575516146e-06, + "loss": 0.4421, + "step": 8693 + }, + { + "epoch": 0.69, + "learning_rate": 4.663936222257059e-06, + "loss": 0.273, + "step": 8694 + }, + { + "epoch": 0.69, + "learning_rate": 4.661766220352098e-06, + "loss": 0.3438, + "step": 8695 + }, + { + "epoch": 0.69, + "learning_rate": 4.659596569944139e-06, + "loss": 0.3222, + "step": 8696 + }, + { + "epoch": 0.69, + "learning_rate": 4.657427271176055e-06, + "loss": 0.3002, + "step": 8697 + }, + { + "epoch": 0.69, + "learning_rate": 4.655258324190678e-06, + "loss": 0.4341, + "step": 8698 + }, + { + "epoch": 0.69, + "learning_rate": 4.65308972913082e-06, + "loss": 0.4084, + "step": 8699 + }, + { + "epoch": 0.69, + "learning_rate": 4.6509214861392785e-06, + "loss": 0.3222, + "step": 8700 + }, + { + "epoch": 0.69, + "learning_rate": 4.648753595358818e-06, + "loss": 0.4007, + "step": 8701 + }, + { + "epoch": 0.69, + "learning_rate": 4.646586056932183e-06, + "loss": 0.3565, + "step": 8702 + }, + { + "epoch": 0.69, + "learning_rate": 4.6444188710021e-06, + "loss": 0.3043, + "step": 8703 + }, + { + "epoch": 0.69, + "learning_rate": 4.6422520377112646e-06, + "loss": 0.3775, + "step": 8704 + }, + { + "epoch": 0.69, + "learning_rate": 4.640085557202349e-06, + "loss": 0.3157, + "step": 8705 + }, + { + "epoch": 0.69, + "learning_rate": 4.637919429618014e-06, + "loss": 0.3041, + "step": 8706 + }, + { + "epoch": 0.69, + "learning_rate": 4.635753655100883e-06, + "loss": 0.2467, + "step": 8707 + }, + { + "epoch": 0.69, + "learning_rate": 4.633588233793559e-06, + "loss": 0.3913, + "step": 8708 + }, + { + "epoch": 0.69, + "learning_rate": 4.631423165838632e-06, + "loss": 0.2093, + "step": 8709 + }, + { + "epoch": 0.69, + "learning_rate": 4.629258451378658e-06, + "loss": 0.3479, + "step": 8710 + }, + { + "epoch": 0.69, + "learning_rate": 4.6270940905561725e-06, + "loss": 0.4234, + "step": 8711 + }, + { + "epoch": 0.69, + "learning_rate": 4.624930083513684e-06, + "loss": 0.2622, + "step": 8712 + }, + { + "epoch": 0.69, + "learning_rate": 4.62276643039369e-06, + "loss": 0.3286, + "step": 8713 + }, + { + "epoch": 0.69, + "learning_rate": 4.620603131338655e-06, + "loss": 0.3599, + "step": 8714 + }, + { + "epoch": 0.69, + "learning_rate": 4.6184401864910136e-06, + "loss": 0.4843, + "step": 8715 + }, + { + "epoch": 0.69, + "learning_rate": 4.616277595993196e-06, + "loss": 0.3023, + "step": 8716 + }, + { + "epoch": 0.69, + "learning_rate": 4.614115359987595e-06, + "loss": 0.3252, + "step": 8717 + }, + { + "epoch": 0.69, + "learning_rate": 4.6119534786165765e-06, + "loss": 0.3492, + "step": 8718 + }, + { + "epoch": 0.69, + "learning_rate": 4.609791952022501e-06, + "loss": 0.3382, + "step": 8719 + }, + { + "epoch": 0.69, + "learning_rate": 4.607630780347689e-06, + "loss": 0.3954, + "step": 8720 + }, + { + "epoch": 0.69, + "learning_rate": 4.60546996373444e-06, + "loss": 0.3365, + "step": 8721 + }, + { + "epoch": 0.69, + "learning_rate": 4.603309502325041e-06, + "loss": 0.383, + "step": 8722 + }, + { + "epoch": 0.69, + "learning_rate": 4.601149396261744e-06, + "loss": 0.3691, + "step": 8723 + }, + { + "epoch": 0.69, + "learning_rate": 4.598989645686782e-06, + "loss": 0.2209, + "step": 8724 + }, + { + "epoch": 0.69, + "learning_rate": 4.596830250742359e-06, + "loss": 0.3408, + "step": 8725 + }, + { + "epoch": 0.69, + "learning_rate": 4.594671211570671e-06, + "loss": 0.2548, + "step": 8726 + }, + { + "epoch": 0.69, + "learning_rate": 4.592512528313874e-06, + "loss": 0.3426, + "step": 8727 + }, + { + "epoch": 0.69, + "learning_rate": 4.590354201114103e-06, + "loss": 0.425, + "step": 8728 + }, + { + "epoch": 0.69, + "learning_rate": 4.588196230113483e-06, + "loss": 0.4425, + "step": 8729 + }, + { + "epoch": 0.69, + "learning_rate": 4.586038615454102e-06, + "loss": 0.3723, + "step": 8730 + }, + { + "epoch": 0.69, + "learning_rate": 4.583881357278023e-06, + "loss": 0.3336, + "step": 8731 + }, + { + "epoch": 0.69, + "learning_rate": 4.5817244557273e-06, + "loss": 0.3877, + "step": 8732 + }, + { + "epoch": 0.69, + "learning_rate": 4.5795679109439505e-06, + "loss": 0.3421, + "step": 8733 + }, + { + "epoch": 0.69, + "learning_rate": 4.57741172306997e-06, + "loss": 0.3963, + "step": 8734 + }, + { + "epoch": 0.69, + "learning_rate": 4.5752558922473376e-06, + "loss": 0.3619, + "step": 8735 + }, + { + "epoch": 0.69, + "learning_rate": 4.573100418618004e-06, + "loss": 0.3536, + "step": 8736 + }, + { + "epoch": 0.69, + "learning_rate": 4.57094530232389e-06, + "loss": 0.3651, + "step": 8737 + }, + { + "epoch": 0.69, + "learning_rate": 4.5687905435069106e-06, + "loss": 0.3708, + "step": 8738 + }, + { + "epoch": 0.69, + "learning_rate": 4.566636142308939e-06, + "loss": 0.399, + "step": 8739 + }, + { + "epoch": 0.69, + "learning_rate": 4.564482098871834e-06, + "loss": 0.3939, + "step": 8740 + }, + { + "epoch": 0.69, + "learning_rate": 4.562328413337426e-06, + "loss": 0.2723, + "step": 8741 + }, + { + "epoch": 0.69, + "learning_rate": 4.56017508584753e-06, + "loss": 0.3408, + "step": 8742 + }, + { + "epoch": 0.69, + "learning_rate": 4.558022116543931e-06, + "loss": 0.2895, + "step": 8743 + }, + { + "epoch": 0.69, + "learning_rate": 4.555869505568386e-06, + "loss": 0.3156, + "step": 8744 + }, + { + "epoch": 0.69, + "learning_rate": 4.553717253062643e-06, + "loss": 0.2951, + "step": 8745 + }, + { + "epoch": 0.69, + "learning_rate": 4.551565359168411e-06, + "loss": 0.2808, + "step": 8746 + }, + { + "epoch": 0.69, + "learning_rate": 4.549413824027382e-06, + "loss": 0.3832, + "step": 8747 + }, + { + "epoch": 0.69, + "learning_rate": 4.54726264778123e-06, + "loss": 0.4395, + "step": 8748 + }, + { + "epoch": 0.69, + "learning_rate": 4.5451118305715954e-06, + "loss": 0.3797, + "step": 8749 + }, + { + "epoch": 0.69, + "learning_rate": 4.542961372540096e-06, + "loss": 0.3133, + "step": 8750 + }, + { + "epoch": 0.69, + "learning_rate": 4.540811273828336e-06, + "loss": 0.3479, + "step": 8751 + }, + { + "epoch": 0.69, + "learning_rate": 4.538661534577886e-06, + "loss": 0.4155, + "step": 8752 + }, + { + "epoch": 0.69, + "learning_rate": 4.5365121549302916e-06, + "loss": 0.2925, + "step": 8753 + }, + { + "epoch": 0.69, + "learning_rate": 4.534363135027086e-06, + "loss": 0.3028, + "step": 8754 + }, + { + "epoch": 0.69, + "learning_rate": 4.532214475009771e-06, + "loss": 0.3329, + "step": 8755 + }, + { + "epoch": 0.69, + "learning_rate": 4.530066175019823e-06, + "loss": 0.4165, + "step": 8756 + }, + { + "epoch": 0.69, + "learning_rate": 4.527918235198692e-06, + "loss": 0.341, + "step": 8757 + }, + { + "epoch": 0.69, + "learning_rate": 4.525770655687821e-06, + "loss": 0.3737, + "step": 8758 + }, + { + "epoch": 0.69, + "learning_rate": 4.523623436628611e-06, + "loss": 0.4294, + "step": 8759 + }, + { + "epoch": 0.69, + "learning_rate": 4.521476578162445e-06, + "loss": 0.2685, + "step": 8760 + }, + { + "epoch": 0.69, + "learning_rate": 4.519330080430687e-06, + "loss": 0.3488, + "step": 8761 + }, + { + "epoch": 0.69, + "learning_rate": 4.517183943574673e-06, + "loss": 0.3087, + "step": 8762 + }, + { + "epoch": 0.69, + "learning_rate": 4.515038167735715e-06, + "loss": 0.4403, + "step": 8763 + }, + { + "epoch": 0.69, + "learning_rate": 4.5128927530551e-06, + "loss": 0.2745, + "step": 8764 + }, + { + "epoch": 0.69, + "learning_rate": 4.510747699674096e-06, + "loss": 0.1754, + "step": 8765 + }, + { + "epoch": 0.69, + "learning_rate": 4.50860300773394e-06, + "loss": 0.354, + "step": 8766 + }, + { + "epoch": 0.69, + "learning_rate": 4.506458677375856e-06, + "loss": 0.4173, + "step": 8767 + }, + { + "epoch": 0.69, + "learning_rate": 4.504314708741037e-06, + "loss": 0.4004, + "step": 8768 + }, + { + "epoch": 0.69, + "learning_rate": 4.502171101970645e-06, + "loss": 0.3504, + "step": 8769 + }, + { + "epoch": 0.69, + "learning_rate": 4.5000278572058365e-06, + "loss": 0.2478, + "step": 8770 + }, + { + "epoch": 0.69, + "learning_rate": 4.497884974587729e-06, + "loss": 0.2399, + "step": 8771 + }, + { + "epoch": 0.69, + "learning_rate": 4.495742454257418e-06, + "loss": 0.3452, + "step": 8772 + }, + { + "epoch": 0.7, + "learning_rate": 4.493600296355986e-06, + "loss": 0.3987, + "step": 8773 + }, + { + "epoch": 0.7, + "learning_rate": 4.491458501024479e-06, + "loss": 0.4622, + "step": 8774 + }, + { + "epoch": 0.7, + "learning_rate": 4.489317068403919e-06, + "loss": 0.2889, + "step": 8775 + }, + { + "epoch": 0.7, + "learning_rate": 4.487175998635319e-06, + "loss": 0.4114, + "step": 8776 + }, + { + "epoch": 0.7, + "learning_rate": 4.485035291859654e-06, + "loss": 0.3147, + "step": 8777 + }, + { + "epoch": 0.7, + "learning_rate": 4.482894948217875e-06, + "loss": 0.3011, + "step": 8778 + }, + { + "epoch": 0.7, + "learning_rate": 4.48075496785092e-06, + "loss": 0.2357, + "step": 8779 + }, + { + "epoch": 0.7, + "learning_rate": 4.4786153508996944e-06, + "loss": 0.2947, + "step": 8780 + }, + { + "epoch": 0.7, + "learning_rate": 4.47647609750508e-06, + "loss": 0.2722, + "step": 8781 + }, + { + "epoch": 0.7, + "learning_rate": 4.4743372078079335e-06, + "loss": 0.3747, + "step": 8782 + }, + { + "epoch": 0.7, + "learning_rate": 4.472198681949098e-06, + "loss": 0.2842, + "step": 8783 + }, + { + "epoch": 0.7, + "learning_rate": 4.470060520069381e-06, + "loss": 0.3371, + "step": 8784 + }, + { + "epoch": 0.7, + "learning_rate": 4.467922722309567e-06, + "loss": 0.3492, + "step": 8785 + }, + { + "epoch": 0.7, + "learning_rate": 4.465785288810427e-06, + "loss": 0.3741, + "step": 8786 + }, + { + "epoch": 0.7, + "learning_rate": 4.4636482197126965e-06, + "loss": 0.3379, + "step": 8787 + }, + { + "epoch": 0.7, + "learning_rate": 4.461511515157087e-06, + "loss": 0.2939, + "step": 8788 + }, + { + "epoch": 0.7, + "learning_rate": 4.459375175284299e-06, + "loss": 0.3315, + "step": 8789 + }, + { + "epoch": 0.7, + "learning_rate": 4.457239200234996e-06, + "loss": 0.4213, + "step": 8790 + }, + { + "epoch": 0.7, + "learning_rate": 4.4551035901498186e-06, + "loss": 0.3721, + "step": 8791 + }, + { + "epoch": 0.7, + "learning_rate": 4.4529683451693916e-06, + "loss": 0.3291, + "step": 8792 + }, + { + "epoch": 0.7, + "learning_rate": 4.45083346543431e-06, + "loss": 0.3356, + "step": 8793 + }, + { + "epoch": 0.7, + "learning_rate": 4.448698951085143e-06, + "loss": 0.3279, + "step": 8794 + }, + { + "epoch": 0.7, + "learning_rate": 4.446564802262435e-06, + "loss": 0.2849, + "step": 8795 + }, + { + "epoch": 0.7, + "learning_rate": 4.444431019106718e-06, + "loss": 0.3881, + "step": 8796 + }, + { + "epoch": 0.7, + "learning_rate": 4.4422976017584866e-06, + "loss": 0.4166, + "step": 8797 + }, + { + "epoch": 0.7, + "learning_rate": 4.440164550358212e-06, + "loss": 0.2788, + "step": 8798 + }, + { + "epoch": 0.7, + "learning_rate": 4.438031865046353e-06, + "loss": 0.2628, + "step": 8799 + }, + { + "epoch": 0.7, + "learning_rate": 4.435899545963333e-06, + "loss": 0.3327, + "step": 8800 + }, + { + "epoch": 0.7, + "learning_rate": 4.4337675932495515e-06, + "loss": 0.2938, + "step": 8801 + }, + { + "epoch": 0.7, + "learning_rate": 4.431636007045396e-06, + "loss": 0.2048, + "step": 8802 + }, + { + "epoch": 0.7, + "learning_rate": 4.429504787491214e-06, + "loss": 0.4041, + "step": 8803 + }, + { + "epoch": 0.7, + "learning_rate": 4.427373934727337e-06, + "loss": 0.4008, + "step": 8804 + }, + { + "epoch": 0.7, + "learning_rate": 4.425243448894074e-06, + "loss": 0.2524, + "step": 8805 + }, + { + "epoch": 0.7, + "learning_rate": 4.423113330131708e-06, + "loss": 0.3525, + "step": 8806 + }, + { + "epoch": 0.7, + "learning_rate": 4.42098357858049e-06, + "loss": 0.4638, + "step": 8807 + }, + { + "epoch": 0.7, + "learning_rate": 4.418854194380663e-06, + "loss": 0.3352, + "step": 8808 + }, + { + "epoch": 0.7, + "learning_rate": 4.416725177672432e-06, + "loss": 0.2261, + "step": 8809 + }, + { + "epoch": 0.7, + "learning_rate": 4.4145965285959836e-06, + "loss": 0.3483, + "step": 8810 + }, + { + "epoch": 0.7, + "learning_rate": 4.412468247291474e-06, + "loss": 0.3193, + "step": 8811 + }, + { + "epoch": 0.7, + "learning_rate": 4.410340333899049e-06, + "loss": 0.4588, + "step": 8812 + }, + { + "epoch": 0.7, + "learning_rate": 4.408212788558818e-06, + "loss": 0.3848, + "step": 8813 + }, + { + "epoch": 0.7, + "learning_rate": 4.406085611410864e-06, + "loss": 0.3956, + "step": 8814 + }, + { + "epoch": 0.7, + "learning_rate": 4.403958802595261e-06, + "loss": 0.4191, + "step": 8815 + }, + { + "epoch": 0.7, + "learning_rate": 4.401832362252044e-06, + "loss": 0.2995, + "step": 8816 + }, + { + "epoch": 0.7, + "learning_rate": 4.399706290521225e-06, + "loss": 0.2901, + "step": 8817 + }, + { + "epoch": 0.7, + "learning_rate": 4.397580587542805e-06, + "loss": 0.2578, + "step": 8818 + }, + { + "epoch": 0.7, + "learning_rate": 4.3954552534567455e-06, + "loss": 0.3345, + "step": 8819 + }, + { + "epoch": 0.7, + "learning_rate": 4.393330288402986e-06, + "loss": 0.3874, + "step": 8820 + }, + { + "epoch": 0.7, + "learning_rate": 4.391205692521453e-06, + "loss": 0.3672, + "step": 8821 + }, + { + "epoch": 0.7, + "learning_rate": 4.389081465952039e-06, + "loss": 0.3812, + "step": 8822 + }, + { + "epoch": 0.7, + "learning_rate": 4.386957608834607e-06, + "loss": 0.2053, + "step": 8823 + }, + { + "epoch": 0.7, + "learning_rate": 4.384834121309013e-06, + "loss": 0.4392, + "step": 8824 + }, + { + "epoch": 0.7, + "learning_rate": 4.382711003515072e-06, + "loss": 0.3832, + "step": 8825 + }, + { + "epoch": 0.7, + "learning_rate": 4.3805882555925846e-06, + "loss": 0.3068, + "step": 8826 + }, + { + "epoch": 0.7, + "learning_rate": 4.378465877681317e-06, + "loss": 0.4159, + "step": 8827 + }, + { + "epoch": 0.7, + "learning_rate": 4.376343869921027e-06, + "loss": 0.3861, + "step": 8828 + }, + { + "epoch": 0.7, + "learning_rate": 4.374222232451433e-06, + "loss": 0.3602, + "step": 8829 + }, + { + "epoch": 0.7, + "learning_rate": 4.3721009654122315e-06, + "loss": 0.4136, + "step": 8830 + }, + { + "epoch": 0.7, + "learning_rate": 4.369980068943106e-06, + "loss": 0.2614, + "step": 8831 + }, + { + "epoch": 0.7, + "learning_rate": 4.367859543183702e-06, + "loss": 0.3766, + "step": 8832 + }, + { + "epoch": 0.7, + "learning_rate": 4.3657393882736456e-06, + "loss": 0.315, + "step": 8833 + }, + { + "epoch": 0.7, + "learning_rate": 4.3636196043525415e-06, + "loss": 0.402, + "step": 8834 + }, + { + "epoch": 0.7, + "learning_rate": 4.361500191559967e-06, + "loss": 0.3854, + "step": 8835 + }, + { + "epoch": 0.7, + "learning_rate": 4.35938115003547e-06, + "loss": 0.35, + "step": 8836 + }, + { + "epoch": 0.7, + "learning_rate": 4.357262479918587e-06, + "loss": 0.333, + "step": 8837 + }, + { + "epoch": 0.7, + "learning_rate": 4.355144181348819e-06, + "loss": 0.3689, + "step": 8838 + }, + { + "epoch": 0.7, + "learning_rate": 4.353026254465642e-06, + "loss": 0.4301, + "step": 8839 + }, + { + "epoch": 0.7, + "learning_rate": 4.350908699408521e-06, + "loss": 0.3832, + "step": 8840 + }, + { + "epoch": 0.7, + "learning_rate": 4.348791516316878e-06, + "loss": 0.3682, + "step": 8841 + }, + { + "epoch": 0.7, + "learning_rate": 4.346674705330117e-06, + "loss": 0.3247, + "step": 8842 + }, + { + "epoch": 0.7, + "learning_rate": 4.344558266587628e-06, + "loss": 0.2973, + "step": 8843 + }, + { + "epoch": 0.7, + "learning_rate": 4.342442200228766e-06, + "loss": 0.2902, + "step": 8844 + }, + { + "epoch": 0.7, + "learning_rate": 4.340326506392859e-06, + "loss": 0.2875, + "step": 8845 + }, + { + "epoch": 0.7, + "learning_rate": 4.338211185219222e-06, + "loss": 0.3513, + "step": 8846 + }, + { + "epoch": 0.7, + "learning_rate": 4.336096236847136e-06, + "loss": 0.2951, + "step": 8847 + }, + { + "epoch": 0.7, + "learning_rate": 4.333981661415856e-06, + "loss": 0.1973, + "step": 8848 + }, + { + "epoch": 0.7, + "learning_rate": 4.331867459064623e-06, + "loss": 0.3646, + "step": 8849 + }, + { + "epoch": 0.7, + "learning_rate": 4.329753629932646e-06, + "loss": 0.3584, + "step": 8850 + }, + { + "epoch": 0.7, + "learning_rate": 4.327640174159109e-06, + "loss": 0.3128, + "step": 8851 + }, + { + "epoch": 0.7, + "learning_rate": 4.325527091883168e-06, + "loss": 0.2442, + "step": 8852 + }, + { + "epoch": 0.7, + "learning_rate": 4.323414383243969e-06, + "loss": 0.3629, + "step": 8853 + }, + { + "epoch": 0.7, + "learning_rate": 4.321302048380619e-06, + "loss": 0.3384, + "step": 8854 + }, + { + "epoch": 0.7, + "learning_rate": 4.319190087432201e-06, + "loss": 0.341, + "step": 8855 + }, + { + "epoch": 0.7, + "learning_rate": 4.317078500537785e-06, + "loss": 0.32, + "step": 8856 + }, + { + "epoch": 0.7, + "learning_rate": 4.314967287836405e-06, + "loss": 0.3641, + "step": 8857 + }, + { + "epoch": 0.7, + "learning_rate": 4.3128564494670715e-06, + "loss": 0.3323, + "step": 8858 + }, + { + "epoch": 0.7, + "learning_rate": 4.310745985568779e-06, + "loss": 0.4212, + "step": 8859 + }, + { + "epoch": 0.7, + "learning_rate": 4.3086358962804885e-06, + "loss": 0.3101, + "step": 8860 + }, + { + "epoch": 0.7, + "learning_rate": 4.306526181741135e-06, + "loss": 0.3227, + "step": 8861 + }, + { + "epoch": 0.7, + "learning_rate": 4.304416842089641e-06, + "loss": 0.3317, + "step": 8862 + }, + { + "epoch": 0.7, + "learning_rate": 4.302307877464893e-06, + "loss": 0.4127, + "step": 8863 + }, + { + "epoch": 0.7, + "learning_rate": 4.300199288005753e-06, + "loss": 0.3498, + "step": 8864 + }, + { + "epoch": 0.7, + "learning_rate": 4.298091073851066e-06, + "loss": 0.2982, + "step": 8865 + }, + { + "epoch": 0.7, + "learning_rate": 4.295983235139647e-06, + "loss": 0.277, + "step": 8866 + }, + { + "epoch": 0.7, + "learning_rate": 4.293875772010287e-06, + "loss": 0.2874, + "step": 8867 + }, + { + "epoch": 0.7, + "learning_rate": 4.291768684601746e-06, + "loss": 0.377, + "step": 8868 + }, + { + "epoch": 0.7, + "learning_rate": 4.289661973052774e-06, + "loss": 0.291, + "step": 8869 + }, + { + "epoch": 0.7, + "learning_rate": 4.287555637502086e-06, + "loss": 0.3974, + "step": 8870 + }, + { + "epoch": 0.7, + "learning_rate": 4.285449678088369e-06, + "loss": 0.3778, + "step": 8871 + }, + { + "epoch": 0.7, + "learning_rate": 4.283344094950297e-06, + "loss": 0.356, + "step": 8872 + }, + { + "epoch": 0.7, + "learning_rate": 4.2812388882265095e-06, + "loss": 0.3586, + "step": 8873 + }, + { + "epoch": 0.7, + "learning_rate": 4.279134058055622e-06, + "loss": 0.3414, + "step": 8874 + }, + { + "epoch": 0.7, + "learning_rate": 4.2770296045762315e-06, + "loss": 0.4693, + "step": 8875 + }, + { + "epoch": 0.7, + "learning_rate": 4.274925527926907e-06, + "loss": 0.4077, + "step": 8876 + }, + { + "epoch": 0.7, + "learning_rate": 4.272821828246183e-06, + "loss": 0.2514, + "step": 8877 + }, + { + "epoch": 0.7, + "learning_rate": 4.270718505672588e-06, + "loss": 0.3524, + "step": 8878 + }, + { + "epoch": 0.7, + "learning_rate": 4.2686155603446134e-06, + "loss": 0.2906, + "step": 8879 + }, + { + "epoch": 0.7, + "learning_rate": 4.266512992400726e-06, + "loss": 0.5256, + "step": 8880 + }, + { + "epoch": 0.7, + "learning_rate": 4.2644108019793665e-06, + "loss": 0.4232, + "step": 8881 + }, + { + "epoch": 0.7, + "learning_rate": 4.262308989218961e-06, + "loss": 0.3781, + "step": 8882 + }, + { + "epoch": 0.7, + "learning_rate": 4.2602075542579e-06, + "loss": 0.3507, + "step": 8883 + }, + { + "epoch": 0.7, + "learning_rate": 4.258106497234551e-06, + "loss": 0.3361, + "step": 8884 + }, + { + "epoch": 0.7, + "learning_rate": 4.256005818287265e-06, + "loss": 0.461, + "step": 8885 + }, + { + "epoch": 0.7, + "learning_rate": 4.253905517554356e-06, + "loss": 0.3052, + "step": 8886 + }, + { + "epoch": 0.7, + "learning_rate": 4.251805595174117e-06, + "loss": 0.2739, + "step": 8887 + }, + { + "epoch": 0.7, + "learning_rate": 4.249706051284824e-06, + "loss": 0.3571, + "step": 8888 + }, + { + "epoch": 0.7, + "learning_rate": 4.24760688602472e-06, + "loss": 0.3671, + "step": 8889 + }, + { + "epoch": 0.7, + "learning_rate": 4.245508099532021e-06, + "loss": 0.3198, + "step": 8890 + }, + { + "epoch": 0.7, + "learning_rate": 4.243409691944927e-06, + "loss": 0.4105, + "step": 8891 + }, + { + "epoch": 0.7, + "learning_rate": 4.241311663401606e-06, + "loss": 0.3395, + "step": 8892 + }, + { + "epoch": 0.7, + "learning_rate": 4.2392140140401996e-06, + "loss": 0.2771, + "step": 8893 + }, + { + "epoch": 0.7, + "learning_rate": 4.237116743998835e-06, + "loss": 0.4266, + "step": 8894 + }, + { + "epoch": 0.7, + "learning_rate": 4.235019853415603e-06, + "loss": 0.4056, + "step": 8895 + }, + { + "epoch": 0.7, + "learning_rate": 4.232923342428574e-06, + "loss": 0.2685, + "step": 8896 + }, + { + "epoch": 0.7, + "learning_rate": 4.230827211175791e-06, + "loss": 0.3214, + "step": 8897 + }, + { + "epoch": 0.7, + "learning_rate": 4.22873145979528e-06, + "loss": 0.3473, + "step": 8898 + }, + { + "epoch": 0.71, + "learning_rate": 4.226636088425033e-06, + "loss": 0.34, + "step": 8899 + }, + { + "epoch": 0.71, + "learning_rate": 4.2245410972030154e-06, + "loss": 0.3867, + "step": 8900 + }, + { + "epoch": 0.71, + "learning_rate": 4.222446486267181e-06, + "loss": 0.3512, + "step": 8901 + }, + { + "epoch": 0.71, + "learning_rate": 4.220352255755445e-06, + "loss": 0.362, + "step": 8902 + }, + { + "epoch": 0.71, + "learning_rate": 4.218258405805701e-06, + "loss": 0.2374, + "step": 8903 + }, + { + "epoch": 0.71, + "learning_rate": 4.216164936555823e-06, + "loss": 0.3807, + "step": 8904 + }, + { + "epoch": 0.71, + "learning_rate": 4.214071848143655e-06, + "loss": 0.4712, + "step": 8905 + }, + { + "epoch": 0.71, + "learning_rate": 4.211979140707012e-06, + "loss": 0.256, + "step": 8906 + }, + { + "epoch": 0.71, + "learning_rate": 4.209886814383696e-06, + "loss": 0.4039, + "step": 8907 + }, + { + "epoch": 0.71, + "learning_rate": 4.207794869311472e-06, + "loss": 0.3001, + "step": 8908 + }, + { + "epoch": 0.71, + "learning_rate": 4.205703305628082e-06, + "loss": 0.4042, + "step": 8909 + }, + { + "epoch": 0.71, + "learning_rate": 4.203612123471254e-06, + "loss": 0.3979, + "step": 8910 + }, + { + "epoch": 0.71, + "learning_rate": 4.201521322978677e-06, + "loss": 0.3346, + "step": 8911 + }, + { + "epoch": 0.71, + "learning_rate": 4.19943090428802e-06, + "loss": 0.3607, + "step": 8912 + }, + { + "epoch": 0.71, + "learning_rate": 4.197340867536923e-06, + "loss": 0.2989, + "step": 8913 + }, + { + "epoch": 0.71, + "learning_rate": 4.195251212863014e-06, + "loss": 0.2077, + "step": 8914 + }, + { + "epoch": 0.71, + "learning_rate": 4.193161940403882e-06, + "loss": 0.4289, + "step": 8915 + }, + { + "epoch": 0.71, + "learning_rate": 4.191073050297091e-06, + "loss": 0.2157, + "step": 8916 + }, + { + "epoch": 0.71, + "learning_rate": 4.188984542680192e-06, + "loss": 0.4255, + "step": 8917 + }, + { + "epoch": 0.71, + "learning_rate": 4.186896417690701e-06, + "loss": 0.2832, + "step": 8918 + }, + { + "epoch": 0.71, + "learning_rate": 4.18480867546611e-06, + "loss": 0.3475, + "step": 8919 + }, + { + "epoch": 0.71, + "learning_rate": 4.182721316143888e-06, + "loss": 0.436, + "step": 8920 + }, + { + "epoch": 0.71, + "learning_rate": 4.180634339861474e-06, + "loss": 0.2903, + "step": 8921 + }, + { + "epoch": 0.71, + "learning_rate": 4.178547746756285e-06, + "loss": 0.4434, + "step": 8922 + }, + { + "epoch": 0.71, + "learning_rate": 4.17646153696572e-06, + "loss": 0.3823, + "step": 8923 + }, + { + "epoch": 0.71, + "learning_rate": 4.174375710627141e-06, + "loss": 0.361, + "step": 8924 + }, + { + "epoch": 0.71, + "learning_rate": 4.172290267877887e-06, + "loss": 0.3261, + "step": 8925 + }, + { + "epoch": 0.71, + "learning_rate": 4.170205208855281e-06, + "loss": 0.2571, + "step": 8926 + }, + { + "epoch": 0.71, + "learning_rate": 4.1681205336966115e-06, + "loss": 0.2413, + "step": 8927 + }, + { + "epoch": 0.71, + "learning_rate": 4.16603624253914e-06, + "loss": 0.2512, + "step": 8928 + }, + { + "epoch": 0.71, + "learning_rate": 4.163952335520114e-06, + "loss": 0.4565, + "step": 8929 + }, + { + "epoch": 0.71, + "learning_rate": 4.161868812776746e-06, + "loss": 0.1983, + "step": 8930 + }, + { + "epoch": 0.71, + "learning_rate": 4.15978567444622e-06, + "loss": 0.3744, + "step": 8931 + }, + { + "epoch": 0.71, + "learning_rate": 4.157702920665712e-06, + "loss": 0.2848, + "step": 8932 + }, + { + "epoch": 0.71, + "learning_rate": 4.155620551572354e-06, + "loss": 0.3935, + "step": 8933 + }, + { + "epoch": 0.71, + "learning_rate": 4.153538567303258e-06, + "loss": 0.2529, + "step": 8934 + }, + { + "epoch": 0.71, + "learning_rate": 4.151456967995519e-06, + "loss": 0.4273, + "step": 8935 + }, + { + "epoch": 0.71, + "learning_rate": 4.149375753786198e-06, + "loss": 0.3448, + "step": 8936 + }, + { + "epoch": 0.71, + "learning_rate": 4.147294924812332e-06, + "loss": 0.32, + "step": 8937 + }, + { + "epoch": 0.71, + "learning_rate": 4.14521448121093e-06, + "loss": 0.3538, + "step": 8938 + }, + { + "epoch": 0.71, + "learning_rate": 4.143134423118986e-06, + "loss": 0.4068, + "step": 8939 + }, + { + "epoch": 0.71, + "learning_rate": 4.14105475067346e-06, + "loss": 0.3521, + "step": 8940 + }, + { + "epoch": 0.71, + "learning_rate": 4.138975464011284e-06, + "loss": 0.4728, + "step": 8941 + }, + { + "epoch": 0.71, + "learning_rate": 4.136896563269375e-06, + "loss": 0.3224, + "step": 8942 + }, + { + "epoch": 0.71, + "learning_rate": 4.1348180485846145e-06, + "loss": 0.3509, + "step": 8943 + }, + { + "epoch": 0.71, + "learning_rate": 4.1327399200938625e-06, + "loss": 0.3933, + "step": 8944 + }, + { + "epoch": 0.71, + "learning_rate": 4.1306621779339585e-06, + "loss": 0.2698, + "step": 8945 + }, + { + "epoch": 0.71, + "learning_rate": 4.128584822241708e-06, + "loss": 0.342, + "step": 8946 + }, + { + "epoch": 0.71, + "learning_rate": 4.126507853153891e-06, + "loss": 0.2885, + "step": 8947 + }, + { + "epoch": 0.71, + "learning_rate": 4.124431270807277e-06, + "loss": 0.2836, + "step": 8948 + }, + { + "epoch": 0.71, + "learning_rate": 4.12235507533859e-06, + "loss": 0.4018, + "step": 8949 + }, + { + "epoch": 0.71, + "learning_rate": 4.120279266884537e-06, + "loss": 0.3806, + "step": 8950 + }, + { + "epoch": 0.71, + "learning_rate": 4.118203845581807e-06, + "loss": 0.4588, + "step": 8951 + }, + { + "epoch": 0.71, + "learning_rate": 4.11612881156705e-06, + "loss": 0.4049, + "step": 8952 + }, + { + "epoch": 0.71, + "learning_rate": 4.114054164976902e-06, + "loss": 0.3427, + "step": 8953 + }, + { + "epoch": 0.71, + "learning_rate": 4.111979905947961e-06, + "loss": 0.3261, + "step": 8954 + }, + { + "epoch": 0.71, + "learning_rate": 4.109906034616816e-06, + "loss": 0.2479, + "step": 8955 + }, + { + "epoch": 0.71, + "learning_rate": 4.107832551120017e-06, + "loss": 0.3542, + "step": 8956 + }, + { + "epoch": 0.71, + "learning_rate": 4.105759455594091e-06, + "loss": 0.2468, + "step": 8957 + }, + { + "epoch": 0.71, + "learning_rate": 4.103686748175545e-06, + "loss": 0.3617, + "step": 8958 + }, + { + "epoch": 0.71, + "learning_rate": 4.101614429000857e-06, + "loss": 0.3408, + "step": 8959 + }, + { + "epoch": 0.71, + "learning_rate": 4.099542498206473e-06, + "loss": 0.3038, + "step": 8960 + }, + { + "epoch": 0.71, + "learning_rate": 4.0974709559288275e-06, + "loss": 0.3784, + "step": 8961 + }, + { + "epoch": 0.71, + "learning_rate": 4.095399802304319e-06, + "loss": 0.2723, + "step": 8962 + }, + { + "epoch": 0.71, + "learning_rate": 4.093329037469319e-06, + "loss": 0.2857, + "step": 8963 + }, + { + "epoch": 0.71, + "learning_rate": 4.091258661560184e-06, + "loss": 0.256, + "step": 8964 + }, + { + "epoch": 0.71, + "learning_rate": 4.0891886747132356e-06, + "loss": 0.3474, + "step": 8965 + }, + { + "epoch": 0.71, + "learning_rate": 4.087119077064772e-06, + "loss": 0.2844, + "step": 8966 + }, + { + "epoch": 0.71, + "learning_rate": 4.085049868751062e-06, + "loss": 0.3369, + "step": 8967 + }, + { + "epoch": 0.71, + "learning_rate": 4.082981049908362e-06, + "loss": 0.203, + "step": 8968 + }, + { + "epoch": 0.71, + "learning_rate": 4.080912620672888e-06, + "loss": 0.4175, + "step": 8969 + }, + { + "epoch": 0.71, + "learning_rate": 4.078844581180833e-06, + "loss": 0.3347, + "step": 8970 + }, + { + "epoch": 0.71, + "learning_rate": 4.076776931568376e-06, + "loss": 0.3752, + "step": 8971 + }, + { + "epoch": 0.71, + "learning_rate": 4.074709671971657e-06, + "loss": 0.311, + "step": 8972 + }, + { + "epoch": 0.71, + "learning_rate": 4.0726428025267925e-06, + "loss": 0.2383, + "step": 8973 + }, + { + "epoch": 0.71, + "learning_rate": 4.070576323369882e-06, + "loss": 0.3457, + "step": 8974 + }, + { + "epoch": 0.71, + "learning_rate": 4.06851023463699e-06, + "loss": 0.5, + "step": 8975 + }, + { + "epoch": 0.71, + "learning_rate": 4.066444536464155e-06, + "loss": 0.3421, + "step": 8976 + }, + { + "epoch": 0.71, + "learning_rate": 4.0643792289874e-06, + "loss": 0.4045, + "step": 8977 + }, + { + "epoch": 0.71, + "learning_rate": 4.062314312342712e-06, + "loss": 0.3278, + "step": 8978 + }, + { + "epoch": 0.71, + "learning_rate": 4.060249786666054e-06, + "loss": 0.3784, + "step": 8979 + }, + { + "epoch": 0.71, + "learning_rate": 4.0581856520933706e-06, + "loss": 0.401, + "step": 8980 + }, + { + "epoch": 0.71, + "learning_rate": 4.056121908760571e-06, + "loss": 0.4038, + "step": 8981 + }, + { + "epoch": 0.71, + "learning_rate": 4.054058556803544e-06, + "loss": 0.3618, + "step": 8982 + }, + { + "epoch": 0.71, + "learning_rate": 4.051995596358147e-06, + "loss": 0.4473, + "step": 8983 + }, + { + "epoch": 0.71, + "learning_rate": 4.049933027560225e-06, + "loss": 0.4155, + "step": 8984 + }, + { + "epoch": 0.71, + "learning_rate": 4.047870850545581e-06, + "loss": 0.371, + "step": 8985 + }, + { + "epoch": 0.71, + "learning_rate": 4.045809065449999e-06, + "loss": 0.3159, + "step": 8986 + }, + { + "epoch": 0.71, + "learning_rate": 4.043747672409245e-06, + "loss": 0.3523, + "step": 8987 + }, + { + "epoch": 0.71, + "learning_rate": 4.041686671559046e-06, + "loss": 0.3291, + "step": 8988 + }, + { + "epoch": 0.71, + "learning_rate": 4.039626063035107e-06, + "loss": 0.3224, + "step": 8989 + }, + { + "epoch": 0.71, + "learning_rate": 4.0375658469731164e-06, + "loss": 0.3274, + "step": 8990 + }, + { + "epoch": 0.71, + "learning_rate": 4.035506023508724e-06, + "loss": 0.3615, + "step": 8991 + }, + { + "epoch": 0.71, + "learning_rate": 4.033446592777558e-06, + "loss": 0.3283, + "step": 8992 + }, + { + "epoch": 0.71, + "learning_rate": 4.031387554915228e-06, + "loss": 0.1987, + "step": 8993 + }, + { + "epoch": 0.71, + "learning_rate": 4.029328910057308e-06, + "loss": 0.3296, + "step": 8994 + }, + { + "epoch": 0.71, + "learning_rate": 4.027270658339347e-06, + "loss": 0.336, + "step": 8995 + }, + { + "epoch": 0.71, + "learning_rate": 4.025212799896881e-06, + "loss": 0.3944, + "step": 8996 + }, + { + "epoch": 0.71, + "learning_rate": 4.023155334865401e-06, + "loss": 0.3272, + "step": 8997 + }, + { + "epoch": 0.71, + "learning_rate": 4.0210982633803784e-06, + "loss": 0.4109, + "step": 8998 + }, + { + "epoch": 0.71, + "learning_rate": 4.01904158557727e-06, + "loss": 0.3306, + "step": 8999 + }, + { + "epoch": 0.71, + "learning_rate": 4.016985301591496e-06, + "loss": 0.3401, + "step": 9000 + }, + { + "epoch": 0.71, + "learning_rate": 4.014929411558447e-06, + "loss": 0.3556, + "step": 9001 + }, + { + "epoch": 0.71, + "learning_rate": 4.012873915613501e-06, + "loss": 0.2967, + "step": 9002 + }, + { + "epoch": 0.71, + "learning_rate": 4.010818813892e-06, + "loss": 0.3836, + "step": 9003 + }, + { + "epoch": 0.71, + "learning_rate": 4.008764106529259e-06, + "loss": 0.3572, + "step": 9004 + }, + { + "epoch": 0.71, + "learning_rate": 4.006709793660577e-06, + "loss": 0.351, + "step": 9005 + }, + { + "epoch": 0.71, + "learning_rate": 4.004655875421217e-06, + "loss": 0.3603, + "step": 9006 + }, + { + "epoch": 0.71, + "learning_rate": 4.00260235194642e-06, + "loss": 0.3935, + "step": 9007 + }, + { + "epoch": 0.71, + "learning_rate": 4.0005492233713964e-06, + "loss": 0.3313, + "step": 9008 + }, + { + "epoch": 0.71, + "learning_rate": 3.998496489831343e-06, + "loss": 0.319, + "step": 9009 + }, + { + "epoch": 0.71, + "learning_rate": 3.996444151461417e-06, + "loss": 0.3529, + "step": 9010 + }, + { + "epoch": 0.71, + "learning_rate": 3.994392208396754e-06, + "loss": 0.3741, + "step": 9011 + }, + { + "epoch": 0.71, + "learning_rate": 3.992340660772472e-06, + "loss": 0.2556, + "step": 9012 + }, + { + "epoch": 0.71, + "learning_rate": 3.990289508723648e-06, + "loss": 0.4291, + "step": 9013 + }, + { + "epoch": 0.71, + "learning_rate": 3.988238752385341e-06, + "loss": 0.3108, + "step": 9014 + }, + { + "epoch": 0.71, + "learning_rate": 3.986188391892587e-06, + "loss": 0.4903, + "step": 9015 + }, + { + "epoch": 0.71, + "learning_rate": 3.984138427380393e-06, + "loss": 0.4002, + "step": 9016 + }, + { + "epoch": 0.71, + "learning_rate": 3.982088858983733e-06, + "loss": 0.3132, + "step": 9017 + }, + { + "epoch": 0.71, + "learning_rate": 3.9800396868375675e-06, + "loss": 0.3967, + "step": 9018 + }, + { + "epoch": 0.71, + "learning_rate": 3.977990911076823e-06, + "loss": 0.327, + "step": 9019 + }, + { + "epoch": 0.71, + "learning_rate": 3.975942531836397e-06, + "loss": 0.3672, + "step": 9020 + }, + { + "epoch": 0.71, + "learning_rate": 3.973894549251175e-06, + "loss": 0.4131, + "step": 9021 + }, + { + "epoch": 0.71, + "learning_rate": 3.971846963455999e-06, + "loss": 0.4288, + "step": 9022 + }, + { + "epoch": 0.71, + "learning_rate": 3.969799774585696e-06, + "loss": 0.2992, + "step": 9023 + }, + { + "epoch": 0.71, + "learning_rate": 3.967752982775058e-06, + "loss": 0.3225, + "step": 9024 + }, + { + "epoch": 0.71, + "learning_rate": 3.965706588158865e-06, + "loss": 0.4109, + "step": 9025 + }, + { + "epoch": 0.72, + "learning_rate": 3.963660590871858e-06, + "loss": 0.3385, + "step": 9026 + }, + { + "epoch": 0.72, + "learning_rate": 3.961614991048752e-06, + "loss": 0.2757, + "step": 9027 + }, + { + "epoch": 0.72, + "learning_rate": 3.959569788824248e-06, + "loss": 0.4323, + "step": 9028 + }, + { + "epoch": 0.72, + "learning_rate": 3.957524984333009e-06, + "loss": 0.327, + "step": 9029 + }, + { + "epoch": 0.72, + "learning_rate": 3.955480577709672e-06, + "loss": 0.4016, + "step": 9030 + }, + { + "epoch": 0.72, + "learning_rate": 3.953436569088856e-06, + "loss": 0.3417, + "step": 9031 + }, + { + "epoch": 0.72, + "learning_rate": 3.951392958605149e-06, + "loss": 0.2926, + "step": 9032 + }, + { + "epoch": 0.72, + "learning_rate": 3.949349746393108e-06, + "loss": 0.3275, + "step": 9033 + }, + { + "epoch": 0.72, + "learning_rate": 3.947306932587277e-06, + "loss": 0.4024, + "step": 9034 + }, + { + "epoch": 0.72, + "learning_rate": 3.945264517322159e-06, + "loss": 0.3811, + "step": 9035 + }, + { + "epoch": 0.72, + "learning_rate": 3.943222500732241e-06, + "loss": 0.3152, + "step": 9036 + }, + { + "epoch": 0.72, + "learning_rate": 3.941180882951972e-06, + "loss": 0.3636, + "step": 9037 + }, + { + "epoch": 0.72, + "learning_rate": 3.9391396641157945e-06, + "loss": 0.3195, + "step": 9038 + }, + { + "epoch": 0.72, + "learning_rate": 3.937098844358106e-06, + "loss": 0.2573, + "step": 9039 + }, + { + "epoch": 0.72, + "learning_rate": 3.935058423813282e-06, + "loss": 0.341, + "step": 9040 + }, + { + "epoch": 0.72, + "learning_rate": 3.933018402615683e-06, + "loss": 0.325, + "step": 9041 + }, + { + "epoch": 0.72, + "learning_rate": 3.9309787808996284e-06, + "loss": 0.3279, + "step": 9042 + }, + { + "epoch": 0.72, + "learning_rate": 3.928939558799415e-06, + "loss": 0.1847, + "step": 9043 + }, + { + "epoch": 0.72, + "learning_rate": 3.926900736449324e-06, + "loss": 0.3987, + "step": 9044 + }, + { + "epoch": 0.72, + "learning_rate": 3.924862313983597e-06, + "loss": 0.2696, + "step": 9045 + }, + { + "epoch": 0.72, + "learning_rate": 3.922824291536452e-06, + "loss": 0.3596, + "step": 9046 + }, + { + "epoch": 0.72, + "learning_rate": 3.920786669242089e-06, + "loss": 0.2172, + "step": 9047 + }, + { + "epoch": 0.72, + "learning_rate": 3.918749447234674e-06, + "loss": 0.3392, + "step": 9048 + }, + { + "epoch": 0.72, + "learning_rate": 3.9167126256483415e-06, + "loss": 0.3781, + "step": 9049 + }, + { + "epoch": 0.72, + "learning_rate": 3.914676204617216e-06, + "loss": 0.3249, + "step": 9050 + }, + { + "epoch": 0.72, + "learning_rate": 3.912640184275381e-06, + "loss": 0.3896, + "step": 9051 + }, + { + "epoch": 0.72, + "learning_rate": 3.9106045647569005e-06, + "loss": 0.3296, + "step": 9052 + }, + { + "epoch": 0.72, + "learning_rate": 3.908569346195804e-06, + "loss": 0.4353, + "step": 9053 + }, + { + "epoch": 0.72, + "learning_rate": 3.90653452872611e-06, + "loss": 0.3558, + "step": 9054 + }, + { + "epoch": 0.72, + "learning_rate": 3.904500112481798e-06, + "loss": 0.2771, + "step": 9055 + }, + { + "epoch": 0.72, + "learning_rate": 3.902466097596821e-06, + "loss": 0.3282, + "step": 9056 + }, + { + "epoch": 0.72, + "learning_rate": 3.900432484205115e-06, + "loss": 0.4264, + "step": 9057 + }, + { + "epoch": 0.72, + "learning_rate": 3.89839927244058e-06, + "loss": 0.4262, + "step": 9058 + }, + { + "epoch": 0.72, + "learning_rate": 3.89636646243709e-06, + "loss": 0.3254, + "step": 9059 + }, + { + "epoch": 0.72, + "learning_rate": 3.894334054328505e-06, + "loss": 0.2766, + "step": 9060 + }, + { + "epoch": 0.72, + "learning_rate": 3.892302048248642e-06, + "loss": 0.3962, + "step": 9061 + }, + { + "epoch": 0.72, + "learning_rate": 3.890270444331298e-06, + "loss": 0.404, + "step": 9062 + }, + { + "epoch": 0.72, + "learning_rate": 3.888239242710251e-06, + "loss": 0.272, + "step": 9063 + }, + { + "epoch": 0.72, + "learning_rate": 3.886208443519242e-06, + "loss": 0.2896, + "step": 9064 + }, + { + "epoch": 0.72, + "learning_rate": 3.884178046891984e-06, + "loss": 0.3953, + "step": 9065 + }, + { + "epoch": 0.72, + "learning_rate": 3.88214805296218e-06, + "loss": 0.4421, + "step": 9066 + }, + { + "epoch": 0.72, + "learning_rate": 3.880118461863488e-06, + "loss": 0.472, + "step": 9067 + }, + { + "epoch": 0.72, + "learning_rate": 3.878089273729549e-06, + "loss": 0.2511, + "step": 9068 + }, + { + "epoch": 0.72, + "learning_rate": 3.876060488693971e-06, + "loss": 0.3511, + "step": 9069 + }, + { + "epoch": 0.72, + "learning_rate": 3.874032106890347e-06, + "loss": 0.3438, + "step": 9070 + }, + { + "epoch": 0.72, + "learning_rate": 3.872004128452231e-06, + "loss": 0.3681, + "step": 9071 + }, + { + "epoch": 0.72, + "learning_rate": 3.8699765535131565e-06, + "loss": 0.4137, + "step": 9072 + }, + { + "epoch": 0.72, + "learning_rate": 3.867949382206632e-06, + "loss": 0.2715, + "step": 9073 + }, + { + "epoch": 0.72, + "learning_rate": 3.8659226146661344e-06, + "loss": 0.278, + "step": 9074 + }, + { + "epoch": 0.72, + "learning_rate": 3.8638962510251175e-06, + "loss": 0.3346, + "step": 9075 + }, + { + "epoch": 0.72, + "learning_rate": 3.861870291417008e-06, + "loss": 0.437, + "step": 9076 + }, + { + "epoch": 0.72, + "learning_rate": 3.859844735975205e-06, + "loss": 0.4452, + "step": 9077 + }, + { + "epoch": 0.72, + "learning_rate": 3.857819584833078e-06, + "loss": 0.2946, + "step": 9078 + }, + { + "epoch": 0.72, + "learning_rate": 3.855794838123981e-06, + "loss": 0.353, + "step": 9079 + }, + { + "epoch": 0.72, + "learning_rate": 3.85377049598123e-06, + "loss": 0.3289, + "step": 9080 + }, + { + "epoch": 0.72, + "learning_rate": 3.851746558538113e-06, + "loss": 0.3738, + "step": 9081 + }, + { + "epoch": 0.72, + "learning_rate": 3.849723025927907e-06, + "loss": 0.3196, + "step": 9082 + }, + { + "epoch": 0.72, + "learning_rate": 3.847699898283846e-06, + "loss": 0.4327, + "step": 9083 + }, + { + "epoch": 0.72, + "learning_rate": 3.84567717573914e-06, + "loss": 0.3986, + "step": 9084 + }, + { + "epoch": 0.72, + "learning_rate": 3.843654858426981e-06, + "loss": 0.3365, + "step": 9085 + }, + { + "epoch": 0.72, + "learning_rate": 3.84163294648053e-06, + "loss": 0.4065, + "step": 9086 + }, + { + "epoch": 0.72, + "learning_rate": 3.839611440032912e-06, + "loss": 0.4019, + "step": 9087 + }, + { + "epoch": 0.72, + "learning_rate": 3.837590339217243e-06, + "loss": 0.412, + "step": 9088 + }, + { + "epoch": 0.72, + "learning_rate": 3.835569644166599e-06, + "loss": 0.3436, + "step": 9089 + }, + { + "epoch": 0.72, + "learning_rate": 3.833549355014028e-06, + "loss": 0.3025, + "step": 9090 + }, + { + "epoch": 0.72, + "learning_rate": 3.8315294718925656e-06, + "loss": 0.2761, + "step": 9091 + }, + { + "epoch": 0.72, + "learning_rate": 3.829509994935206e-06, + "loss": 0.3804, + "step": 9092 + }, + { + "epoch": 0.72, + "learning_rate": 3.827490924274922e-06, + "loss": 0.3012, + "step": 9093 + }, + { + "epoch": 0.72, + "learning_rate": 3.825472260044658e-06, + "loss": 0.2972, + "step": 9094 + }, + { + "epoch": 0.72, + "learning_rate": 3.8234540023773385e-06, + "loss": 0.3655, + "step": 9095 + }, + { + "epoch": 0.72, + "learning_rate": 3.821436151405854e-06, + "loss": 0.2942, + "step": 9096 + }, + { + "epoch": 0.72, + "learning_rate": 3.819418707263065e-06, + "loss": 0.4476, + "step": 9097 + }, + { + "epoch": 0.72, + "learning_rate": 3.8174016700818196e-06, + "loss": 0.2742, + "step": 9098 + }, + { + "epoch": 0.72, + "learning_rate": 3.815385039994925e-06, + "loss": 0.3394, + "step": 9099 + }, + { + "epoch": 0.72, + "learning_rate": 3.8133688171351645e-06, + "loss": 0.3273, + "step": 9100 + }, + { + "epoch": 0.72, + "learning_rate": 3.811353001635302e-06, + "loss": 0.3274, + "step": 9101 + }, + { + "epoch": 0.72, + "learning_rate": 3.8093375936280665e-06, + "loss": 0.3007, + "step": 9102 + }, + { + "epoch": 0.72, + "learning_rate": 3.807322593246159e-06, + "loss": 0.4181, + "step": 9103 + }, + { + "epoch": 0.72, + "learning_rate": 3.805308000622265e-06, + "loss": 0.3748, + "step": 9104 + }, + { + "epoch": 0.72, + "learning_rate": 3.8032938158890333e-06, + "loss": 0.3194, + "step": 9105 + }, + { + "epoch": 0.72, + "learning_rate": 3.8012800391790814e-06, + "loss": 0.2896, + "step": 9106 + }, + { + "epoch": 0.72, + "learning_rate": 3.799266670625018e-06, + "loss": 0.3182, + "step": 9107 + }, + { + "epoch": 0.72, + "learning_rate": 3.797253710359409e-06, + "loss": 0.2867, + "step": 9108 + }, + { + "epoch": 0.72, + "learning_rate": 3.7952411585147954e-06, + "loss": 0.3652, + "step": 9109 + }, + { + "epoch": 0.72, + "learning_rate": 3.793229015223694e-06, + "loss": 0.4143, + "step": 9110 + }, + { + "epoch": 0.72, + "learning_rate": 3.7912172806186e-06, + "loss": 0.3022, + "step": 9111 + }, + { + "epoch": 0.72, + "learning_rate": 3.7892059548319726e-06, + "loss": 0.2712, + "step": 9112 + }, + { + "epoch": 0.72, + "learning_rate": 3.7871950379962463e-06, + "loss": 0.4019, + "step": 9113 + }, + { + "epoch": 0.72, + "learning_rate": 3.785184530243835e-06, + "loss": 0.3504, + "step": 9114 + }, + { + "epoch": 0.72, + "learning_rate": 3.7831744317071194e-06, + "loss": 0.3885, + "step": 9115 + }, + { + "epoch": 0.72, + "learning_rate": 3.7811647425184508e-06, + "loss": 0.3731, + "step": 9116 + }, + { + "epoch": 0.72, + "learning_rate": 3.7791554628101635e-06, + "loss": 0.3415, + "step": 9117 + }, + { + "epoch": 0.72, + "learning_rate": 3.777146592714557e-06, + "loss": 0.2732, + "step": 9118 + }, + { + "epoch": 0.72, + "learning_rate": 3.7751381323639e-06, + "loss": 0.401, + "step": 9119 + }, + { + "epoch": 0.72, + "learning_rate": 3.7731300818904494e-06, + "loss": 0.3012, + "step": 9120 + }, + { + "epoch": 0.72, + "learning_rate": 3.7711224414264216e-06, + "loss": 0.3701, + "step": 9121 + }, + { + "epoch": 0.72, + "learning_rate": 3.7691152111040087e-06, + "loss": 0.3785, + "step": 9122 + }, + { + "epoch": 0.72, + "learning_rate": 3.767108391055374e-06, + "loss": 0.2662, + "step": 9123 + }, + { + "epoch": 0.72, + "learning_rate": 3.7651019814126656e-06, + "loss": 0.3099, + "step": 9124 + }, + { + "epoch": 0.72, + "learning_rate": 3.7630959823079914e-06, + "loss": 0.3813, + "step": 9125 + }, + { + "epoch": 0.72, + "learning_rate": 3.761090393873432e-06, + "loss": 0.1733, + "step": 9126 + }, + { + "epoch": 0.72, + "learning_rate": 3.7590852162410553e-06, + "loss": 0.2421, + "step": 9127 + }, + { + "epoch": 0.72, + "learning_rate": 3.757080449542887e-06, + "loss": 0.3332, + "step": 9128 + }, + { + "epoch": 0.72, + "learning_rate": 3.7550760939109287e-06, + "loss": 0.3689, + "step": 9129 + }, + { + "epoch": 0.72, + "learning_rate": 3.7530721494771648e-06, + "loss": 0.3576, + "step": 9130 + }, + { + "epoch": 0.72, + "learning_rate": 3.751068616373541e-06, + "loss": 0.3017, + "step": 9131 + }, + { + "epoch": 0.72, + "learning_rate": 3.749065494731978e-06, + "loss": 0.3249, + "step": 9132 + }, + { + "epoch": 0.72, + "learning_rate": 3.747062784684378e-06, + "loss": 0.4252, + "step": 9133 + }, + { + "epoch": 0.72, + "learning_rate": 3.7450604863626063e-06, + "loss": 0.272, + "step": 9134 + }, + { + "epoch": 0.72, + "learning_rate": 3.7430585998985004e-06, + "loss": 0.402, + "step": 9135 + }, + { + "epoch": 0.72, + "learning_rate": 3.7410571254238835e-06, + "loss": 0.3733, + "step": 9136 + }, + { + "epoch": 0.72, + "learning_rate": 3.7390560630705387e-06, + "loss": 0.3389, + "step": 9137 + }, + { + "epoch": 0.72, + "learning_rate": 3.7370554129702265e-06, + "loss": 0.2774, + "step": 9138 + }, + { + "epoch": 0.72, + "learning_rate": 3.735055175254676e-06, + "loss": 0.3326, + "step": 9139 + }, + { + "epoch": 0.72, + "learning_rate": 3.733055350055601e-06, + "loss": 0.3984, + "step": 9140 + }, + { + "epoch": 0.72, + "learning_rate": 3.7310559375046774e-06, + "loss": 0.338, + "step": 9141 + }, + { + "epoch": 0.72, + "learning_rate": 3.7290569377335517e-06, + "loss": 0.2072, + "step": 9142 + }, + { + "epoch": 0.72, + "learning_rate": 3.7270583508738565e-06, + "loss": 0.3049, + "step": 9143 + }, + { + "epoch": 0.72, + "learning_rate": 3.725060177057185e-06, + "loss": 0.4199, + "step": 9144 + }, + { + "epoch": 0.72, + "learning_rate": 3.723062416415105e-06, + "loss": 0.4601, + "step": 9145 + }, + { + "epoch": 0.72, + "learning_rate": 3.721065069079165e-06, + "loss": 0.3328, + "step": 9146 + }, + { + "epoch": 0.72, + "learning_rate": 3.7190681351808778e-06, + "loss": 0.4165, + "step": 9147 + }, + { + "epoch": 0.72, + "learning_rate": 3.7170716148517294e-06, + "loss": 0.397, + "step": 9148 + }, + { + "epoch": 0.72, + "learning_rate": 3.715075508223187e-06, + "loss": 0.3318, + "step": 9149 + }, + { + "epoch": 0.72, + "learning_rate": 3.71307981542668e-06, + "loss": 0.278, + "step": 9150 + }, + { + "epoch": 0.72, + "learning_rate": 3.7110845365936144e-06, + "loss": 0.2601, + "step": 9151 + }, + { + "epoch": 0.73, + "learning_rate": 3.709089671855378e-06, + "loss": 0.4019, + "step": 9152 + }, + { + "epoch": 0.73, + "learning_rate": 3.707095221343313e-06, + "loss": 0.2737, + "step": 9153 + }, + { + "epoch": 0.73, + "learning_rate": 3.7051011851887455e-06, + "loss": 0.3091, + "step": 9154 + }, + { + "epoch": 0.73, + "learning_rate": 3.7031075635229787e-06, + "loss": 0.3576, + "step": 9155 + }, + { + "epoch": 0.73, + "learning_rate": 3.70111435647728e-06, + "loss": 0.309, + "step": 9156 + }, + { + "epoch": 0.73, + "learning_rate": 3.6991215641828903e-06, + "loss": 0.3256, + "step": 9157 + }, + { + "epoch": 0.73, + "learning_rate": 3.6971291867710303e-06, + "loss": 0.41, + "step": 9158 + }, + { + "epoch": 0.73, + "learning_rate": 3.6951372243728854e-06, + "loss": 0.2249, + "step": 9159 + }, + { + "epoch": 0.73, + "learning_rate": 3.693145677119615e-06, + "loss": 0.4312, + "step": 9160 + }, + { + "epoch": 0.73, + "learning_rate": 3.691154545142357e-06, + "loss": 0.349, + "step": 9161 + }, + { + "epoch": 0.73, + "learning_rate": 3.6891638285722176e-06, + "loss": 0.252, + "step": 9162 + }, + { + "epoch": 0.73, + "learning_rate": 3.687173527540273e-06, + "loss": 0.3325, + "step": 9163 + }, + { + "epoch": 0.73, + "learning_rate": 3.6851836421775733e-06, + "loss": 0.3466, + "step": 9164 + }, + { + "epoch": 0.73, + "learning_rate": 3.683194172615149e-06, + "loss": 0.3393, + "step": 9165 + }, + { + "epoch": 0.73, + "learning_rate": 3.681205118983995e-06, + "loss": 0.345, + "step": 9166 + }, + { + "epoch": 0.73, + "learning_rate": 3.6792164814150756e-06, + "loss": 0.2309, + "step": 9167 + }, + { + "epoch": 0.73, + "learning_rate": 3.6772282600393393e-06, + "loss": 0.2737, + "step": 9168 + }, + { + "epoch": 0.73, + "learning_rate": 3.675240454987701e-06, + "loss": 0.2897, + "step": 9169 + }, + { + "epoch": 0.73, + "learning_rate": 3.6732530663910415e-06, + "loss": 0.2496, + "step": 9170 + }, + { + "epoch": 0.73, + "learning_rate": 3.6712660943802292e-06, + "loss": 0.307, + "step": 9171 + }, + { + "epoch": 0.73, + "learning_rate": 3.6692795390860913e-06, + "loss": 0.3372, + "step": 9172 + }, + { + "epoch": 0.73, + "learning_rate": 3.667293400639432e-06, + "loss": 0.376, + "step": 9173 + }, + { + "epoch": 0.73, + "learning_rate": 3.665307679171034e-06, + "loss": 0.2574, + "step": 9174 + }, + { + "epoch": 0.73, + "learning_rate": 3.6633223748116454e-06, + "loss": 0.3713, + "step": 9175 + }, + { + "epoch": 0.73, + "learning_rate": 3.661337487691985e-06, + "loss": 0.3479, + "step": 9176 + }, + { + "epoch": 0.73, + "learning_rate": 3.659353017942754e-06, + "loss": 0.5077, + "step": 9177 + }, + { + "epoch": 0.73, + "learning_rate": 3.6573689656946177e-06, + "loss": 0.301, + "step": 9178 + }, + { + "epoch": 0.73, + "learning_rate": 3.655385331078217e-06, + "loss": 0.3267, + "step": 9179 + }, + { + "epoch": 0.73, + "learning_rate": 3.6534021142241595e-06, + "loss": 0.3713, + "step": 9180 + }, + { + "epoch": 0.73, + "learning_rate": 3.6514193152630382e-06, + "loss": 0.3603, + "step": 9181 + }, + { + "epoch": 0.73, + "learning_rate": 3.649436934325409e-06, + "loss": 0.2842, + "step": 9182 + }, + { + "epoch": 0.73, + "learning_rate": 3.647454971541796e-06, + "loss": 0.3742, + "step": 9183 + }, + { + "epoch": 0.73, + "learning_rate": 3.6454734270427107e-06, + "loss": 0.176, + "step": 9184 + }, + { + "epoch": 0.73, + "learning_rate": 3.6434923009586244e-06, + "loss": 0.3204, + "step": 9185 + }, + { + "epoch": 0.73, + "learning_rate": 3.6415115934199795e-06, + "loss": 0.2622, + "step": 9186 + }, + { + "epoch": 0.73, + "learning_rate": 3.6395313045572055e-06, + "loss": 0.3237, + "step": 9187 + }, + { + "epoch": 0.73, + "learning_rate": 3.6375514345006913e-06, + "loss": 0.3256, + "step": 9188 + }, + { + "epoch": 0.73, + "learning_rate": 3.635571983380797e-06, + "loss": 0.272, + "step": 9189 + }, + { + "epoch": 0.73, + "learning_rate": 3.6335929513278667e-06, + "loss": 0.3162, + "step": 9190 + }, + { + "epoch": 0.73, + "learning_rate": 3.631614338472208e-06, + "loss": 0.334, + "step": 9191 + }, + { + "epoch": 0.73, + "learning_rate": 3.6296361449440985e-06, + "loss": 0.4194, + "step": 9192 + }, + { + "epoch": 0.73, + "learning_rate": 3.6276583708738013e-06, + "loss": 0.3687, + "step": 9193 + }, + { + "epoch": 0.73, + "learning_rate": 3.6256810163915368e-06, + "loss": 0.3159, + "step": 9194 + }, + { + "epoch": 0.73, + "learning_rate": 3.623704081627507e-06, + "loss": 0.3598, + "step": 9195 + }, + { + "epoch": 0.73, + "learning_rate": 3.62172756671188e-06, + "loss": 0.3176, + "step": 9196 + }, + { + "epoch": 0.73, + "learning_rate": 3.619751471774805e-06, + "loss": 0.3993, + "step": 9197 + }, + { + "epoch": 0.73, + "learning_rate": 3.6177757969463956e-06, + "loss": 0.2657, + "step": 9198 + }, + { + "epoch": 0.73, + "learning_rate": 3.615800542356738e-06, + "loss": 0.2912, + "step": 9199 + }, + { + "epoch": 0.73, + "learning_rate": 3.6138257081358985e-06, + "loss": 0.3541, + "step": 9200 + }, + { + "epoch": 0.73, + "learning_rate": 3.6118512944139084e-06, + "loss": 0.4037, + "step": 9201 + }, + { + "epoch": 0.73, + "learning_rate": 3.609877301320769e-06, + "loss": 0.3632, + "step": 9202 + }, + { + "epoch": 0.73, + "learning_rate": 3.607903728986465e-06, + "loss": 0.4287, + "step": 9203 + }, + { + "epoch": 0.73, + "learning_rate": 3.6059305775409435e-06, + "loss": 0.3776, + "step": 9204 + }, + { + "epoch": 0.73, + "learning_rate": 3.6039578471141244e-06, + "loss": 0.416, + "step": 9205 + }, + { + "epoch": 0.73, + "learning_rate": 3.6019855378359092e-06, + "loss": 0.3871, + "step": 9206 + }, + { + "epoch": 0.73, + "learning_rate": 3.6000136498361605e-06, + "loss": 0.3038, + "step": 9207 + }, + { + "epoch": 0.73, + "learning_rate": 3.5980421832447188e-06, + "loss": 0.2423, + "step": 9208 + }, + { + "epoch": 0.73, + "learning_rate": 3.5960711381913904e-06, + "loss": 0.4243, + "step": 9209 + }, + { + "epoch": 0.73, + "learning_rate": 3.5941005148059684e-06, + "loss": 0.418, + "step": 9210 + }, + { + "epoch": 0.73, + "learning_rate": 3.5921303132182038e-06, + "loss": 0.4179, + "step": 9211 + }, + { + "epoch": 0.73, + "learning_rate": 3.5901605335578214e-06, + "loss": 0.2805, + "step": 9212 + }, + { + "epoch": 0.73, + "learning_rate": 3.5881911759545296e-06, + "loss": 0.4127, + "step": 9213 + }, + { + "epoch": 0.73, + "learning_rate": 3.5862222405379975e-06, + "loss": 0.2307, + "step": 9214 + }, + { + "epoch": 0.73, + "learning_rate": 3.584253727437866e-06, + "loss": 0.4153, + "step": 9215 + }, + { + "epoch": 0.73, + "learning_rate": 3.5822856367837587e-06, + "loss": 0.2865, + "step": 9216 + }, + { + "epoch": 0.73, + "learning_rate": 3.5803179687052636e-06, + "loss": 0.3333, + "step": 9217 + }, + { + "epoch": 0.73, + "learning_rate": 3.578350723331937e-06, + "loss": 0.2583, + "step": 9218 + }, + { + "epoch": 0.73, + "learning_rate": 3.5763839007933186e-06, + "loss": 0.3705, + "step": 9219 + }, + { + "epoch": 0.73, + "learning_rate": 3.574417501218913e-06, + "loss": 0.2716, + "step": 9220 + }, + { + "epoch": 0.73, + "learning_rate": 3.572451524738193e-06, + "loss": 0.4044, + "step": 9221 + }, + { + "epoch": 0.73, + "learning_rate": 3.5704859714806162e-06, + "loss": 0.3296, + "step": 9222 + }, + { + "epoch": 0.73, + "learning_rate": 3.568520841575601e-06, + "loss": 0.3764, + "step": 9223 + }, + { + "epoch": 0.73, + "learning_rate": 3.5665561351525423e-06, + "loss": 0.3512, + "step": 9224 + }, + { + "epoch": 0.73, + "learning_rate": 3.564591852340803e-06, + "loss": 0.3779, + "step": 9225 + }, + { + "epoch": 0.73, + "learning_rate": 3.562627993269728e-06, + "loss": 0.2659, + "step": 9226 + }, + { + "epoch": 0.73, + "learning_rate": 3.5606645580686262e-06, + "loss": 0.4378, + "step": 9227 + }, + { + "epoch": 0.73, + "learning_rate": 3.558701546866775e-06, + "loss": 0.3446, + "step": 9228 + }, + { + "epoch": 0.73, + "learning_rate": 3.5567389597934367e-06, + "loss": 0.3361, + "step": 9229 + }, + { + "epoch": 0.73, + "learning_rate": 3.5547767969778355e-06, + "loss": 0.2944, + "step": 9230 + }, + { + "epoch": 0.73, + "learning_rate": 3.5528150585491695e-06, + "loss": 0.3686, + "step": 9231 + }, + { + "epoch": 0.73, + "learning_rate": 3.5508537446366097e-06, + "loss": 0.3956, + "step": 9232 + }, + { + "epoch": 0.73, + "learning_rate": 3.548892855369299e-06, + "loss": 0.3685, + "step": 9233 + }, + { + "epoch": 0.73, + "learning_rate": 3.5469323908763507e-06, + "loss": 0.2669, + "step": 9234 + }, + { + "epoch": 0.73, + "learning_rate": 3.544972351286857e-06, + "loss": 0.4328, + "step": 9235 + }, + { + "epoch": 0.73, + "learning_rate": 3.543012736729875e-06, + "loss": 0.3671, + "step": 9236 + }, + { + "epoch": 0.73, + "learning_rate": 3.541053547334431e-06, + "loss": 0.3734, + "step": 9237 + }, + { + "epoch": 0.73, + "learning_rate": 3.5390947832295366e-06, + "loss": 0.2826, + "step": 9238 + }, + { + "epoch": 0.73, + "learning_rate": 3.5371364445441624e-06, + "loss": 0.4837, + "step": 9239 + }, + { + "epoch": 0.73, + "learning_rate": 3.535178531407253e-06, + "loss": 0.3569, + "step": 9240 + }, + { + "epoch": 0.73, + "learning_rate": 3.5332210439477334e-06, + "loss": 0.3223, + "step": 9241 + }, + { + "epoch": 0.73, + "learning_rate": 3.5312639822944917e-06, + "loss": 0.3092, + "step": 9242 + }, + { + "epoch": 0.73, + "learning_rate": 3.529307346576388e-06, + "loss": 0.4363, + "step": 9243 + }, + { + "epoch": 0.73, + "learning_rate": 3.527351136922265e-06, + "loss": 0.3629, + "step": 9244 + }, + { + "epoch": 0.73, + "learning_rate": 3.525395353460924e-06, + "loss": 0.3313, + "step": 9245 + }, + { + "epoch": 0.73, + "learning_rate": 3.5234399963211418e-06, + "loss": 0.2138, + "step": 9246 + }, + { + "epoch": 0.73, + "learning_rate": 3.521485065631677e-06, + "loss": 0.2826, + "step": 9247 + }, + { + "epoch": 0.73, + "learning_rate": 3.5195305615212473e-06, + "loss": 0.4121, + "step": 9248 + }, + { + "epoch": 0.73, + "learning_rate": 3.517576484118549e-06, + "loss": 0.3263, + "step": 9249 + }, + { + "epoch": 0.73, + "learning_rate": 3.5156228335522434e-06, + "loss": 0.451, + "step": 9250 + }, + { + "epoch": 0.73, + "learning_rate": 3.513669609950977e-06, + "loss": 0.3573, + "step": 9251 + }, + { + "epoch": 0.73, + "learning_rate": 3.5117168134433566e-06, + "loss": 0.4817, + "step": 9252 + }, + { + "epoch": 0.73, + "learning_rate": 3.5097644441579602e-06, + "loss": 0.4876, + "step": 9253 + }, + { + "epoch": 0.73, + "learning_rate": 3.507812502223351e-06, + "loss": 0.424, + "step": 9254 + }, + { + "epoch": 0.73, + "learning_rate": 3.5058609877680495e-06, + "loss": 0.3544, + "step": 9255 + }, + { + "epoch": 0.73, + "learning_rate": 3.5039099009205503e-06, + "loss": 0.2889, + "step": 9256 + }, + { + "epoch": 0.73, + "learning_rate": 3.5019592418093306e-06, + "loss": 0.2706, + "step": 9257 + }, + { + "epoch": 0.73, + "learning_rate": 3.5000090105628282e-06, + "loss": 0.3834, + "step": 9258 + }, + { + "epoch": 0.73, + "learning_rate": 3.4980592073094533e-06, + "loss": 0.3845, + "step": 9259 + }, + { + "epoch": 0.73, + "learning_rate": 3.4961098321775978e-06, + "loss": 0.2691, + "step": 9260 + }, + { + "epoch": 0.73, + "learning_rate": 3.4941608852956143e-06, + "loss": 0.3656, + "step": 9261 + }, + { + "epoch": 0.73, + "learning_rate": 3.4922123667918305e-06, + "loss": 0.3551, + "step": 9262 + }, + { + "epoch": 0.73, + "learning_rate": 3.4902642767945506e-06, + "loss": 0.3561, + "step": 9263 + }, + { + "epoch": 0.73, + "learning_rate": 3.488316615432047e-06, + "loss": 0.3787, + "step": 9264 + }, + { + "epoch": 0.73, + "learning_rate": 3.486369382832561e-06, + "loss": 0.2651, + "step": 9265 + }, + { + "epoch": 0.73, + "learning_rate": 3.484422579124306e-06, + "loss": 0.4861, + "step": 9266 + }, + { + "epoch": 0.73, + "learning_rate": 3.4824762044354763e-06, + "loss": 0.3417, + "step": 9267 + }, + { + "epoch": 0.73, + "learning_rate": 3.480530258894229e-06, + "loss": 0.4283, + "step": 9268 + }, + { + "epoch": 0.73, + "learning_rate": 3.478584742628691e-06, + "loss": 0.329, + "step": 9269 + }, + { + "epoch": 0.73, + "learning_rate": 3.4766396557669712e-06, + "loss": 0.3222, + "step": 9270 + }, + { + "epoch": 0.73, + "learning_rate": 3.4746949984371425e-06, + "loss": 0.3792, + "step": 9271 + }, + { + "epoch": 0.73, + "learning_rate": 3.472750770767247e-06, + "loss": 0.3758, + "step": 9272 + }, + { + "epoch": 0.73, + "learning_rate": 3.470806972885309e-06, + "loss": 0.3401, + "step": 9273 + }, + { + "epoch": 0.73, + "learning_rate": 3.468863604919316e-06, + "loss": 0.3693, + "step": 9274 + }, + { + "epoch": 0.73, + "learning_rate": 3.4669206669972254e-06, + "loss": 0.3246, + "step": 9275 + }, + { + "epoch": 0.73, + "learning_rate": 3.4649781592469765e-06, + "loss": 0.3187, + "step": 9276 + }, + { + "epoch": 0.73, + "learning_rate": 3.4630360817964715e-06, + "loss": 0.4438, + "step": 9277 + }, + { + "epoch": 0.74, + "learning_rate": 3.4610944347735864e-06, + "loss": 0.3939, + "step": 9278 + }, + { + "epoch": 0.74, + "learning_rate": 3.459153218306167e-06, + "loss": 0.3832, + "step": 9279 + }, + { + "epoch": 0.74, + "learning_rate": 3.457212432522038e-06, + "loss": 0.3386, + "step": 9280 + }, + { + "epoch": 0.74, + "learning_rate": 3.455272077548989e-06, + "loss": 0.4267, + "step": 9281 + }, + { + "epoch": 0.74, + "learning_rate": 3.453332153514779e-06, + "loss": 0.4181, + "step": 9282 + }, + { + "epoch": 0.74, + "learning_rate": 3.4513926605471504e-06, + "loss": 0.2843, + "step": 9283 + }, + { + "epoch": 0.74, + "learning_rate": 3.449453598773804e-06, + "loss": 0.2752, + "step": 9284 + }, + { + "epoch": 0.74, + "learning_rate": 3.4475149683224164e-06, + "loss": 0.3912, + "step": 9285 + }, + { + "epoch": 0.74, + "learning_rate": 3.445576769320642e-06, + "loss": 0.3647, + "step": 9286 + }, + { + "epoch": 0.74, + "learning_rate": 3.4436390018960997e-06, + "loss": 0.4686, + "step": 9287 + }, + { + "epoch": 0.74, + "learning_rate": 3.4417016661763793e-06, + "loss": 0.3564, + "step": 9288 + }, + { + "epoch": 0.74, + "learning_rate": 3.439764762289051e-06, + "loss": 0.318, + "step": 9289 + }, + { + "epoch": 0.74, + "learning_rate": 3.4378282903616457e-06, + "loss": 0.2981, + "step": 9290 + }, + { + "epoch": 0.74, + "learning_rate": 3.4358922505216707e-06, + "loss": 0.4217, + "step": 9291 + }, + { + "epoch": 0.74, + "learning_rate": 3.4339566428966086e-06, + "loss": 0.2503, + "step": 9292 + }, + { + "epoch": 0.74, + "learning_rate": 3.4320214676139087e-06, + "loss": 0.315, + "step": 9293 + }, + { + "epoch": 0.74, + "learning_rate": 3.4300867248009917e-06, + "loss": 0.3414, + "step": 9294 + }, + { + "epoch": 0.74, + "learning_rate": 3.4281524145852485e-06, + "loss": 0.3444, + "step": 9295 + }, + { + "epoch": 0.74, + "learning_rate": 3.4262185370940504e-06, + "loss": 0.2545, + "step": 9296 + }, + { + "epoch": 0.74, + "learning_rate": 3.4242850924547297e-06, + "loss": 0.2036, + "step": 9297 + }, + { + "epoch": 0.74, + "learning_rate": 3.422352080794593e-06, + "loss": 0.3221, + "step": 9298 + }, + { + "epoch": 0.74, + "learning_rate": 3.4204195022409247e-06, + "loss": 0.2927, + "step": 9299 + }, + { + "epoch": 0.74, + "learning_rate": 3.418487356920974e-06, + "loss": 0.3277, + "step": 9300 + }, + { + "epoch": 0.74, + "learning_rate": 3.4165556449619584e-06, + "loss": 0.3561, + "step": 9301 + }, + { + "epoch": 0.74, + "learning_rate": 3.4146243664910804e-06, + "loss": 0.2816, + "step": 9302 + }, + { + "epoch": 0.74, + "learning_rate": 3.4126935216355005e-06, + "loss": 0.3214, + "step": 9303 + }, + { + "epoch": 0.74, + "learning_rate": 3.4107631105223528e-06, + "loss": 0.3646, + "step": 9304 + }, + { + "epoch": 0.74, + "learning_rate": 3.4088331332787527e-06, + "loss": 0.4121, + "step": 9305 + }, + { + "epoch": 0.74, + "learning_rate": 3.406903590031776e-06, + "loss": 0.3073, + "step": 9306 + }, + { + "epoch": 0.74, + "learning_rate": 3.4049744809084697e-06, + "loss": 0.2699, + "step": 9307 + }, + { + "epoch": 0.74, + "learning_rate": 3.4030458060358682e-06, + "loss": 0.2949, + "step": 9308 + }, + { + "epoch": 0.74, + "learning_rate": 3.4011175655409546e-06, + "loss": 0.417, + "step": 9309 + }, + { + "epoch": 0.74, + "learning_rate": 3.399189759550694e-06, + "loss": 0.2549, + "step": 9310 + }, + { + "epoch": 0.74, + "learning_rate": 3.3972623881920296e-06, + "loss": 0.3205, + "step": 9311 + }, + { + "epoch": 0.74, + "learning_rate": 3.3953354515918667e-06, + "loss": 0.3412, + "step": 9312 + }, + { + "epoch": 0.74, + "learning_rate": 3.3934089498770816e-06, + "loss": 0.2966, + "step": 9313 + }, + { + "epoch": 0.74, + "learning_rate": 3.3914828831745306e-06, + "loss": 0.2937, + "step": 9314 + }, + { + "epoch": 0.74, + "learning_rate": 3.3895572516110353e-06, + "loss": 0.3213, + "step": 9315 + }, + { + "epoch": 0.74, + "learning_rate": 3.3876320553133834e-06, + "loss": 0.4012, + "step": 9316 + }, + { + "epoch": 0.74, + "learning_rate": 3.385707294408347e-06, + "loss": 0.3042, + "step": 9317 + }, + { + "epoch": 0.74, + "learning_rate": 3.38378296902266e-06, + "loss": 0.3338, + "step": 9318 + }, + { + "epoch": 0.74, + "learning_rate": 3.3818590792830285e-06, + "loss": 0.3045, + "step": 9319 + }, + { + "epoch": 0.74, + "learning_rate": 3.3799356253161288e-06, + "loss": 0.4593, + "step": 9320 + }, + { + "epoch": 0.74, + "learning_rate": 3.3780126072486188e-06, + "loss": 0.3249, + "step": 9321 + }, + { + "epoch": 0.74, + "learning_rate": 3.376090025207115e-06, + "loss": 0.4397, + "step": 9322 + }, + { + "epoch": 0.74, + "learning_rate": 3.3741678793182077e-06, + "loss": 0.3833, + "step": 9323 + }, + { + "epoch": 0.74, + "learning_rate": 3.372246169708466e-06, + "loss": 0.3405, + "step": 9324 + }, + { + "epoch": 0.74, + "learning_rate": 3.3703248965044253e-06, + "loss": 0.2264, + "step": 9325 + }, + { + "epoch": 0.74, + "learning_rate": 3.368404059832586e-06, + "loss": 0.453, + "step": 9326 + }, + { + "epoch": 0.74, + "learning_rate": 3.366483659819434e-06, + "loss": 0.3507, + "step": 9327 + }, + { + "epoch": 0.74, + "learning_rate": 3.364563696591414e-06, + "loss": 0.4052, + "step": 9328 + }, + { + "epoch": 0.74, + "learning_rate": 3.3626441702749436e-06, + "loss": 0.2735, + "step": 9329 + }, + { + "epoch": 0.74, + "learning_rate": 3.360725080996421e-06, + "loss": 0.357, + "step": 9330 + }, + { + "epoch": 0.74, + "learning_rate": 3.3588064288822055e-06, + "loss": 0.3967, + "step": 9331 + }, + { + "epoch": 0.74, + "learning_rate": 3.356888214058629e-06, + "loss": 0.3667, + "step": 9332 + }, + { + "epoch": 0.74, + "learning_rate": 3.354970436652001e-06, + "loss": 0.3043, + "step": 9333 + }, + { + "epoch": 0.74, + "learning_rate": 3.3530530967885964e-06, + "loss": 0.3189, + "step": 9334 + }, + { + "epoch": 0.74, + "learning_rate": 3.351136194594662e-06, + "loss": 0.2299, + "step": 9335 + }, + { + "epoch": 0.74, + "learning_rate": 3.3492197301964145e-06, + "loss": 0.2985, + "step": 9336 + }, + { + "epoch": 0.74, + "learning_rate": 3.3473037037200484e-06, + "loss": 0.4318, + "step": 9337 + }, + { + "epoch": 0.74, + "learning_rate": 3.345388115291723e-06, + "loss": 0.3423, + "step": 9338 + }, + { + "epoch": 0.74, + "learning_rate": 3.3434729650375675e-06, + "loss": 0.3522, + "step": 9339 + }, + { + "epoch": 0.74, + "learning_rate": 3.341558253083692e-06, + "loss": 0.3502, + "step": 9340 + }, + { + "epoch": 0.74, + "learning_rate": 3.3396439795561662e-06, + "loss": 0.446, + "step": 9341 + }, + { + "epoch": 0.74, + "learning_rate": 3.3377301445810327e-06, + "loss": 0.2107, + "step": 9342 + }, + { + "epoch": 0.74, + "learning_rate": 3.3358167482843173e-06, + "loss": 0.4185, + "step": 9343 + }, + { + "epoch": 0.74, + "learning_rate": 3.3339037907920024e-06, + "loss": 0.3311, + "step": 9344 + }, + { + "epoch": 0.74, + "learning_rate": 3.331991272230044e-06, + "loss": 0.2938, + "step": 9345 + }, + { + "epoch": 0.74, + "learning_rate": 3.330079192724379e-06, + "loss": 0.3911, + "step": 9346 + }, + { + "epoch": 0.74, + "learning_rate": 3.328167552400906e-06, + "loss": 0.3112, + "step": 9347 + }, + { + "epoch": 0.74, + "learning_rate": 3.326256351385494e-06, + "loss": 0.3364, + "step": 9348 + }, + { + "epoch": 0.74, + "learning_rate": 3.324345589803991e-06, + "loss": 0.2803, + "step": 9349 + }, + { + "epoch": 0.74, + "learning_rate": 3.3224352677822115e-06, + "loss": 0.2501, + "step": 9350 + }, + { + "epoch": 0.74, + "learning_rate": 3.3205253854459386e-06, + "loss": 0.2638, + "step": 9351 + }, + { + "epoch": 0.74, + "learning_rate": 3.3186159429209263e-06, + "loss": 0.2798, + "step": 9352 + }, + { + "epoch": 0.74, + "learning_rate": 3.316706940332908e-06, + "loss": 0.3465, + "step": 9353 + }, + { + "epoch": 0.74, + "learning_rate": 3.314798377807581e-06, + "loss": 0.4053, + "step": 9354 + }, + { + "epoch": 0.74, + "learning_rate": 3.312890255470609e-06, + "loss": 0.3701, + "step": 9355 + }, + { + "epoch": 0.74, + "learning_rate": 3.3109825734476407e-06, + "loss": 0.3701, + "step": 9356 + }, + { + "epoch": 0.74, + "learning_rate": 3.3090753318642855e-06, + "loss": 0.3569, + "step": 9357 + }, + { + "epoch": 0.74, + "learning_rate": 3.307168530846121e-06, + "loss": 0.2901, + "step": 9358 + }, + { + "epoch": 0.74, + "learning_rate": 3.3052621705187083e-06, + "loss": 0.2494, + "step": 9359 + }, + { + "epoch": 0.74, + "learning_rate": 3.303356251007569e-06, + "loss": 0.4365, + "step": 9360 + }, + { + "epoch": 0.74, + "learning_rate": 3.301450772438195e-06, + "loss": 0.3066, + "step": 9361 + }, + { + "epoch": 0.74, + "learning_rate": 3.2995457349360595e-06, + "loss": 0.3239, + "step": 9362 + }, + { + "epoch": 0.74, + "learning_rate": 3.297641138626597e-06, + "loss": 0.4303, + "step": 9363 + }, + { + "epoch": 0.74, + "learning_rate": 3.295736983635215e-06, + "loss": 0.411, + "step": 9364 + }, + { + "epoch": 0.74, + "learning_rate": 3.293833270087291e-06, + "loss": 0.2941, + "step": 9365 + }, + { + "epoch": 0.74, + "learning_rate": 3.291929998108182e-06, + "loss": 0.3329, + "step": 9366 + }, + { + "epoch": 0.74, + "learning_rate": 3.2900271678232045e-06, + "loss": 0.3707, + "step": 9367 + }, + { + "epoch": 0.74, + "learning_rate": 3.2881247793576488e-06, + "loss": 0.3693, + "step": 9368 + }, + { + "epoch": 0.74, + "learning_rate": 3.286222832836784e-06, + "loss": 0.4122, + "step": 9369 + }, + { + "epoch": 0.74, + "learning_rate": 3.284321328385842e-06, + "loss": 0.225, + "step": 9370 + }, + { + "epoch": 0.74, + "learning_rate": 3.282420266130022e-06, + "loss": 0.2821, + "step": 9371 + }, + { + "epoch": 0.74, + "learning_rate": 3.280519646194509e-06, + "loss": 0.3791, + "step": 9372 + }, + { + "epoch": 0.74, + "learning_rate": 3.278619468704445e-06, + "loss": 0.3292, + "step": 9373 + }, + { + "epoch": 0.74, + "learning_rate": 3.276719733784943e-06, + "loss": 0.3007, + "step": 9374 + }, + { + "epoch": 0.74, + "learning_rate": 3.2748204415611016e-06, + "loss": 0.3041, + "step": 9375 + }, + { + "epoch": 0.74, + "learning_rate": 3.2729215921579738e-06, + "loss": 0.3626, + "step": 9376 + }, + { + "epoch": 0.74, + "learning_rate": 3.271023185700587e-06, + "loss": 0.3891, + "step": 9377 + }, + { + "epoch": 0.74, + "learning_rate": 3.269125222313949e-06, + "loss": 0.467, + "step": 9378 + }, + { + "epoch": 0.74, + "learning_rate": 3.2672277021230283e-06, + "loss": 0.2877, + "step": 9379 + }, + { + "epoch": 0.74, + "learning_rate": 3.2653306252527673e-06, + "loss": 0.2857, + "step": 9380 + }, + { + "epoch": 0.74, + "learning_rate": 3.2634339918280765e-06, + "loss": 0.3995, + "step": 9381 + }, + { + "epoch": 0.74, + "learning_rate": 3.2615378019738455e-06, + "loss": 0.3691, + "step": 9382 + }, + { + "epoch": 0.74, + "learning_rate": 3.2596420558149277e-06, + "loss": 0.3539, + "step": 9383 + }, + { + "epoch": 0.74, + "learning_rate": 3.257746753476144e-06, + "loss": 0.4089, + "step": 9384 + }, + { + "epoch": 0.74, + "learning_rate": 3.255851895082299e-06, + "loss": 0.3331, + "step": 9385 + }, + { + "epoch": 0.74, + "learning_rate": 3.2539574807581555e-06, + "loss": 0.4381, + "step": 9386 + }, + { + "epoch": 0.74, + "learning_rate": 3.2520635106284516e-06, + "loss": 0.3219, + "step": 9387 + }, + { + "epoch": 0.74, + "learning_rate": 3.250169984817897e-06, + "loss": 0.4481, + "step": 9388 + }, + { + "epoch": 0.74, + "learning_rate": 3.248276903451171e-06, + "loss": 0.361, + "step": 9389 + }, + { + "epoch": 0.74, + "learning_rate": 3.24638426665292e-06, + "loss": 0.4268, + "step": 9390 + }, + { + "epoch": 0.74, + "learning_rate": 3.2444920745477727e-06, + "loss": 0.3647, + "step": 9391 + }, + { + "epoch": 0.74, + "learning_rate": 3.2426003272603158e-06, + "loss": 0.3939, + "step": 9392 + }, + { + "epoch": 0.74, + "learning_rate": 3.2407090249151105e-06, + "loss": 0.3039, + "step": 9393 + }, + { + "epoch": 0.74, + "learning_rate": 3.238818167636695e-06, + "loss": 0.3224, + "step": 9394 + }, + { + "epoch": 0.74, + "learning_rate": 3.2369277555495705e-06, + "loss": 0.3251, + "step": 9395 + }, + { + "epoch": 0.74, + "learning_rate": 3.235037788778208e-06, + "loss": 0.3351, + "step": 9396 + }, + { + "epoch": 0.74, + "learning_rate": 3.2331482674470605e-06, + "loss": 0.3688, + "step": 9397 + }, + { + "epoch": 0.74, + "learning_rate": 3.2312591916805382e-06, + "loss": 0.3583, + "step": 9398 + }, + { + "epoch": 0.74, + "learning_rate": 3.2293705616030267e-06, + "loss": 0.2242, + "step": 9399 + }, + { + "epoch": 0.74, + "learning_rate": 3.2274823773388885e-06, + "loss": 0.3151, + "step": 9400 + }, + { + "epoch": 0.74, + "learning_rate": 3.2255946390124482e-06, + "loss": 0.2922, + "step": 9401 + }, + { + "epoch": 0.74, + "learning_rate": 3.223707346748002e-06, + "loss": 0.2684, + "step": 9402 + }, + { + "epoch": 0.74, + "learning_rate": 3.221820500669823e-06, + "loss": 0.3991, + "step": 9403 + }, + { + "epoch": 0.75, + "learning_rate": 3.2199341009021514e-06, + "loss": 0.4486, + "step": 9404 + }, + { + "epoch": 0.75, + "learning_rate": 3.218048147569195e-06, + "loss": 0.4792, + "step": 9405 + }, + { + "epoch": 0.75, + "learning_rate": 3.216162640795133e-06, + "loss": 0.2969, + "step": 9406 + }, + { + "epoch": 0.75, + "learning_rate": 3.2142775807041214e-06, + "loss": 0.3712, + "step": 9407 + }, + { + "epoch": 0.75, + "learning_rate": 3.2123929674202816e-06, + "loss": 0.3895, + "step": 9408 + }, + { + "epoch": 0.75, + "learning_rate": 3.2105088010677e-06, + "loss": 0.383, + "step": 9409 + }, + { + "epoch": 0.75, + "learning_rate": 3.2086250817704488e-06, + "loss": 0.3759, + "step": 9410 + }, + { + "epoch": 0.75, + "learning_rate": 3.2067418096525593e-06, + "loss": 0.4051, + "step": 9411 + }, + { + "epoch": 0.75, + "learning_rate": 3.2048589848380297e-06, + "loss": 0.3771, + "step": 9412 + }, + { + "epoch": 0.75, + "learning_rate": 3.202976607450844e-06, + "loss": 0.2758, + "step": 9413 + }, + { + "epoch": 0.75, + "learning_rate": 3.201094677614943e-06, + "loss": 0.4438, + "step": 9414 + }, + { + "epoch": 0.75, + "learning_rate": 3.1992131954542404e-06, + "loss": 0.4472, + "step": 9415 + }, + { + "epoch": 0.75, + "learning_rate": 3.1973321610926277e-06, + "loss": 0.4277, + "step": 9416 + }, + { + "epoch": 0.75, + "learning_rate": 3.1954515746539616e-06, + "loss": 0.3535, + "step": 9417 + }, + { + "epoch": 0.75, + "learning_rate": 3.193571436262064e-06, + "loss": 0.3299, + "step": 9418 + }, + { + "epoch": 0.75, + "learning_rate": 3.191691746040739e-06, + "loss": 0.259, + "step": 9419 + }, + { + "epoch": 0.75, + "learning_rate": 3.189812504113754e-06, + "loss": 0.2606, + "step": 9420 + }, + { + "epoch": 0.75, + "learning_rate": 3.187933710604847e-06, + "loss": 0.391, + "step": 9421 + }, + { + "epoch": 0.75, + "learning_rate": 3.186055365637725e-06, + "loss": 0.2952, + "step": 9422 + }, + { + "epoch": 0.75, + "learning_rate": 3.184177469336073e-06, + "loss": 0.3632, + "step": 9423 + }, + { + "epoch": 0.75, + "learning_rate": 3.1823000218235388e-06, + "loss": 0.3578, + "step": 9424 + }, + { + "epoch": 0.75, + "learning_rate": 3.180423023223741e-06, + "loss": 0.3186, + "step": 9425 + }, + { + "epoch": 0.75, + "learning_rate": 3.1785464736602754e-06, + "loss": 0.4236, + "step": 9426 + }, + { + "epoch": 0.75, + "learning_rate": 3.1766703732567027e-06, + "loss": 0.3956, + "step": 9427 + }, + { + "epoch": 0.75, + "learning_rate": 3.1747947221365517e-06, + "loss": 0.3283, + "step": 9428 + }, + { + "epoch": 0.75, + "learning_rate": 3.17291952042333e-06, + "loss": 0.2827, + "step": 9429 + }, + { + "epoch": 0.75, + "learning_rate": 3.171044768240508e-06, + "loss": 0.4487, + "step": 9430 + }, + { + "epoch": 0.75, + "learning_rate": 3.169170465711525e-06, + "loss": 0.4489, + "step": 9431 + }, + { + "epoch": 0.75, + "learning_rate": 3.167296612959803e-06, + "loss": 0.257, + "step": 9432 + }, + { + "epoch": 0.75, + "learning_rate": 3.1654232101087225e-06, + "loss": 0.5169, + "step": 9433 + }, + { + "epoch": 0.75, + "learning_rate": 3.1635502572816333e-06, + "loss": 0.2566, + "step": 9434 + }, + { + "epoch": 0.75, + "learning_rate": 3.1616777546018696e-06, + "loss": 0.2953, + "step": 9435 + }, + { + "epoch": 0.75, + "learning_rate": 3.1598057021927207e-06, + "loss": 0.2978, + "step": 9436 + }, + { + "epoch": 0.75, + "learning_rate": 3.1579341001774546e-06, + "loss": 0.2582, + "step": 9437 + }, + { + "epoch": 0.75, + "learning_rate": 3.1560629486793014e-06, + "loss": 0.2674, + "step": 9438 + }, + { + "epoch": 0.75, + "learning_rate": 3.154192247821476e-06, + "loss": 0.4378, + "step": 9439 + }, + { + "epoch": 0.75, + "learning_rate": 3.1523219977271515e-06, + "loss": 0.3112, + "step": 9440 + }, + { + "epoch": 0.75, + "learning_rate": 3.1504521985194715e-06, + "loss": 0.4393, + "step": 9441 + }, + { + "epoch": 0.75, + "learning_rate": 3.1485828503215588e-06, + "loss": 0.3832, + "step": 9442 + }, + { + "epoch": 0.75, + "learning_rate": 3.1467139532564985e-06, + "loss": 0.2693, + "step": 9443 + }, + { + "epoch": 0.75, + "learning_rate": 3.144845507447345e-06, + "loss": 0.2712, + "step": 9444 + }, + { + "epoch": 0.75, + "learning_rate": 3.1429775130171337e-06, + "loss": 0.4154, + "step": 9445 + }, + { + "epoch": 0.75, + "learning_rate": 3.141109970088859e-06, + "loss": 0.3627, + "step": 9446 + }, + { + "epoch": 0.75, + "learning_rate": 3.1392428787854865e-06, + "loss": 0.3005, + "step": 9447 + }, + { + "epoch": 0.75, + "learning_rate": 3.1373762392299632e-06, + "loss": 0.3822, + "step": 9448 + }, + { + "epoch": 0.75, + "learning_rate": 3.135510051545192e-06, + "loss": 0.4045, + "step": 9449 + }, + { + "epoch": 0.75, + "learning_rate": 3.133644315854055e-06, + "loss": 0.3328, + "step": 9450 + }, + { + "epoch": 0.75, + "learning_rate": 3.131779032279397e-06, + "loss": 0.3754, + "step": 9451 + }, + { + "epoch": 0.75, + "learning_rate": 3.1299142009440463e-06, + "loss": 0.3713, + "step": 9452 + }, + { + "epoch": 0.75, + "learning_rate": 3.1280498219707876e-06, + "loss": 0.4234, + "step": 9453 + }, + { + "epoch": 0.75, + "learning_rate": 3.1261858954823798e-06, + "loss": 0.3599, + "step": 9454 + }, + { + "epoch": 0.75, + "learning_rate": 3.12432242160156e-06, + "loss": 0.2933, + "step": 9455 + }, + { + "epoch": 0.75, + "learning_rate": 3.1224594004510246e-06, + "loss": 0.351, + "step": 9456 + }, + { + "epoch": 0.75, + "learning_rate": 3.1205968321534406e-06, + "loss": 0.2861, + "step": 9457 + }, + { + "epoch": 0.75, + "learning_rate": 3.1187347168314586e-06, + "loss": 0.3211, + "step": 9458 + }, + { + "epoch": 0.75, + "learning_rate": 3.1168730546076844e-06, + "loss": 0.3184, + "step": 9459 + }, + { + "epoch": 0.75, + "learning_rate": 3.1150118456046963e-06, + "loss": 0.3131, + "step": 9460 + }, + { + "epoch": 0.75, + "learning_rate": 3.1131510899450533e-06, + "loss": 0.3546, + "step": 9461 + }, + { + "epoch": 0.75, + "learning_rate": 3.1112907877512732e-06, + "loss": 0.3487, + "step": 9462 + }, + { + "epoch": 0.75, + "learning_rate": 3.1094309391458455e-06, + "loss": 0.4239, + "step": 9463 + }, + { + "epoch": 0.75, + "learning_rate": 3.107571544251241e-06, + "loss": 0.4704, + "step": 9464 + }, + { + "epoch": 0.75, + "learning_rate": 3.1057126031898843e-06, + "loss": 0.2992, + "step": 9465 + }, + { + "epoch": 0.75, + "learning_rate": 3.1038541160841752e-06, + "loss": 0.2157, + "step": 9466 + }, + { + "epoch": 0.75, + "learning_rate": 3.1019960830564945e-06, + "loss": 0.2859, + "step": 9467 + }, + { + "epoch": 0.75, + "learning_rate": 3.1001385042291797e-06, + "loss": 0.3781, + "step": 9468 + }, + { + "epoch": 0.75, + "learning_rate": 3.0982813797245413e-06, + "loss": 0.4546, + "step": 9469 + }, + { + "epoch": 0.75, + "learning_rate": 3.096424709664868e-06, + "loss": 0.4021, + "step": 9470 + }, + { + "epoch": 0.75, + "learning_rate": 3.094568494172411e-06, + "loss": 0.3259, + "step": 9471 + }, + { + "epoch": 0.75, + "learning_rate": 3.0927127333693872e-06, + "loss": 0.3373, + "step": 9472 + }, + { + "epoch": 0.75, + "learning_rate": 3.090857427377998e-06, + "loss": 0.3532, + "step": 9473 + }, + { + "epoch": 0.75, + "learning_rate": 3.0890025763204025e-06, + "loss": 0.4042, + "step": 9474 + }, + { + "epoch": 0.75, + "learning_rate": 3.087148180318734e-06, + "loss": 0.2648, + "step": 9475 + }, + { + "epoch": 0.75, + "learning_rate": 3.0852942394950915e-06, + "loss": 0.3829, + "step": 9476 + }, + { + "epoch": 0.75, + "learning_rate": 3.083440753971556e-06, + "loss": 0.2699, + "step": 9477 + }, + { + "epoch": 0.75, + "learning_rate": 3.0815877238701653e-06, + "loss": 0.3614, + "step": 9478 + }, + { + "epoch": 0.75, + "learning_rate": 3.079735149312931e-06, + "loss": 0.4007, + "step": 9479 + }, + { + "epoch": 0.75, + "learning_rate": 3.077883030421843e-06, + "loss": 0.2768, + "step": 9480 + }, + { + "epoch": 0.75, + "learning_rate": 3.0760313673188493e-06, + "loss": 0.3694, + "step": 9481 + }, + { + "epoch": 0.75, + "learning_rate": 3.0741801601258714e-06, + "loss": 0.3022, + "step": 9482 + }, + { + "epoch": 0.75, + "learning_rate": 3.072329408964808e-06, + "loss": 0.2869, + "step": 9483 + }, + { + "epoch": 0.75, + "learning_rate": 3.0704791139575195e-06, + "loss": 0.2161, + "step": 9484 + }, + { + "epoch": 0.75, + "learning_rate": 3.0686292752258352e-06, + "loss": 0.3573, + "step": 9485 + }, + { + "epoch": 0.75, + "learning_rate": 3.066779892891564e-06, + "loss": 0.3234, + "step": 9486 + }, + { + "epoch": 0.75, + "learning_rate": 3.064930967076477e-06, + "loss": 0.2543, + "step": 9487 + }, + { + "epoch": 0.75, + "learning_rate": 3.063082497902313e-06, + "loss": 0.3473, + "step": 9488 + }, + { + "epoch": 0.75, + "learning_rate": 3.0612344854907917e-06, + "loss": 0.3582, + "step": 9489 + }, + { + "epoch": 0.75, + "learning_rate": 3.0593869299635925e-06, + "loss": 0.3261, + "step": 9490 + }, + { + "epoch": 0.75, + "learning_rate": 3.0575398314423677e-06, + "loss": 0.4154, + "step": 9491 + }, + { + "epoch": 0.75, + "learning_rate": 3.0556931900487365e-06, + "loss": 0.2326, + "step": 9492 + }, + { + "epoch": 0.75, + "learning_rate": 3.053847005904298e-06, + "loss": 0.4461, + "step": 9493 + }, + { + "epoch": 0.75, + "learning_rate": 3.052001279130612e-06, + "loss": 0.4163, + "step": 9494 + }, + { + "epoch": 0.75, + "learning_rate": 3.0501560098492056e-06, + "loss": 0.4178, + "step": 9495 + }, + { + "epoch": 0.75, + "learning_rate": 3.0483111981815906e-06, + "loss": 0.3449, + "step": 9496 + }, + { + "epoch": 0.75, + "learning_rate": 3.046466844249232e-06, + "loss": 0.3038, + "step": 9497 + }, + { + "epoch": 0.75, + "learning_rate": 3.0446229481735713e-06, + "loss": 0.4211, + "step": 9498 + }, + { + "epoch": 0.75, + "learning_rate": 3.042779510076025e-06, + "loss": 0.3102, + "step": 9499 + }, + { + "epoch": 0.75, + "learning_rate": 3.0409365300779725e-06, + "loss": 0.3651, + "step": 9500 + }, + { + "epoch": 0.75, + "learning_rate": 3.039094008300761e-06, + "loss": 0.2825, + "step": 9501 + }, + { + "epoch": 0.75, + "learning_rate": 3.0372519448657188e-06, + "loss": 0.3035, + "step": 9502 + }, + { + "epoch": 0.75, + "learning_rate": 3.0354103398941327e-06, + "loss": 0.3077, + "step": 9503 + }, + { + "epoch": 0.75, + "learning_rate": 3.0335691935072618e-06, + "loss": 0.3839, + "step": 9504 + }, + { + "epoch": 0.75, + "learning_rate": 3.0317285058263426e-06, + "loss": 0.3595, + "step": 9505 + }, + { + "epoch": 0.75, + "learning_rate": 3.029888276972571e-06, + "loss": 0.423, + "step": 9506 + }, + { + "epoch": 0.75, + "learning_rate": 3.0280485070671197e-06, + "loss": 0.4112, + "step": 9507 + }, + { + "epoch": 0.75, + "learning_rate": 3.0262091962311234e-06, + "loss": 0.2934, + "step": 9508 + }, + { + "epoch": 0.75, + "learning_rate": 3.0243703445856985e-06, + "loss": 0.3043, + "step": 9509 + }, + { + "epoch": 0.75, + "learning_rate": 3.0225319522519226e-06, + "loss": 0.2763, + "step": 9510 + }, + { + "epoch": 0.75, + "learning_rate": 3.0206940193508404e-06, + "loss": 0.2953, + "step": 9511 + }, + { + "epoch": 0.75, + "learning_rate": 3.018856546003479e-06, + "loss": 0.3377, + "step": 9512 + }, + { + "epoch": 0.75, + "learning_rate": 3.0170195323308216e-06, + "loss": 0.3542, + "step": 9513 + }, + { + "epoch": 0.75, + "learning_rate": 3.0151829784538257e-06, + "loss": 0.4486, + "step": 9514 + }, + { + "epoch": 0.75, + "learning_rate": 3.0133468844934245e-06, + "loss": 0.3888, + "step": 9515 + }, + { + "epoch": 0.75, + "learning_rate": 3.0115112505705134e-06, + "loss": 0.34, + "step": 9516 + }, + { + "epoch": 0.75, + "learning_rate": 3.0096760768059576e-06, + "loss": 0.3176, + "step": 9517 + }, + { + "epoch": 0.75, + "learning_rate": 3.0078413633205995e-06, + "loss": 0.2884, + "step": 9518 + }, + { + "epoch": 0.75, + "learning_rate": 3.0060071102352438e-06, + "loss": 0.3984, + "step": 9519 + }, + { + "epoch": 0.75, + "learning_rate": 3.0041733176706668e-06, + "loss": 0.3684, + "step": 9520 + }, + { + "epoch": 0.75, + "learning_rate": 3.002339985747611e-06, + "loss": 0.3709, + "step": 9521 + }, + { + "epoch": 0.75, + "learning_rate": 3.0005071145868004e-06, + "loss": 0.3277, + "step": 9522 + }, + { + "epoch": 0.75, + "learning_rate": 2.998674704308917e-06, + "loss": 0.3279, + "step": 9523 + }, + { + "epoch": 0.75, + "learning_rate": 2.9968427550346136e-06, + "loss": 0.3645, + "step": 9524 + }, + { + "epoch": 0.75, + "learning_rate": 2.9950112668845198e-06, + "loss": 0.2854, + "step": 9525 + }, + { + "epoch": 0.75, + "learning_rate": 2.9931802399792285e-06, + "loss": 0.3934, + "step": 9526 + }, + { + "epoch": 0.75, + "learning_rate": 2.9913496744393e-06, + "loss": 0.3652, + "step": 9527 + }, + { + "epoch": 0.75, + "learning_rate": 2.9895195703852763e-06, + "loss": 0.315, + "step": 9528 + }, + { + "epoch": 0.75, + "learning_rate": 2.987689927937656e-06, + "loss": 0.4005, + "step": 9529 + }, + { + "epoch": 0.76, + "learning_rate": 2.98586074721691e-06, + "loss": 0.3609, + "step": 9530 + }, + { + "epoch": 0.76, + "learning_rate": 2.9840320283434865e-06, + "loss": 0.4062, + "step": 9531 + }, + { + "epoch": 0.76, + "learning_rate": 2.982203771437796e-06, + "loss": 0.4446, + "step": 9532 + }, + { + "epoch": 0.76, + "learning_rate": 2.9803759766202157e-06, + "loss": 0.3579, + "step": 9533 + }, + { + "epoch": 0.76, + "learning_rate": 2.9785486440111044e-06, + "loss": 0.3912, + "step": 9534 + }, + { + "epoch": 0.76, + "learning_rate": 2.9767217737307805e-06, + "loss": 0.2922, + "step": 9535 + }, + { + "epoch": 0.76, + "learning_rate": 2.974895365899534e-06, + "loss": 0.3956, + "step": 9536 + }, + { + "epoch": 0.76, + "learning_rate": 2.973069420637621e-06, + "loss": 0.2709, + "step": 9537 + }, + { + "epoch": 0.76, + "learning_rate": 2.971243938065279e-06, + "loss": 0.3933, + "step": 9538 + }, + { + "epoch": 0.76, + "learning_rate": 2.9694189183027034e-06, + "loss": 0.2705, + "step": 9539 + }, + { + "epoch": 0.76, + "learning_rate": 2.9675943614700588e-06, + "loss": 0.3114, + "step": 9540 + }, + { + "epoch": 0.76, + "learning_rate": 2.965770267687492e-06, + "loss": 0.3371, + "step": 9541 + }, + { + "epoch": 0.76, + "learning_rate": 2.963946637075107e-06, + "loss": 0.302, + "step": 9542 + }, + { + "epoch": 0.76, + "learning_rate": 2.9621234697529787e-06, + "loss": 0.3742, + "step": 9543 + }, + { + "epoch": 0.76, + "learning_rate": 2.9603007658411575e-06, + "loss": 0.3287, + "step": 9544 + }, + { + "epoch": 0.76, + "learning_rate": 2.958478525459657e-06, + "loss": 0.2846, + "step": 9545 + }, + { + "epoch": 0.76, + "learning_rate": 2.9566567487284613e-06, + "loss": 0.4347, + "step": 9546 + }, + { + "epoch": 0.76, + "learning_rate": 2.9548354357675325e-06, + "loss": 0.2836, + "step": 9547 + }, + { + "epoch": 0.76, + "learning_rate": 2.9530145866967897e-06, + "loss": 0.2995, + "step": 9548 + }, + { + "epoch": 0.76, + "learning_rate": 2.951194201636125e-06, + "loss": 0.375, + "step": 9549 + }, + { + "epoch": 0.76, + "learning_rate": 2.9493742807054094e-06, + "loss": 0.413, + "step": 9550 + }, + { + "epoch": 0.76, + "learning_rate": 2.947554824024472e-06, + "loss": 0.3989, + "step": 9551 + }, + { + "epoch": 0.76, + "learning_rate": 2.9457358317131125e-06, + "loss": 0.3561, + "step": 9552 + }, + { + "epoch": 0.76, + "learning_rate": 2.943917303891107e-06, + "loss": 0.3811, + "step": 9553 + }, + { + "epoch": 0.76, + "learning_rate": 2.942099240678197e-06, + "loss": 0.4479, + "step": 9554 + }, + { + "epoch": 0.76, + "learning_rate": 2.940281642194087e-06, + "loss": 0.3275, + "step": 9555 + }, + { + "epoch": 0.76, + "learning_rate": 2.938464508558466e-06, + "loss": 0.3332, + "step": 9556 + }, + { + "epoch": 0.76, + "learning_rate": 2.936647839890979e-06, + "loss": 0.3152, + "step": 9557 + }, + { + "epoch": 0.76, + "learning_rate": 2.9348316363112417e-06, + "loss": 0.304, + "step": 9558 + }, + { + "epoch": 0.76, + "learning_rate": 2.933015897938849e-06, + "loss": 0.4631, + "step": 9559 + }, + { + "epoch": 0.76, + "learning_rate": 2.9312006248933543e-06, + "loss": 0.4456, + "step": 9560 + }, + { + "epoch": 0.76, + "learning_rate": 2.9293858172942867e-06, + "loss": 0.2622, + "step": 9561 + }, + { + "epoch": 0.76, + "learning_rate": 2.9275714752611383e-06, + "loss": 0.3464, + "step": 9562 + }, + { + "epoch": 0.76, + "learning_rate": 2.9257575989133803e-06, + "loss": 0.3656, + "step": 9563 + }, + { + "epoch": 0.76, + "learning_rate": 2.9239441883704455e-06, + "loss": 0.3541, + "step": 9564 + }, + { + "epoch": 0.76, + "learning_rate": 2.9221312437517357e-06, + "loss": 0.4349, + "step": 9565 + }, + { + "epoch": 0.76, + "learning_rate": 2.9203187651766297e-06, + "loss": 0.3307, + "step": 9566 + }, + { + "epoch": 0.76, + "learning_rate": 2.918506752764467e-06, + "loss": 0.3778, + "step": 9567 + }, + { + "epoch": 0.76, + "learning_rate": 2.916695206634558e-06, + "loss": 0.3351, + "step": 9568 + }, + { + "epoch": 0.76, + "learning_rate": 2.91488412690619e-06, + "loss": 0.345, + "step": 9569 + }, + { + "epoch": 0.76, + "learning_rate": 2.913073513698611e-06, + "loss": 0.3026, + "step": 9570 + }, + { + "epoch": 0.76, + "learning_rate": 2.9112633671310387e-06, + "loss": 0.2162, + "step": 9571 + }, + { + "epoch": 0.76, + "learning_rate": 2.9094536873226663e-06, + "loss": 0.3057, + "step": 9572 + }, + { + "epoch": 0.76, + "learning_rate": 2.9076444743926524e-06, + "loss": 0.4514, + "step": 9573 + }, + { + "epoch": 0.76, + "learning_rate": 2.9058357284601204e-06, + "loss": 0.3437, + "step": 9574 + }, + { + "epoch": 0.76, + "learning_rate": 2.9040274496441732e-06, + "loss": 0.37, + "step": 9575 + }, + { + "epoch": 0.76, + "learning_rate": 2.902219638063876e-06, + "loss": 0.35, + "step": 9576 + }, + { + "epoch": 0.76, + "learning_rate": 2.9004122938382617e-06, + "loss": 0.3685, + "step": 9577 + }, + { + "epoch": 0.76, + "learning_rate": 2.8986054170863344e-06, + "loss": 0.3007, + "step": 9578 + }, + { + "epoch": 0.76, + "learning_rate": 2.8967990079270736e-06, + "loss": 0.3161, + "step": 9579 + }, + { + "epoch": 0.76, + "learning_rate": 2.89499306647942e-06, + "loss": 0.3861, + "step": 9580 + }, + { + "epoch": 0.76, + "learning_rate": 2.8931875928622833e-06, + "loss": 0.3134, + "step": 9581 + }, + { + "epoch": 0.76, + "learning_rate": 2.89138258719455e-06, + "loss": 0.3917, + "step": 9582 + }, + { + "epoch": 0.76, + "learning_rate": 2.8895780495950687e-06, + "loss": 0.3551, + "step": 9583 + }, + { + "epoch": 0.76, + "learning_rate": 2.8877739801826577e-06, + "loss": 0.4045, + "step": 9584 + }, + { + "epoch": 0.76, + "learning_rate": 2.8859703790761095e-06, + "loss": 0.2705, + "step": 9585 + }, + { + "epoch": 0.76, + "learning_rate": 2.8841672463941827e-06, + "loss": 0.3583, + "step": 9586 + }, + { + "epoch": 0.76, + "learning_rate": 2.8823645822556e-06, + "loss": 0.3411, + "step": 9587 + }, + { + "epoch": 0.76, + "learning_rate": 2.8805623867790655e-06, + "loss": 0.3382, + "step": 9588 + }, + { + "epoch": 0.76, + "learning_rate": 2.8787606600832408e-06, + "loss": 0.3503, + "step": 9589 + }, + { + "epoch": 0.76, + "learning_rate": 2.876959402286759e-06, + "loss": 0.2645, + "step": 9590 + }, + { + "epoch": 0.76, + "learning_rate": 2.8751586135082275e-06, + "loss": 0.4255, + "step": 9591 + }, + { + "epoch": 0.76, + "learning_rate": 2.873358293866221e-06, + "loss": 0.3298, + "step": 9592 + }, + { + "epoch": 0.76, + "learning_rate": 2.8715584434792786e-06, + "loss": 0.3635, + "step": 9593 + }, + { + "epoch": 0.76, + "learning_rate": 2.86975906246591e-06, + "loss": 0.3228, + "step": 9594 + }, + { + "epoch": 0.76, + "learning_rate": 2.867960150944602e-06, + "loss": 0.3483, + "step": 9595 + }, + { + "epoch": 0.76, + "learning_rate": 2.8661617090338e-06, + "loss": 0.334, + "step": 9596 + }, + { + "epoch": 0.76, + "learning_rate": 2.864363736851922e-06, + "loss": 0.3795, + "step": 9597 + }, + { + "epoch": 0.76, + "learning_rate": 2.86256623451736e-06, + "loss": 0.2853, + "step": 9598 + }, + { + "epoch": 0.76, + "learning_rate": 2.860769202148468e-06, + "loss": 0.2994, + "step": 9599 + }, + { + "epoch": 0.76, + "learning_rate": 2.8589726398635688e-06, + "loss": 0.3356, + "step": 9600 + }, + { + "epoch": 0.76, + "learning_rate": 2.8571765477809645e-06, + "loss": 0.3613, + "step": 9601 + }, + { + "epoch": 0.76, + "learning_rate": 2.8553809260189145e-06, + "loss": 0.3238, + "step": 9602 + }, + { + "epoch": 0.76, + "learning_rate": 2.8535857746956507e-06, + "loss": 0.275, + "step": 9603 + }, + { + "epoch": 0.76, + "learning_rate": 2.8517910939293804e-06, + "loss": 0.3068, + "step": 9604 + }, + { + "epoch": 0.76, + "learning_rate": 2.849996883838271e-06, + "loss": 0.3102, + "step": 9605 + }, + { + "epoch": 0.76, + "learning_rate": 2.8482031445404634e-06, + "loss": 0.3446, + "step": 9606 + }, + { + "epoch": 0.76, + "learning_rate": 2.8464098761540637e-06, + "loss": 0.2926, + "step": 9607 + }, + { + "epoch": 0.76, + "learning_rate": 2.844617078797155e-06, + "loss": 0.3671, + "step": 9608 + }, + { + "epoch": 0.76, + "learning_rate": 2.842824752587783e-06, + "loss": 0.3044, + "step": 9609 + }, + { + "epoch": 0.76, + "learning_rate": 2.8410328976439595e-06, + "loss": 0.3466, + "step": 9610 + }, + { + "epoch": 0.76, + "learning_rate": 2.839241514083676e-06, + "loss": 0.5594, + "step": 9611 + }, + { + "epoch": 0.76, + "learning_rate": 2.837450602024884e-06, + "loss": 0.3791, + "step": 9612 + }, + { + "epoch": 0.76, + "learning_rate": 2.8356601615855027e-06, + "loss": 0.2811, + "step": 9613 + }, + { + "epoch": 0.76, + "learning_rate": 2.83387019288343e-06, + "loss": 0.277, + "step": 9614 + }, + { + "epoch": 0.76, + "learning_rate": 2.8320806960365234e-06, + "loss": 0.374, + "step": 9615 + }, + { + "epoch": 0.76, + "learning_rate": 2.8302916711626106e-06, + "loss": 0.188, + "step": 9616 + }, + { + "epoch": 0.76, + "learning_rate": 2.8285031183794955e-06, + "loss": 0.4342, + "step": 9617 + }, + { + "epoch": 0.76, + "learning_rate": 2.8267150378049437e-06, + "loss": 0.3741, + "step": 9618 + }, + { + "epoch": 0.76, + "learning_rate": 2.8249274295566863e-06, + "loss": 0.3748, + "step": 9619 + }, + { + "epoch": 0.76, + "learning_rate": 2.823140293752441e-06, + "loss": 0.3559, + "step": 9620 + }, + { + "epoch": 0.76, + "learning_rate": 2.821353630509871e-06, + "loss": 0.4461, + "step": 9621 + }, + { + "epoch": 0.76, + "learning_rate": 2.819567439946621e-06, + "loss": 0.2963, + "step": 9622 + }, + { + "epoch": 0.76, + "learning_rate": 2.8177817221803074e-06, + "loss": 0.3681, + "step": 9623 + }, + { + "epoch": 0.76, + "learning_rate": 2.8159964773285074e-06, + "loss": 0.3183, + "step": 9624 + }, + { + "epoch": 0.76, + "learning_rate": 2.8142117055087704e-06, + "loss": 0.2605, + "step": 9625 + }, + { + "epoch": 0.76, + "learning_rate": 2.8124274068386203e-06, + "loss": 0.3648, + "step": 9626 + }, + { + "epoch": 0.76, + "learning_rate": 2.8106435814355404e-06, + "loss": 0.4149, + "step": 9627 + }, + { + "epoch": 0.76, + "learning_rate": 2.808860229416984e-06, + "loss": 0.3277, + "step": 9628 + }, + { + "epoch": 0.76, + "learning_rate": 2.8070773509003846e-06, + "loss": 0.3432, + "step": 9629 + }, + { + "epoch": 0.76, + "learning_rate": 2.80529494600313e-06, + "loss": 0.3806, + "step": 9630 + }, + { + "epoch": 0.76, + "learning_rate": 2.8035130148425847e-06, + "loss": 0.2582, + "step": 9631 + }, + { + "epoch": 0.76, + "learning_rate": 2.801731557536078e-06, + "loss": 0.3462, + "step": 9632 + }, + { + "epoch": 0.76, + "learning_rate": 2.799950574200915e-06, + "loss": 0.3296, + "step": 9633 + }, + { + "epoch": 0.76, + "learning_rate": 2.7981700649543618e-06, + "loss": 0.3542, + "step": 9634 + }, + { + "epoch": 0.76, + "learning_rate": 2.796390029913655e-06, + "loss": 0.2958, + "step": 9635 + }, + { + "epoch": 0.76, + "learning_rate": 2.794610469196004e-06, + "loss": 0.363, + "step": 9636 + }, + { + "epoch": 0.76, + "learning_rate": 2.792831382918585e-06, + "loss": 0.4462, + "step": 9637 + }, + { + "epoch": 0.76, + "learning_rate": 2.791052771198538e-06, + "loss": 0.2444, + "step": 9638 + }, + { + "epoch": 0.76, + "learning_rate": 2.7892746341529807e-06, + "loss": 0.3943, + "step": 9639 + }, + { + "epoch": 0.76, + "learning_rate": 2.7874969718989943e-06, + "loss": 0.272, + "step": 9640 + }, + { + "epoch": 0.76, + "learning_rate": 2.785719784553624e-06, + "loss": 0.3173, + "step": 9641 + }, + { + "epoch": 0.76, + "learning_rate": 2.7839430722338956e-06, + "loss": 0.2876, + "step": 9642 + }, + { + "epoch": 0.76, + "learning_rate": 2.7821668350567956e-06, + "loss": 0.3691, + "step": 9643 + }, + { + "epoch": 0.76, + "learning_rate": 2.7803910731392757e-06, + "loss": 0.3849, + "step": 9644 + }, + { + "epoch": 0.76, + "learning_rate": 2.778615786598269e-06, + "loss": 0.2583, + "step": 9645 + }, + { + "epoch": 0.76, + "learning_rate": 2.776840975550664e-06, + "loss": 0.3846, + "step": 9646 + }, + { + "epoch": 0.76, + "learning_rate": 2.7750666401133263e-06, + "loss": 0.3168, + "step": 9647 + }, + { + "epoch": 0.76, + "learning_rate": 2.773292780403083e-06, + "loss": 0.2704, + "step": 9648 + }, + { + "epoch": 0.76, + "learning_rate": 2.7715193965367403e-06, + "loss": 0.3041, + "step": 9649 + }, + { + "epoch": 0.76, + "learning_rate": 2.769746488631064e-06, + "loss": 0.3292, + "step": 9650 + }, + { + "epoch": 0.76, + "learning_rate": 2.767974056802789e-06, + "loss": 0.3373, + "step": 9651 + }, + { + "epoch": 0.76, + "learning_rate": 2.766202101168628e-06, + "loss": 0.2957, + "step": 9652 + }, + { + "epoch": 0.76, + "learning_rate": 2.76443062184525e-06, + "loss": 0.2792, + "step": 9653 + }, + { + "epoch": 0.76, + "learning_rate": 2.7626596189492983e-06, + "loss": 0.3977, + "step": 9654 + }, + { + "epoch": 0.76, + "learning_rate": 2.76088909259739e-06, + "loss": 0.2594, + "step": 9655 + }, + { + "epoch": 0.76, + "learning_rate": 2.7591190429061023e-06, + "loss": 0.342, + "step": 9656 + }, + { + "epoch": 0.77, + "learning_rate": 2.757349469991981e-06, + "loss": 0.3592, + "step": 9657 + }, + { + "epoch": 0.77, + "learning_rate": 2.7555803739715512e-06, + "loss": 0.2572, + "step": 9658 + }, + { + "epoch": 0.77, + "learning_rate": 2.7538117549612963e-06, + "loss": 0.2865, + "step": 9659 + }, + { + "epoch": 0.77, + "learning_rate": 2.752043613077667e-06, + "loss": 0.3857, + "step": 9660 + }, + { + "epoch": 0.77, + "learning_rate": 2.7502759484370946e-06, + "loss": 0.3821, + "step": 9661 + }, + { + "epoch": 0.77, + "learning_rate": 2.748508761155967e-06, + "loss": 0.3549, + "step": 9662 + }, + { + "epoch": 0.77, + "learning_rate": 2.746742051350646e-06, + "loss": 0.3801, + "step": 9663 + }, + { + "epoch": 0.77, + "learning_rate": 2.7449758191374574e-06, + "loss": 0.3993, + "step": 9664 + }, + { + "epoch": 0.77, + "learning_rate": 2.7432100646327043e-06, + "loss": 0.2516, + "step": 9665 + }, + { + "epoch": 0.77, + "learning_rate": 2.7414447879526517e-06, + "loss": 0.3115, + "step": 9666 + }, + { + "epoch": 0.77, + "learning_rate": 2.739679989213532e-06, + "loss": 0.4341, + "step": 9667 + }, + { + "epoch": 0.77, + "learning_rate": 2.7379156685315523e-06, + "loss": 0.2652, + "step": 9668 + }, + { + "epoch": 0.77, + "learning_rate": 2.7361518260228827e-06, + "loss": 0.3183, + "step": 9669 + }, + { + "epoch": 0.77, + "learning_rate": 2.734388461803661e-06, + "loss": 0.3074, + "step": 9670 + }, + { + "epoch": 0.77, + "learning_rate": 2.7326255759900024e-06, + "loss": 0.3819, + "step": 9671 + }, + { + "epoch": 0.77, + "learning_rate": 2.7308631686979816e-06, + "loss": 0.3418, + "step": 9672 + }, + { + "epoch": 0.77, + "learning_rate": 2.7291012400436414e-06, + "loss": 0.3323, + "step": 9673 + }, + { + "epoch": 0.77, + "learning_rate": 2.7273397901430023e-06, + "loss": 0.2969, + "step": 9674 + }, + { + "epoch": 0.77, + "learning_rate": 2.7255788191120435e-06, + "loss": 0.4505, + "step": 9675 + }, + { + "epoch": 0.77, + "learning_rate": 2.723818327066717e-06, + "loss": 0.4766, + "step": 9676 + }, + { + "epoch": 0.77, + "learning_rate": 2.722058314122941e-06, + "loss": 0.3496, + "step": 9677 + }, + { + "epoch": 0.77, + "learning_rate": 2.7202987803966073e-06, + "loss": 0.4452, + "step": 9678 + }, + { + "epoch": 0.77, + "learning_rate": 2.718539726003573e-06, + "loss": 0.3426, + "step": 9679 + }, + { + "epoch": 0.77, + "learning_rate": 2.7167811510596577e-06, + "loss": 0.3433, + "step": 9680 + }, + { + "epoch": 0.77, + "learning_rate": 2.715023055680661e-06, + "loss": 0.4033, + "step": 9681 + }, + { + "epoch": 0.77, + "learning_rate": 2.7132654399823444e-06, + "loss": 0.3261, + "step": 9682 + }, + { + "epoch": 0.77, + "learning_rate": 2.7115083040804337e-06, + "loss": 0.3434, + "step": 9683 + }, + { + "epoch": 0.77, + "learning_rate": 2.709751648090634e-06, + "loss": 0.3639, + "step": 9684 + }, + { + "epoch": 0.77, + "learning_rate": 2.7079954721286108e-06, + "loss": 0.3482, + "step": 9685 + }, + { + "epoch": 0.77, + "learning_rate": 2.7062397763099945e-06, + "loss": 0.3512, + "step": 9686 + }, + { + "epoch": 0.77, + "learning_rate": 2.7044845607503967e-06, + "loss": 0.2915, + "step": 9687 + }, + { + "epoch": 0.77, + "learning_rate": 2.7027298255653878e-06, + "loss": 0.4245, + "step": 9688 + }, + { + "epoch": 0.77, + "learning_rate": 2.700975570870503e-06, + "loss": 0.3227, + "step": 9689 + }, + { + "epoch": 0.77, + "learning_rate": 2.6992217967812606e-06, + "loss": 0.3209, + "step": 9690 + }, + { + "epoch": 0.77, + "learning_rate": 2.697468503413134e-06, + "loss": 0.3623, + "step": 9691 + }, + { + "epoch": 0.77, + "learning_rate": 2.6957156908815684e-06, + "loss": 0.4157, + "step": 9692 + }, + { + "epoch": 0.77, + "learning_rate": 2.6939633593019754e-06, + "loss": 0.3762, + "step": 9693 + }, + { + "epoch": 0.77, + "learning_rate": 2.692211508789744e-06, + "loss": 0.3878, + "step": 9694 + }, + { + "epoch": 0.77, + "learning_rate": 2.6904601394602216e-06, + "loss": 0.2681, + "step": 9695 + }, + { + "epoch": 0.77, + "learning_rate": 2.688709251428725e-06, + "loss": 0.3952, + "step": 9696 + }, + { + "epoch": 0.77, + "learning_rate": 2.6869588448105475e-06, + "loss": 0.3707, + "step": 9697 + }, + { + "epoch": 0.77, + "learning_rate": 2.685208919720942e-06, + "loss": 0.3045, + "step": 9698 + }, + { + "epoch": 0.77, + "learning_rate": 2.683459476275133e-06, + "loss": 0.3631, + "step": 9699 + }, + { + "epoch": 0.77, + "learning_rate": 2.6817105145883117e-06, + "loss": 0.3454, + "step": 9700 + }, + { + "epoch": 0.77, + "learning_rate": 2.6799620347756407e-06, + "loss": 0.3646, + "step": 9701 + }, + { + "epoch": 0.77, + "learning_rate": 2.6782140369522435e-06, + "loss": 0.4212, + "step": 9702 + }, + { + "epoch": 0.77, + "learning_rate": 2.676466521233225e-06, + "loss": 0.3333, + "step": 9703 + }, + { + "epoch": 0.77, + "learning_rate": 2.674719487733649e-06, + "loss": 0.398, + "step": 9704 + }, + { + "epoch": 0.77, + "learning_rate": 2.672972936568543e-06, + "loss": 0.3809, + "step": 9705 + }, + { + "epoch": 0.77, + "learning_rate": 2.6712268678529187e-06, + "loss": 0.4477, + "step": 9706 + }, + { + "epoch": 0.77, + "learning_rate": 2.669481281701739e-06, + "loss": 0.393, + "step": 9707 + }, + { + "epoch": 0.77, + "learning_rate": 2.6677361782299437e-06, + "loss": 0.3458, + "step": 9708 + }, + { + "epoch": 0.77, + "learning_rate": 2.665991557552442e-06, + "loss": 0.2674, + "step": 9709 + }, + { + "epoch": 0.77, + "learning_rate": 2.6642474197841086e-06, + "loss": 0.413, + "step": 9710 + }, + { + "epoch": 0.77, + "learning_rate": 2.6625037650397812e-06, + "loss": 0.3643, + "step": 9711 + }, + { + "epoch": 0.77, + "learning_rate": 2.6607605934342785e-06, + "loss": 0.3827, + "step": 9712 + }, + { + "epoch": 0.77, + "learning_rate": 2.659017905082376e-06, + "loss": 0.4144, + "step": 9713 + }, + { + "epoch": 0.77, + "learning_rate": 2.657275700098819e-06, + "loss": 0.3094, + "step": 9714 + }, + { + "epoch": 0.77, + "learning_rate": 2.65553397859833e-06, + "loss": 0.3508, + "step": 9715 + }, + { + "epoch": 0.77, + "learning_rate": 2.6537927406955888e-06, + "loss": 0.363, + "step": 9716 + }, + { + "epoch": 0.77, + "learning_rate": 2.6520519865052476e-06, + "loss": 0.2584, + "step": 9717 + }, + { + "epoch": 0.77, + "learning_rate": 2.6503117161419246e-06, + "loss": 0.3972, + "step": 9718 + }, + { + "epoch": 0.77, + "learning_rate": 2.6485719297202127e-06, + "loss": 0.2282, + "step": 9719 + }, + { + "epoch": 0.77, + "learning_rate": 2.646832627354667e-06, + "loss": 0.387, + "step": 9720 + }, + { + "epoch": 0.77, + "learning_rate": 2.645093809159809e-06, + "loss": 0.3002, + "step": 9721 + }, + { + "epoch": 0.77, + "learning_rate": 2.643355475250137e-06, + "loss": 0.4303, + "step": 9722 + }, + { + "epoch": 0.77, + "learning_rate": 2.6416176257401083e-06, + "loss": 0.3712, + "step": 9723 + }, + { + "epoch": 0.77, + "learning_rate": 2.639880260744151e-06, + "loss": 0.3011, + "step": 9724 + }, + { + "epoch": 0.77, + "learning_rate": 2.6381433803766654e-06, + "loss": 0.4551, + "step": 9725 + }, + { + "epoch": 0.77, + "learning_rate": 2.6364069847520155e-06, + "loss": 0.3271, + "step": 9726 + }, + { + "epoch": 0.77, + "learning_rate": 2.6346710739845317e-06, + "loss": 0.2818, + "step": 9727 + }, + { + "epoch": 0.77, + "learning_rate": 2.6329356481885215e-06, + "loss": 0.2699, + "step": 9728 + }, + { + "epoch": 0.77, + "learning_rate": 2.6312007074782497e-06, + "loss": 0.2777, + "step": 9729 + }, + { + "epoch": 0.77, + "learning_rate": 2.6294662519679525e-06, + "loss": 0.4429, + "step": 9730 + }, + { + "epoch": 0.77, + "learning_rate": 2.627732281771841e-06, + "loss": 0.284, + "step": 9731 + }, + { + "epoch": 0.77, + "learning_rate": 2.6259987970040858e-06, + "loss": 0.2714, + "step": 9732 + }, + { + "epoch": 0.77, + "learning_rate": 2.6242657977788277e-06, + "loss": 0.3068, + "step": 9733 + }, + { + "epoch": 0.77, + "learning_rate": 2.6225332842101746e-06, + "loss": 0.3265, + "step": 9734 + }, + { + "epoch": 0.77, + "learning_rate": 2.6208012564122097e-06, + "loss": 0.3525, + "step": 9735 + }, + { + "epoch": 0.77, + "learning_rate": 2.6190697144989753e-06, + "loss": 0.3789, + "step": 9736 + }, + { + "epoch": 0.77, + "learning_rate": 2.617338658584483e-06, + "loss": 0.406, + "step": 9737 + }, + { + "epoch": 0.77, + "learning_rate": 2.6156080887827183e-06, + "loss": 0.2724, + "step": 9738 + }, + { + "epoch": 0.77, + "learning_rate": 2.613878005207631e-06, + "loss": 0.3339, + "step": 9739 + }, + { + "epoch": 0.77, + "learning_rate": 2.612148407973134e-06, + "loss": 0.2042, + "step": 9740 + }, + { + "epoch": 0.77, + "learning_rate": 2.6104192971931197e-06, + "loss": 0.341, + "step": 9741 + }, + { + "epoch": 0.77, + "learning_rate": 2.6086906729814378e-06, + "loss": 0.4029, + "step": 9742 + }, + { + "epoch": 0.77, + "learning_rate": 2.606962535451907e-06, + "loss": 0.295, + "step": 9743 + }, + { + "epoch": 0.77, + "learning_rate": 2.605234884718324e-06, + "loss": 0.2956, + "step": 9744 + }, + { + "epoch": 0.77, + "learning_rate": 2.6035077208944416e-06, + "loss": 0.4066, + "step": 9745 + }, + { + "epoch": 0.77, + "learning_rate": 2.601781044093984e-06, + "loss": 0.3812, + "step": 9746 + }, + { + "epoch": 0.77, + "learning_rate": 2.600054854430649e-06, + "loss": 0.3465, + "step": 9747 + }, + { + "epoch": 0.77, + "learning_rate": 2.5983291520180965e-06, + "loss": 0.3366, + "step": 9748 + }, + { + "epoch": 0.77, + "learning_rate": 2.5966039369699537e-06, + "loss": 0.3645, + "step": 9749 + }, + { + "epoch": 0.77, + "learning_rate": 2.5948792093998167e-06, + "loss": 0.4079, + "step": 9750 + }, + { + "epoch": 0.77, + "learning_rate": 2.5931549694212545e-06, + "loss": 0.4068, + "step": 9751 + }, + { + "epoch": 0.77, + "learning_rate": 2.5914312171477983e-06, + "loss": 0.4143, + "step": 9752 + }, + { + "epoch": 0.77, + "learning_rate": 2.589707952692947e-06, + "loss": 0.2833, + "step": 9753 + }, + { + "epoch": 0.77, + "learning_rate": 2.5879851761701724e-06, + "loss": 0.3273, + "step": 9754 + }, + { + "epoch": 0.77, + "learning_rate": 2.586262887692911e-06, + "loss": 0.2565, + "step": 9755 + }, + { + "epoch": 0.77, + "learning_rate": 2.5845410873745614e-06, + "loss": 0.398, + "step": 9756 + }, + { + "epoch": 0.77, + "learning_rate": 2.5828197753285043e-06, + "loss": 0.4203, + "step": 9757 + }, + { + "epoch": 0.77, + "learning_rate": 2.581098951668075e-06, + "loss": 0.308, + "step": 9758 + }, + { + "epoch": 0.77, + "learning_rate": 2.5793786165065805e-06, + "loss": 0.2743, + "step": 9759 + }, + { + "epoch": 0.77, + "learning_rate": 2.5776587699573007e-06, + "loss": 0.3655, + "step": 9760 + }, + { + "epoch": 0.77, + "learning_rate": 2.5759394121334767e-06, + "loss": 0.2966, + "step": 9761 + }, + { + "epoch": 0.77, + "learning_rate": 2.57422054314832e-06, + "loss": 0.3354, + "step": 9762 + }, + { + "epoch": 0.77, + "learning_rate": 2.572502163115007e-06, + "loss": 0.2957, + "step": 9763 + }, + { + "epoch": 0.77, + "learning_rate": 2.5707842721466914e-06, + "loss": 0.4191, + "step": 9764 + }, + { + "epoch": 0.77, + "learning_rate": 2.5690668703564835e-06, + "loss": 0.3676, + "step": 9765 + }, + { + "epoch": 0.77, + "learning_rate": 2.5673499578574644e-06, + "loss": 0.3114, + "step": 9766 + }, + { + "epoch": 0.77, + "learning_rate": 2.565633534762689e-06, + "loss": 0.3624, + "step": 9767 + }, + { + "epoch": 0.77, + "learning_rate": 2.5639176011851753e-06, + "loss": 0.3915, + "step": 9768 + }, + { + "epoch": 0.77, + "learning_rate": 2.562202157237903e-06, + "loss": 0.3877, + "step": 9769 + }, + { + "epoch": 0.77, + "learning_rate": 2.5604872030338336e-06, + "loss": 0.3067, + "step": 9770 + }, + { + "epoch": 0.77, + "learning_rate": 2.5587727386858853e-06, + "loss": 0.3364, + "step": 9771 + }, + { + "epoch": 0.77, + "learning_rate": 2.5570587643069435e-06, + "loss": 0.338, + "step": 9772 + }, + { + "epoch": 0.77, + "learning_rate": 2.555345280009872e-06, + "loss": 0.3951, + "step": 9773 + }, + { + "epoch": 0.77, + "learning_rate": 2.5536322859074934e-06, + "loss": 0.3601, + "step": 9774 + }, + { + "epoch": 0.77, + "learning_rate": 2.551919782112596e-06, + "loss": 0.4162, + "step": 9775 + }, + { + "epoch": 0.77, + "learning_rate": 2.550207768737949e-06, + "loss": 0.3614, + "step": 9776 + }, + { + "epoch": 0.77, + "learning_rate": 2.54849624589627e-06, + "loss": 0.3412, + "step": 9777 + }, + { + "epoch": 0.77, + "learning_rate": 2.546785213700258e-06, + "loss": 0.2334, + "step": 9778 + }, + { + "epoch": 0.77, + "learning_rate": 2.5450746722625785e-06, + "loss": 0.2637, + "step": 9779 + }, + { + "epoch": 0.77, + "learning_rate": 2.5433646216958617e-06, + "loss": 0.3728, + "step": 9780 + }, + { + "epoch": 0.77, + "learning_rate": 2.5416550621127024e-06, + "loss": 0.2998, + "step": 9781 + }, + { + "epoch": 0.77, + "learning_rate": 2.539945993625673e-06, + "loss": 0.3408, + "step": 9782 + }, + { + "epoch": 0.78, + "learning_rate": 2.5382374163473046e-06, + "loss": 0.3198, + "step": 9783 + }, + { + "epoch": 0.78, + "learning_rate": 2.536529330390095e-06, + "loss": 0.2911, + "step": 9784 + }, + { + "epoch": 0.78, + "learning_rate": 2.5348217358665207e-06, + "loss": 0.2734, + "step": 9785 + }, + { + "epoch": 0.78, + "learning_rate": 2.5331146328890145e-06, + "loss": 0.3271, + "step": 9786 + }, + { + "epoch": 0.78, + "learning_rate": 2.5314080215699822e-06, + "loss": 0.3924, + "step": 9787 + }, + { + "epoch": 0.78, + "learning_rate": 2.5297019020217904e-06, + "loss": 0.4303, + "step": 9788 + }, + { + "epoch": 0.78, + "learning_rate": 2.5279962743567877e-06, + "loss": 0.3441, + "step": 9789 + }, + { + "epoch": 0.78, + "learning_rate": 2.526291138687278e-06, + "loss": 0.311, + "step": 9790 + }, + { + "epoch": 0.78, + "learning_rate": 2.5245864951255317e-06, + "loss": 0.4471, + "step": 9791 + }, + { + "epoch": 0.78, + "learning_rate": 2.522882343783799e-06, + "loss": 0.3857, + "step": 9792 + }, + { + "epoch": 0.78, + "learning_rate": 2.521178684774286e-06, + "loss": 0.2796, + "step": 9793 + }, + { + "epoch": 0.78, + "learning_rate": 2.519475518209167e-06, + "loss": 0.4918, + "step": 9794 + }, + { + "epoch": 0.78, + "learning_rate": 2.5177728442005956e-06, + "loss": 0.3618, + "step": 9795 + }, + { + "epoch": 0.78, + "learning_rate": 2.516070662860679e-06, + "loss": 0.3793, + "step": 9796 + }, + { + "epoch": 0.78, + "learning_rate": 2.5143689743014966e-06, + "loss": 0.3547, + "step": 9797 + }, + { + "epoch": 0.78, + "learning_rate": 2.5126677786351005e-06, + "loss": 0.3634, + "step": 9798 + }, + { + "epoch": 0.78, + "learning_rate": 2.5109670759735063e-06, + "loss": 0.326, + "step": 9799 + }, + { + "epoch": 0.78, + "learning_rate": 2.509266866428691e-06, + "loss": 0.3278, + "step": 9800 + }, + { + "epoch": 0.78, + "learning_rate": 2.507567150112613e-06, + "loss": 0.3014, + "step": 9801 + }, + { + "epoch": 0.78, + "learning_rate": 2.5058679271371865e-06, + "loss": 0.3474, + "step": 9802 + }, + { + "epoch": 0.78, + "learning_rate": 2.504169197614298e-06, + "loss": 0.2583, + "step": 9803 + }, + { + "epoch": 0.78, + "learning_rate": 2.5024709616557964e-06, + "loss": 0.2861, + "step": 9804 + }, + { + "epoch": 0.78, + "learning_rate": 2.500773219373509e-06, + "loss": 0.3585, + "step": 9805 + }, + { + "epoch": 0.78, + "learning_rate": 2.499075970879222e-06, + "loss": 0.323, + "step": 9806 + }, + { + "epoch": 0.78, + "learning_rate": 2.4973792162846878e-06, + "loss": 0.2918, + "step": 9807 + }, + { + "epoch": 0.78, + "learning_rate": 2.4956829557016336e-06, + "loss": 0.4011, + "step": 9808 + }, + { + "epoch": 0.78, + "learning_rate": 2.493987189241749e-06, + "loss": 0.2676, + "step": 9809 + }, + { + "epoch": 0.78, + "learning_rate": 2.4922919170166883e-06, + "loss": 0.3959, + "step": 9810 + }, + { + "epoch": 0.78, + "learning_rate": 2.4905971391380823e-06, + "loss": 0.379, + "step": 9811 + }, + { + "epoch": 0.78, + "learning_rate": 2.488902855717522e-06, + "loss": 0.3863, + "step": 9812 + }, + { + "epoch": 0.78, + "learning_rate": 2.487209066866565e-06, + "loss": 0.3613, + "step": 9813 + }, + { + "epoch": 0.78, + "learning_rate": 2.485515772696745e-06, + "loss": 0.3971, + "step": 9814 + }, + { + "epoch": 0.78, + "learning_rate": 2.483822973319553e-06, + "loss": 0.4358, + "step": 9815 + }, + { + "epoch": 0.78, + "learning_rate": 2.482130668846451e-06, + "loss": 0.4422, + "step": 9816 + }, + { + "epoch": 0.78, + "learning_rate": 2.480438859388873e-06, + "loss": 0.367, + "step": 9817 + }, + { + "epoch": 0.78, + "learning_rate": 2.4787475450582133e-06, + "loss": 0.2668, + "step": 9818 + }, + { + "epoch": 0.78, + "learning_rate": 2.4770567259658386e-06, + "loss": 0.3116, + "step": 9819 + }, + { + "epoch": 0.78, + "learning_rate": 2.4753664022230783e-06, + "loss": 0.3405, + "step": 9820 + }, + { + "epoch": 0.78, + "learning_rate": 2.473676573941236e-06, + "loss": 0.2761, + "step": 9821 + }, + { + "epoch": 0.78, + "learning_rate": 2.471987241231577e-06, + "loss": 0.3265, + "step": 9822 + }, + { + "epoch": 0.78, + "learning_rate": 2.4702984042053335e-06, + "loss": 0.3158, + "step": 9823 + }, + { + "epoch": 0.78, + "learning_rate": 2.468610062973712e-06, + "loss": 0.347, + "step": 9824 + }, + { + "epoch": 0.78, + "learning_rate": 2.466922217647879e-06, + "loss": 0.3283, + "step": 9825 + }, + { + "epoch": 0.78, + "learning_rate": 2.465234868338968e-06, + "loss": 0.3798, + "step": 9826 + }, + { + "epoch": 0.78, + "learning_rate": 2.4635480151580902e-06, + "loss": 0.3229, + "step": 9827 + }, + { + "epoch": 0.78, + "learning_rate": 2.461861658216311e-06, + "loss": 0.322, + "step": 9828 + }, + { + "epoch": 0.78, + "learning_rate": 2.4601757976246685e-06, + "loss": 0.3145, + "step": 9829 + }, + { + "epoch": 0.78, + "learning_rate": 2.4584904334941728e-06, + "loss": 0.2365, + "step": 9830 + }, + { + "epoch": 0.78, + "learning_rate": 2.456805565935795e-06, + "loss": 0.319, + "step": 9831 + }, + { + "epoch": 0.78, + "learning_rate": 2.4551211950604713e-06, + "loss": 0.3026, + "step": 9832 + }, + { + "epoch": 0.78, + "learning_rate": 2.4534373209791162e-06, + "loss": 0.3184, + "step": 9833 + }, + { + "epoch": 0.78, + "learning_rate": 2.451753943802603e-06, + "loss": 0.3609, + "step": 9834 + }, + { + "epoch": 0.78, + "learning_rate": 2.4500710636417725e-06, + "loss": 0.3415, + "step": 9835 + }, + { + "epoch": 0.78, + "learning_rate": 2.4483886806074308e-06, + "loss": 0.2545, + "step": 9836 + }, + { + "epoch": 0.78, + "learning_rate": 2.4467067948103616e-06, + "loss": 0.3473, + "step": 9837 + }, + { + "epoch": 0.78, + "learning_rate": 2.4450254063613056e-06, + "loss": 0.4582, + "step": 9838 + }, + { + "epoch": 0.78, + "learning_rate": 2.4433445153709722e-06, + "loss": 0.2695, + "step": 9839 + }, + { + "epoch": 0.78, + "learning_rate": 2.441664121950045e-06, + "loss": 0.3573, + "step": 9840 + }, + { + "epoch": 0.78, + "learning_rate": 2.439984226209167e-06, + "loss": 0.3794, + "step": 9841 + }, + { + "epoch": 0.78, + "learning_rate": 2.438304828258947e-06, + "loss": 0.3307, + "step": 9842 + }, + { + "epoch": 0.78, + "learning_rate": 2.4366259282099737e-06, + "loss": 0.3456, + "step": 9843 + }, + { + "epoch": 0.78, + "learning_rate": 2.4349475261727905e-06, + "loss": 0.3142, + "step": 9844 + }, + { + "epoch": 0.78, + "learning_rate": 2.4332696222579078e-06, + "loss": 0.4236, + "step": 9845 + }, + { + "epoch": 0.78, + "learning_rate": 2.4315922165758154e-06, + "loss": 0.3995, + "step": 9846 + }, + { + "epoch": 0.78, + "learning_rate": 2.4299153092369598e-06, + "loss": 0.2543, + "step": 9847 + }, + { + "epoch": 0.78, + "learning_rate": 2.428238900351755e-06, + "loss": 0.3027, + "step": 9848 + }, + { + "epoch": 0.78, + "learning_rate": 2.426562990030582e-06, + "loss": 0.3231, + "step": 9849 + }, + { + "epoch": 0.78, + "learning_rate": 2.424887578383799e-06, + "loss": 0.3664, + "step": 9850 + }, + { + "epoch": 0.78, + "learning_rate": 2.4232126655217202e-06, + "loss": 0.3568, + "step": 9851 + }, + { + "epoch": 0.78, + "learning_rate": 2.421538251554627e-06, + "loss": 0.3163, + "step": 9852 + }, + { + "epoch": 0.78, + "learning_rate": 2.4198643365927767e-06, + "loss": 0.3671, + "step": 9853 + }, + { + "epoch": 0.78, + "learning_rate": 2.4181909207463873e-06, + "loss": 0.2517, + "step": 9854 + }, + { + "epoch": 0.78, + "learning_rate": 2.4165180041256444e-06, + "loss": 0.3625, + "step": 9855 + }, + { + "epoch": 0.78, + "learning_rate": 2.4148455868407015e-06, + "loss": 0.2944, + "step": 9856 + }, + { + "epoch": 0.78, + "learning_rate": 2.413173669001676e-06, + "loss": 0.3154, + "step": 9857 + }, + { + "epoch": 0.78, + "learning_rate": 2.4115022507186626e-06, + "loss": 0.3391, + "step": 9858 + }, + { + "epoch": 0.78, + "learning_rate": 2.409831332101712e-06, + "loss": 0.3382, + "step": 9859 + }, + { + "epoch": 0.78, + "learning_rate": 2.4081609132608464e-06, + "loss": 0.3341, + "step": 9860 + }, + { + "epoch": 0.78, + "learning_rate": 2.406490994306052e-06, + "loss": 0.431, + "step": 9861 + }, + { + "epoch": 0.78, + "learning_rate": 2.4048215753472914e-06, + "loss": 0.2769, + "step": 9862 + }, + { + "epoch": 0.78, + "learning_rate": 2.403152656494485e-06, + "loss": 0.2991, + "step": 9863 + }, + { + "epoch": 0.78, + "learning_rate": 2.401484237857519e-06, + "loss": 0.3947, + "step": 9864 + }, + { + "epoch": 0.78, + "learning_rate": 2.3998163195462565e-06, + "loss": 0.2904, + "step": 9865 + }, + { + "epoch": 0.78, + "learning_rate": 2.398148901670521e-06, + "loss": 0.3454, + "step": 9866 + }, + { + "epoch": 0.78, + "learning_rate": 2.396481984340098e-06, + "loss": 0.3356, + "step": 9867 + }, + { + "epoch": 0.78, + "learning_rate": 2.3948155676647546e-06, + "loss": 0.2797, + "step": 9868 + }, + { + "epoch": 0.78, + "learning_rate": 2.393149651754212e-06, + "loss": 0.3304, + "step": 9869 + }, + { + "epoch": 0.78, + "learning_rate": 2.391484236718159e-06, + "loss": 0.3292, + "step": 9870 + }, + { + "epoch": 0.78, + "learning_rate": 2.389819322666264e-06, + "loss": 0.3205, + "step": 9871 + }, + { + "epoch": 0.78, + "learning_rate": 2.3881549097081467e-06, + "loss": 0.3408, + "step": 9872 + }, + { + "epoch": 0.78, + "learning_rate": 2.3864909979534044e-06, + "loss": 0.3045, + "step": 9873 + }, + { + "epoch": 0.78, + "learning_rate": 2.3848275875115925e-06, + "loss": 0.3226, + "step": 9874 + }, + { + "epoch": 0.78, + "learning_rate": 2.3831646784922446e-06, + "loss": 0.3057, + "step": 9875 + }, + { + "epoch": 0.78, + "learning_rate": 2.381502271004853e-06, + "loss": 0.3903, + "step": 9876 + }, + { + "epoch": 0.78, + "learning_rate": 2.3798403651588765e-06, + "loss": 0.4421, + "step": 9877 + }, + { + "epoch": 0.78, + "learning_rate": 2.3781789610637483e-06, + "loss": 0.3866, + "step": 9878 + }, + { + "epoch": 0.78, + "learning_rate": 2.376518058828863e-06, + "loss": 0.3601, + "step": 9879 + }, + { + "epoch": 0.78, + "learning_rate": 2.3748576585635774e-06, + "loss": 0.3585, + "step": 9880 + }, + { + "epoch": 0.78, + "learning_rate": 2.373197760377228e-06, + "loss": 0.3131, + "step": 9881 + }, + { + "epoch": 0.78, + "learning_rate": 2.371538364379109e-06, + "loss": 0.3786, + "step": 9882 + }, + { + "epoch": 0.78, + "learning_rate": 2.36987947067848e-06, + "loss": 0.3263, + "step": 9883 + }, + { + "epoch": 0.78, + "learning_rate": 2.368221079384577e-06, + "loss": 0.2745, + "step": 9884 + }, + { + "epoch": 0.78, + "learning_rate": 2.3665631906065933e-06, + "loss": 0.3062, + "step": 9885 + }, + { + "epoch": 0.78, + "learning_rate": 2.364905804453692e-06, + "loss": 0.2647, + "step": 9886 + }, + { + "epoch": 0.78, + "learning_rate": 2.3632489210350074e-06, + "loss": 0.3337, + "step": 9887 + }, + { + "epoch": 0.78, + "learning_rate": 2.361592540459636e-06, + "loss": 0.2479, + "step": 9888 + }, + { + "epoch": 0.78, + "learning_rate": 2.3599366628366427e-06, + "loss": 0.3579, + "step": 9889 + }, + { + "epoch": 0.78, + "learning_rate": 2.358281288275055e-06, + "loss": 0.4295, + "step": 9890 + }, + { + "epoch": 0.78, + "learning_rate": 2.356626416883878e-06, + "loss": 0.318, + "step": 9891 + }, + { + "epoch": 0.78, + "learning_rate": 2.354972048772074e-06, + "loss": 0.2762, + "step": 9892 + }, + { + "epoch": 0.78, + "learning_rate": 2.353318184048573e-06, + "loss": 0.2341, + "step": 9893 + }, + { + "epoch": 0.78, + "learning_rate": 2.351664822822277e-06, + "loss": 0.289, + "step": 9894 + }, + { + "epoch": 0.78, + "learning_rate": 2.3500119652020526e-06, + "loss": 0.3646, + "step": 9895 + }, + { + "epoch": 0.78, + "learning_rate": 2.348359611296728e-06, + "loss": 0.3734, + "step": 9896 + }, + { + "epoch": 0.78, + "learning_rate": 2.346707761215108e-06, + "loss": 0.3224, + "step": 9897 + }, + { + "epoch": 0.78, + "learning_rate": 2.345056415065956e-06, + "loss": 0.3393, + "step": 9898 + }, + { + "epoch": 0.78, + "learning_rate": 2.343405572958004e-06, + "loss": 0.3823, + "step": 9899 + }, + { + "epoch": 0.78, + "learning_rate": 2.341755234999956e-06, + "loss": 0.3659, + "step": 9900 + }, + { + "epoch": 0.78, + "learning_rate": 2.3401054013004776e-06, + "loss": 0.3692, + "step": 9901 + }, + { + "epoch": 0.78, + "learning_rate": 2.338456071968198e-06, + "loss": 0.4248, + "step": 9902 + }, + { + "epoch": 0.78, + "learning_rate": 2.336807247111723e-06, + "loss": 0.4237, + "step": 9903 + }, + { + "epoch": 0.78, + "learning_rate": 2.3351589268396193e-06, + "loss": 0.349, + "step": 9904 + }, + { + "epoch": 0.78, + "learning_rate": 2.3335111112604194e-06, + "loss": 0.323, + "step": 9905 + }, + { + "epoch": 0.78, + "learning_rate": 2.33186380048262e-06, + "loss": 0.4243, + "step": 9906 + }, + { + "epoch": 0.78, + "learning_rate": 2.330216994614696e-06, + "loss": 0.3426, + "step": 9907 + }, + { + "epoch": 0.78, + "learning_rate": 2.3285706937650786e-06, + "loss": 0.2958, + "step": 9908 + }, + { + "epoch": 0.79, + "learning_rate": 2.3269248980421653e-06, + "loss": 0.3865, + "step": 9909 + }, + { + "epoch": 0.79, + "learning_rate": 2.3252796075543295e-06, + "loss": 0.2519, + "step": 9910 + }, + { + "epoch": 0.79, + "learning_rate": 2.3236348224099038e-06, + "loss": 0.2706, + "step": 9911 + }, + { + "epoch": 0.79, + "learning_rate": 2.3219905427171864e-06, + "loss": 0.4111, + "step": 9912 + }, + { + "epoch": 0.79, + "learning_rate": 2.320346768584449e-06, + "loss": 0.3698, + "step": 9913 + }, + { + "epoch": 0.79, + "learning_rate": 2.3187035001199254e-06, + "loss": 0.319, + "step": 9914 + }, + { + "epoch": 0.79, + "learning_rate": 2.317060737431813e-06, + "loss": 0.328, + "step": 9915 + }, + { + "epoch": 0.79, + "learning_rate": 2.3154184806282863e-06, + "loss": 0.2343, + "step": 9916 + }, + { + "epoch": 0.79, + "learning_rate": 2.3137767298174774e-06, + "loss": 0.3193, + "step": 9917 + }, + { + "epoch": 0.79, + "learning_rate": 2.312135485107486e-06, + "loss": 0.305, + "step": 9918 + }, + { + "epoch": 0.79, + "learning_rate": 2.3104947466063785e-06, + "loss": 0.3053, + "step": 9919 + }, + { + "epoch": 0.79, + "learning_rate": 2.3088545144221964e-06, + "loss": 0.207, + "step": 9920 + }, + { + "epoch": 0.79, + "learning_rate": 2.307214788662936e-06, + "loss": 0.5311, + "step": 9921 + }, + { + "epoch": 0.79, + "learning_rate": 2.3055755694365644e-06, + "loss": 0.3456, + "step": 9922 + }, + { + "epoch": 0.79, + "learning_rate": 2.303936856851021e-06, + "loss": 0.2522, + "step": 9923 + }, + { + "epoch": 0.79, + "learning_rate": 2.302298651014204e-06, + "loss": 0.2279, + "step": 9924 + }, + { + "epoch": 0.79, + "learning_rate": 2.3006609520339796e-06, + "loss": 0.2817, + "step": 9925 + }, + { + "epoch": 0.79, + "learning_rate": 2.2990237600181864e-06, + "loss": 0.365, + "step": 9926 + }, + { + "epoch": 0.79, + "learning_rate": 2.2973870750746253e-06, + "loss": 0.292, + "step": 9927 + }, + { + "epoch": 0.79, + "learning_rate": 2.2957508973110586e-06, + "loss": 0.3198, + "step": 9928 + }, + { + "epoch": 0.79, + "learning_rate": 2.2941152268352284e-06, + "loss": 0.3635, + "step": 9929 + }, + { + "epoch": 0.79, + "learning_rate": 2.292480063754833e-06, + "loss": 0.3726, + "step": 9930 + }, + { + "epoch": 0.79, + "learning_rate": 2.2908454081775344e-06, + "loss": 0.3581, + "step": 9931 + }, + { + "epoch": 0.79, + "learning_rate": 2.2892112602109783e-06, + "loss": 0.3376, + "step": 9932 + }, + { + "epoch": 0.79, + "learning_rate": 2.2875776199627564e-06, + "loss": 0.2749, + "step": 9933 + }, + { + "epoch": 0.79, + "learning_rate": 2.2859444875404347e-06, + "loss": 0.3311, + "step": 9934 + }, + { + "epoch": 0.79, + "learning_rate": 2.2843118630515536e-06, + "loss": 0.409, + "step": 9935 + }, + { + "epoch": 0.79, + "learning_rate": 2.282679746603611e-06, + "loss": 0.3573, + "step": 9936 + }, + { + "epoch": 0.79, + "learning_rate": 2.281048138304072e-06, + "loss": 0.3202, + "step": 9937 + }, + { + "epoch": 0.79, + "learning_rate": 2.279417038260373e-06, + "loss": 0.3641, + "step": 9938 + }, + { + "epoch": 0.79, + "learning_rate": 2.2777864465799137e-06, + "loss": 0.3782, + "step": 9939 + }, + { + "epoch": 0.79, + "learning_rate": 2.276156363370058e-06, + "loss": 0.38, + "step": 9940 + }, + { + "epoch": 0.79, + "learning_rate": 2.274526788738143e-06, + "loss": 0.3007, + "step": 9941 + }, + { + "epoch": 0.79, + "learning_rate": 2.272897722791466e-06, + "loss": 0.3973, + "step": 9942 + }, + { + "epoch": 0.79, + "learning_rate": 2.271269165637294e-06, + "loss": 0.4765, + "step": 9943 + }, + { + "epoch": 0.79, + "learning_rate": 2.2696411173828557e-06, + "loss": 0.3343, + "step": 9944 + }, + { + "epoch": 0.79, + "learning_rate": 2.268013578135357e-06, + "loss": 0.3588, + "step": 9945 + }, + { + "epoch": 0.79, + "learning_rate": 2.266386548001961e-06, + "loss": 0.3481, + "step": 9946 + }, + { + "epoch": 0.79, + "learning_rate": 2.264760027089795e-06, + "loss": 0.4395, + "step": 9947 + }, + { + "epoch": 0.79, + "learning_rate": 2.2631340155059656e-06, + "loss": 0.2559, + "step": 9948 + }, + { + "epoch": 0.79, + "learning_rate": 2.261508513357532e-06, + "loss": 0.3723, + "step": 9949 + }, + { + "epoch": 0.79, + "learning_rate": 2.2598835207515267e-06, + "loss": 0.2055, + "step": 9950 + }, + { + "epoch": 0.79, + "learning_rate": 2.2582590377949497e-06, + "loss": 0.3446, + "step": 9951 + }, + { + "epoch": 0.79, + "learning_rate": 2.2566350645947656e-06, + "loss": 0.3887, + "step": 9952 + }, + { + "epoch": 0.79, + "learning_rate": 2.2550116012579004e-06, + "loss": 0.3261, + "step": 9953 + }, + { + "epoch": 0.79, + "learning_rate": 2.253388647891258e-06, + "loss": 0.3276, + "step": 9954 + }, + { + "epoch": 0.79, + "learning_rate": 2.2517662046016975e-06, + "loss": 0.1945, + "step": 9955 + }, + { + "epoch": 0.79, + "learning_rate": 2.250144271496049e-06, + "loss": 0.3976, + "step": 9956 + }, + { + "epoch": 0.79, + "learning_rate": 2.2485228486811128e-06, + "loss": 0.3173, + "step": 9957 + }, + { + "epoch": 0.79, + "learning_rate": 2.2469019362636478e-06, + "loss": 0.291, + "step": 9958 + }, + { + "epoch": 0.79, + "learning_rate": 2.2452815343503862e-06, + "loss": 0.295, + "step": 9959 + }, + { + "epoch": 0.79, + "learning_rate": 2.2436616430480197e-06, + "loss": 0.51, + "step": 9960 + }, + { + "epoch": 0.79, + "learning_rate": 2.2420422624632153e-06, + "loss": 0.39, + "step": 9961 + }, + { + "epoch": 0.79, + "learning_rate": 2.2404233927025985e-06, + "loss": 0.3205, + "step": 9962 + }, + { + "epoch": 0.79, + "learning_rate": 2.238805033872762e-06, + "loss": 0.3108, + "step": 9963 + }, + { + "epoch": 0.79, + "learning_rate": 2.237187186080273e-06, + "loss": 0.3487, + "step": 9964 + }, + { + "epoch": 0.79, + "learning_rate": 2.235569849431655e-06, + "loss": 0.3614, + "step": 9965 + }, + { + "epoch": 0.79, + "learning_rate": 2.2339530240333993e-06, + "loss": 0.3391, + "step": 9966 + }, + { + "epoch": 0.79, + "learning_rate": 2.2323367099919724e-06, + "loss": 0.3776, + "step": 9967 + }, + { + "epoch": 0.79, + "learning_rate": 2.230720907413797e-06, + "loss": 0.4767, + "step": 9968 + }, + { + "epoch": 0.79, + "learning_rate": 2.2291056164052638e-06, + "loss": 0.3223, + "step": 9969 + }, + { + "epoch": 0.79, + "learning_rate": 2.2274908370727376e-06, + "loss": 0.3156, + "step": 9970 + }, + { + "epoch": 0.79, + "learning_rate": 2.2258765695225416e-06, + "loss": 0.2964, + "step": 9971 + }, + { + "epoch": 0.79, + "learning_rate": 2.224262813860962e-06, + "loss": 0.2617, + "step": 9972 + }, + { + "epoch": 0.79, + "learning_rate": 2.2226495701942663e-06, + "loss": 0.3655, + "step": 9973 + }, + { + "epoch": 0.79, + "learning_rate": 2.2210368386286742e-06, + "loss": 0.3915, + "step": 9974 + }, + { + "epoch": 0.79, + "learning_rate": 2.219424619270375e-06, + "loss": 0.2435, + "step": 9975 + }, + { + "epoch": 0.79, + "learning_rate": 2.2178129122255255e-06, + "loss": 0.2612, + "step": 9976 + }, + { + "epoch": 0.79, + "learning_rate": 2.2162017176002514e-06, + "loss": 0.2895, + "step": 9977 + }, + { + "epoch": 0.79, + "learning_rate": 2.2145910355006415e-06, + "loss": 0.3867, + "step": 9978 + }, + { + "epoch": 0.79, + "learning_rate": 2.212980866032749e-06, + "loss": 0.4037, + "step": 9979 + }, + { + "epoch": 0.79, + "learning_rate": 2.2113712093025997e-06, + "loss": 0.3213, + "step": 9980 + }, + { + "epoch": 0.79, + "learning_rate": 2.20976206541618e-06, + "loss": 0.3341, + "step": 9981 + }, + { + "epoch": 0.79, + "learning_rate": 2.208153434479442e-06, + "loss": 0.3326, + "step": 9982 + }, + { + "epoch": 0.79, + "learning_rate": 2.20654531659831e-06, + "loss": 0.3498, + "step": 9983 + }, + { + "epoch": 0.79, + "learning_rate": 2.2049377118786696e-06, + "loss": 0.4275, + "step": 9984 + }, + { + "epoch": 0.79, + "learning_rate": 2.2033306204263704e-06, + "loss": 0.2749, + "step": 9985 + }, + { + "epoch": 0.79, + "learning_rate": 2.2017240423472384e-06, + "loss": 0.2952, + "step": 9986 + }, + { + "epoch": 0.79, + "learning_rate": 2.200117977747055e-06, + "loss": 0.2698, + "step": 9987 + }, + { + "epoch": 0.79, + "learning_rate": 2.198512426731568e-06, + "loss": 0.3201, + "step": 9988 + }, + { + "epoch": 0.79, + "learning_rate": 2.196907389406504e-06, + "loss": 0.3209, + "step": 9989 + }, + { + "epoch": 0.79, + "learning_rate": 2.195302865877541e-06, + "loss": 0.4504, + "step": 9990 + }, + { + "epoch": 0.79, + "learning_rate": 2.193698856250331e-06, + "loss": 0.3648, + "step": 9991 + }, + { + "epoch": 0.79, + "learning_rate": 2.1920953606304875e-06, + "loss": 0.4737, + "step": 9992 + }, + { + "epoch": 0.79, + "learning_rate": 2.1904923791235965e-06, + "loss": 0.3232, + "step": 9993 + }, + { + "epoch": 0.79, + "learning_rate": 2.188889911835207e-06, + "loss": 0.3326, + "step": 9994 + }, + { + "epoch": 0.79, + "learning_rate": 2.1872879588708286e-06, + "loss": 0.3592, + "step": 9995 + }, + { + "epoch": 0.79, + "learning_rate": 2.185686520335948e-06, + "loss": 0.3998, + "step": 9996 + }, + { + "epoch": 0.79, + "learning_rate": 2.184085596336011e-06, + "loss": 0.2959, + "step": 9997 + }, + { + "epoch": 0.79, + "learning_rate": 2.1824851869764262e-06, + "loss": 0.32, + "step": 9998 + }, + { + "epoch": 0.79, + "learning_rate": 2.1808852923625802e-06, + "loss": 0.3967, + "step": 9999 + }, + { + "epoch": 0.79, + "learning_rate": 2.1792859125998134e-06, + "loss": 0.3737, + "step": 10000 + }, + { + "epoch": 0.79, + "learning_rate": 2.1776870477934353e-06, + "loss": 0.2691, + "step": 10001 + }, + { + "epoch": 0.79, + "learning_rate": 2.1760886980487307e-06, + "loss": 0.3095, + "step": 10002 + }, + { + "epoch": 0.79, + "learning_rate": 2.174490863470938e-06, + "loss": 0.447, + "step": 10003 + }, + { + "epoch": 0.79, + "learning_rate": 2.1728935441652687e-06, + "loss": 0.2223, + "step": 10004 + }, + { + "epoch": 0.79, + "learning_rate": 2.1712967402368947e-06, + "loss": 0.2612, + "step": 10005 + }, + { + "epoch": 0.79, + "learning_rate": 2.169700451790964e-06, + "loss": 0.2888, + "step": 10006 + }, + { + "epoch": 0.79, + "learning_rate": 2.168104678932581e-06, + "loss": 0.3819, + "step": 10007 + }, + { + "epoch": 0.79, + "learning_rate": 2.166509421766818e-06, + "loss": 0.3267, + "step": 10008 + }, + { + "epoch": 0.79, + "learning_rate": 2.1649146803987197e-06, + "loss": 0.2047, + "step": 10009 + }, + { + "epoch": 0.79, + "learning_rate": 2.1633204549332897e-06, + "loss": 0.2415, + "step": 10010 + }, + { + "epoch": 0.79, + "learning_rate": 2.1617267454754996e-06, + "loss": 0.2991, + "step": 10011 + }, + { + "epoch": 0.79, + "learning_rate": 2.160133552130289e-06, + "loss": 0.2863, + "step": 10012 + }, + { + "epoch": 0.79, + "learning_rate": 2.1585408750025584e-06, + "loss": 0.417, + "step": 10013 + }, + { + "epoch": 0.79, + "learning_rate": 2.1569487141971824e-06, + "loss": 0.3136, + "step": 10014 + }, + { + "epoch": 0.79, + "learning_rate": 2.155357069818995e-06, + "loss": 0.2859, + "step": 10015 + }, + { + "epoch": 0.79, + "learning_rate": 2.1537659419727987e-06, + "loss": 0.3176, + "step": 10016 + }, + { + "epoch": 0.79, + "learning_rate": 2.152175330763359e-06, + "loss": 0.2705, + "step": 10017 + }, + { + "epoch": 0.79, + "learning_rate": 2.150585236295415e-06, + "loss": 0.2958, + "step": 10018 + }, + { + "epoch": 0.79, + "learning_rate": 2.148995658673665e-06, + "loss": 0.2892, + "step": 10019 + }, + { + "epoch": 0.79, + "learning_rate": 2.14740659800277e-06, + "loss": 0.2877, + "step": 10020 + }, + { + "epoch": 0.79, + "learning_rate": 2.1458180543873697e-06, + "loss": 0.2868, + "step": 10021 + }, + { + "epoch": 0.79, + "learning_rate": 2.1442300279320593e-06, + "loss": 0.3426, + "step": 10022 + }, + { + "epoch": 0.79, + "learning_rate": 2.142642518741399e-06, + "loss": 0.3862, + "step": 10023 + }, + { + "epoch": 0.79, + "learning_rate": 2.141055526919924e-06, + "loss": 0.3117, + "step": 10024 + }, + { + "epoch": 0.79, + "learning_rate": 2.1394690525721275e-06, + "loss": 0.3273, + "step": 10025 + }, + { + "epoch": 0.79, + "learning_rate": 2.137883095802469e-06, + "loss": 0.3798, + "step": 10026 + }, + { + "epoch": 0.79, + "learning_rate": 2.1362976567153813e-06, + "loss": 0.331, + "step": 10027 + }, + { + "epoch": 0.79, + "learning_rate": 2.134712735415255e-06, + "loss": 0.3822, + "step": 10028 + }, + { + "epoch": 0.79, + "learning_rate": 2.13312833200645e-06, + "loss": 0.3281, + "step": 10029 + }, + { + "epoch": 0.79, + "learning_rate": 2.131544446593289e-06, + "loss": 0.4041, + "step": 10030 + }, + { + "epoch": 0.79, + "learning_rate": 2.1299610792800675e-06, + "loss": 0.2411, + "step": 10031 + }, + { + "epoch": 0.79, + "learning_rate": 2.1283782301710408e-06, + "loss": 0.2827, + "step": 10032 + }, + { + "epoch": 0.79, + "learning_rate": 2.1267958993704297e-06, + "loss": 0.3901, + "step": 10033 + }, + { + "epoch": 0.79, + "learning_rate": 2.1252140869824266e-06, + "loss": 0.2449, + "step": 10034 + }, + { + "epoch": 0.8, + "learning_rate": 2.1236327931111868e-06, + "loss": 0.3191, + "step": 10035 + }, + { + "epoch": 0.8, + "learning_rate": 2.122052017860825e-06, + "loss": 0.2443, + "step": 10036 + }, + { + "epoch": 0.8, + "learning_rate": 2.120471761335434e-06, + "loss": 0.3571, + "step": 10037 + }, + { + "epoch": 0.8, + "learning_rate": 2.118892023639064e-06, + "loss": 0.2484, + "step": 10038 + }, + { + "epoch": 0.8, + "learning_rate": 2.1173128048757307e-06, + "loss": 0.3453, + "step": 10039 + }, + { + "epoch": 0.8, + "learning_rate": 2.115734105149422e-06, + "loss": 0.4595, + "step": 10040 + }, + { + "epoch": 0.8, + "learning_rate": 2.1141559245640865e-06, + "loss": 0.2666, + "step": 10041 + }, + { + "epoch": 0.8, + "learning_rate": 2.1125782632236357e-06, + "loss": 0.3196, + "step": 10042 + }, + { + "epoch": 0.8, + "learning_rate": 2.111001121231957e-06, + "loss": 0.3723, + "step": 10043 + }, + { + "epoch": 0.8, + "learning_rate": 2.1094244986928956e-06, + "loss": 0.3599, + "step": 10044 + }, + { + "epoch": 0.8, + "learning_rate": 2.1078483957102637e-06, + "loss": 0.3695, + "step": 10045 + }, + { + "epoch": 0.8, + "learning_rate": 2.1062728123878383e-06, + "loss": 0.2795, + "step": 10046 + }, + { + "epoch": 0.8, + "learning_rate": 2.1046977488293675e-06, + "loss": 0.3241, + "step": 10047 + }, + { + "epoch": 0.8, + "learning_rate": 2.1031232051385606e-06, + "loss": 0.3601, + "step": 10048 + }, + { + "epoch": 0.8, + "learning_rate": 2.1015491814190913e-06, + "loss": 0.4151, + "step": 10049 + }, + { + "epoch": 0.8, + "learning_rate": 2.099975677774606e-06, + "loss": 0.2869, + "step": 10050 + }, + { + "epoch": 0.8, + "learning_rate": 2.0984026943087087e-06, + "loss": 0.3454, + "step": 10051 + }, + { + "epoch": 0.8, + "learning_rate": 2.096830231124972e-06, + "loss": 0.3564, + "step": 10052 + }, + { + "epoch": 0.8, + "learning_rate": 2.0952582883269403e-06, + "loss": 0.4453, + "step": 10053 + }, + { + "epoch": 0.8, + "learning_rate": 2.093686866018114e-06, + "loss": 0.3426, + "step": 10054 + }, + { + "epoch": 0.8, + "learning_rate": 2.0921159643019627e-06, + "loss": 0.2103, + "step": 10055 + }, + { + "epoch": 0.8, + "learning_rate": 2.0905455832819277e-06, + "loss": 0.2486, + "step": 10056 + }, + { + "epoch": 0.8, + "learning_rate": 2.088975723061408e-06, + "loss": 0.3481, + "step": 10057 + }, + { + "epoch": 0.8, + "learning_rate": 2.0874063837437687e-06, + "loss": 0.3487, + "step": 10058 + }, + { + "epoch": 0.8, + "learning_rate": 2.085837565432349e-06, + "loss": 0.4444, + "step": 10059 + }, + { + "epoch": 0.8, + "learning_rate": 2.0842692682304442e-06, + "loss": 0.3984, + "step": 10060 + }, + { + "epoch": 0.8, + "learning_rate": 2.0827014922413213e-06, + "loss": 0.3417, + "step": 10061 + }, + { + "epoch": 0.8, + "learning_rate": 2.0811342375682065e-06, + "loss": 0.4211, + "step": 10062 + }, + { + "epoch": 0.8, + "learning_rate": 2.0795675043143016e-06, + "loss": 0.4355, + "step": 10063 + }, + { + "epoch": 0.8, + "learning_rate": 2.0780012925827653e-06, + "loss": 0.2519, + "step": 10064 + }, + { + "epoch": 0.8, + "learning_rate": 2.0764356024767228e-06, + "loss": 0.4138, + "step": 10065 + }, + { + "epoch": 0.8, + "learning_rate": 2.0748704340992743e-06, + "loss": 0.3389, + "step": 10066 + }, + { + "epoch": 0.8, + "learning_rate": 2.0733057875534734e-06, + "loss": 0.3125, + "step": 10067 + }, + { + "epoch": 0.8, + "learning_rate": 2.0717416629423425e-06, + "loss": 0.2433, + "step": 10068 + }, + { + "epoch": 0.8, + "learning_rate": 2.0701780603688783e-06, + "loss": 0.2112, + "step": 10069 + }, + { + "epoch": 0.8, + "learning_rate": 2.068614979936032e-06, + "loss": 0.3082, + "step": 10070 + }, + { + "epoch": 0.8, + "learning_rate": 2.0670524217467237e-06, + "loss": 0.3384, + "step": 10071 + }, + { + "epoch": 0.8, + "learning_rate": 2.0654903859038457e-06, + "loss": 0.3282, + "step": 10072 + }, + { + "epoch": 0.8, + "learning_rate": 2.0639288725102467e-06, + "loss": 0.311, + "step": 10073 + }, + { + "epoch": 0.8, + "learning_rate": 2.0623678816687433e-06, + "loss": 0.234, + "step": 10074 + }, + { + "epoch": 0.8, + "learning_rate": 2.0608074134821243e-06, + "loss": 0.3946, + "step": 10075 + }, + { + "epoch": 0.8, + "learning_rate": 2.0592474680531347e-06, + "loss": 0.2988, + "step": 10076 + }, + { + "epoch": 0.8, + "learning_rate": 2.0576880454844926e-06, + "loss": 0.3428, + "step": 10077 + }, + { + "epoch": 0.8, + "learning_rate": 2.0561291458788736e-06, + "loss": 0.2452, + "step": 10078 + }, + { + "epoch": 0.8, + "learning_rate": 2.0545707693389296e-06, + "loss": 0.247, + "step": 10079 + }, + { + "epoch": 0.8, + "learning_rate": 2.0530129159672685e-06, + "loss": 0.3277, + "step": 10080 + }, + { + "epoch": 0.8, + "learning_rate": 2.0514555858664663e-06, + "loss": 0.2131, + "step": 10081 + }, + { + "epoch": 0.8, + "learning_rate": 2.0498987791390713e-06, + "loss": 0.3316, + "step": 10082 + }, + { + "epoch": 0.8, + "learning_rate": 2.0483424958875876e-06, + "loss": 0.2409, + "step": 10083 + }, + { + "epoch": 0.8, + "learning_rate": 2.0467867362144867e-06, + "loss": 0.3455, + "step": 10084 + }, + { + "epoch": 0.8, + "learning_rate": 2.0452315002222134e-06, + "loss": 0.3251, + "step": 10085 + }, + { + "epoch": 0.8, + "learning_rate": 2.04367678801317e-06, + "loss": 0.2859, + "step": 10086 + }, + { + "epoch": 0.8, + "learning_rate": 2.0421225996897243e-06, + "loss": 0.304, + "step": 10087 + }, + { + "epoch": 0.8, + "learning_rate": 2.0405689353542204e-06, + "loss": 0.2735, + "step": 10088 + }, + { + "epoch": 0.8, + "learning_rate": 2.0390157951089506e-06, + "loss": 0.3677, + "step": 10089 + }, + { + "epoch": 0.8, + "learning_rate": 2.0374631790561815e-06, + "loss": 0.2916, + "step": 10090 + }, + { + "epoch": 0.8, + "learning_rate": 2.0359110872981526e-06, + "loss": 0.3299, + "step": 10091 + }, + { + "epoch": 0.8, + "learning_rate": 2.034359519937057e-06, + "loss": 0.4379, + "step": 10092 + }, + { + "epoch": 0.8, + "learning_rate": 2.032808477075057e-06, + "loss": 0.2472, + "step": 10093 + }, + { + "epoch": 0.8, + "learning_rate": 2.0312579588142846e-06, + "loss": 0.2783, + "step": 10094 + }, + { + "epoch": 0.8, + "learning_rate": 2.029707965256833e-06, + "loss": 0.3665, + "step": 10095 + }, + { + "epoch": 0.8, + "learning_rate": 2.0281584965047585e-06, + "loss": 0.2583, + "step": 10096 + }, + { + "epoch": 0.8, + "learning_rate": 2.0266095526600925e-06, + "loss": 0.2845, + "step": 10097 + }, + { + "epoch": 0.8, + "learning_rate": 2.0250611338248215e-06, + "loss": 0.3616, + "step": 10098 + }, + { + "epoch": 0.8, + "learning_rate": 2.0235132401008985e-06, + "loss": 0.2069, + "step": 10099 + }, + { + "epoch": 0.8, + "learning_rate": 2.0219658715902514e-06, + "loss": 0.2663, + "step": 10100 + }, + { + "epoch": 0.8, + "learning_rate": 2.0204190283947645e-06, + "loss": 0.4124, + "step": 10101 + }, + { + "epoch": 0.8, + "learning_rate": 2.0188727106162874e-06, + "loss": 0.3287, + "step": 10102 + }, + { + "epoch": 0.8, + "learning_rate": 2.017326918356639e-06, + "loss": 0.36, + "step": 10103 + }, + { + "epoch": 0.8, + "learning_rate": 2.0157816517176045e-06, + "loss": 0.4011, + "step": 10104 + }, + { + "epoch": 0.8, + "learning_rate": 2.0142369108009306e-06, + "loss": 0.4137, + "step": 10105 + }, + { + "epoch": 0.8, + "learning_rate": 2.012692695708328e-06, + "loss": 0.2625, + "step": 10106 + }, + { + "epoch": 0.8, + "learning_rate": 2.011149006541483e-06, + "loss": 0.2774, + "step": 10107 + }, + { + "epoch": 0.8, + "learning_rate": 2.0096058434020348e-06, + "loss": 0.3235, + "step": 10108 + }, + { + "epoch": 0.8, + "learning_rate": 2.0080632063915927e-06, + "loss": 0.2747, + "step": 10109 + }, + { + "epoch": 0.8, + "learning_rate": 2.0065210956117354e-06, + "loss": 0.3834, + "step": 10110 + }, + { + "epoch": 0.8, + "learning_rate": 2.0049795111640023e-06, + "loss": 0.4268, + "step": 10111 + }, + { + "epoch": 0.8, + "learning_rate": 2.0034384531498962e-06, + "loss": 0.2218, + "step": 10112 + }, + { + "epoch": 0.8, + "learning_rate": 2.0018979216708935e-06, + "loss": 0.4542, + "step": 10113 + }, + { + "epoch": 0.8, + "learning_rate": 2.000357916828428e-06, + "loss": 0.5005, + "step": 10114 + }, + { + "epoch": 0.8, + "learning_rate": 1.9988184387239027e-06, + "loss": 0.2409, + "step": 10115 + }, + { + "epoch": 0.8, + "learning_rate": 1.9972794874586808e-06, + "loss": 0.3844, + "step": 10116 + }, + { + "epoch": 0.8, + "learning_rate": 1.9957410631341e-06, + "loss": 0.3586, + "step": 10117 + }, + { + "epoch": 0.8, + "learning_rate": 1.9942031658514573e-06, + "loss": 0.2994, + "step": 10118 + }, + { + "epoch": 0.8, + "learning_rate": 1.992665795712011e-06, + "loss": 0.2893, + "step": 10119 + }, + { + "epoch": 0.8, + "learning_rate": 1.991128952816996e-06, + "loss": 0.363, + "step": 10120 + }, + { + "epoch": 0.8, + "learning_rate": 1.9895926372676042e-06, + "loss": 0.325, + "step": 10121 + }, + { + "epoch": 0.8, + "learning_rate": 1.988056849164991e-06, + "loss": 0.4384, + "step": 10122 + }, + { + "epoch": 0.8, + "learning_rate": 1.986521588610285e-06, + "loss": 0.2779, + "step": 10123 + }, + { + "epoch": 0.8, + "learning_rate": 1.9849868557045738e-06, + "loss": 0.3683, + "step": 10124 + }, + { + "epoch": 0.8, + "learning_rate": 1.9834526505489105e-06, + "loss": 0.3617, + "step": 10125 + }, + { + "epoch": 0.8, + "learning_rate": 1.9819189732443187e-06, + "loss": 0.3174, + "step": 10126 + }, + { + "epoch": 0.8, + "learning_rate": 1.9803858238917826e-06, + "loss": 0.2511, + "step": 10127 + }, + { + "epoch": 0.8, + "learning_rate": 1.97885320259225e-06, + "loss": 0.353, + "step": 10128 + }, + { + "epoch": 0.8, + "learning_rate": 1.9773211094466404e-06, + "loss": 0.3266, + "step": 10129 + }, + { + "epoch": 0.8, + "learning_rate": 1.975789544555834e-06, + "loss": 0.378, + "step": 10130 + }, + { + "epoch": 0.8, + "learning_rate": 1.9742585080206754e-06, + "loss": 0.1475, + "step": 10131 + }, + { + "epoch": 0.8, + "learning_rate": 1.9727279999419745e-06, + "loss": 0.2484, + "step": 10132 + }, + { + "epoch": 0.8, + "learning_rate": 1.9711980204205115e-06, + "loss": 0.3646, + "step": 10133 + }, + { + "epoch": 0.8, + "learning_rate": 1.9696685695570285e-06, + "loss": 0.3461, + "step": 10134 + }, + { + "epoch": 0.8, + "learning_rate": 1.9681396474522264e-06, + "loss": 0.2905, + "step": 10135 + }, + { + "epoch": 0.8, + "learning_rate": 1.966611254206785e-06, + "loss": 0.3694, + "step": 10136 + }, + { + "epoch": 0.8, + "learning_rate": 1.9650833899213383e-06, + "loss": 0.4209, + "step": 10137 + }, + { + "epoch": 0.8, + "learning_rate": 1.963556054696487e-06, + "loss": 0.3066, + "step": 10138 + }, + { + "epoch": 0.8, + "learning_rate": 1.962029248632802e-06, + "loss": 0.3505, + "step": 10139 + }, + { + "epoch": 0.8, + "learning_rate": 1.9605029718308156e-06, + "loss": 0.3128, + "step": 10140 + }, + { + "epoch": 0.8, + "learning_rate": 1.958977224391021e-06, + "loss": 0.2732, + "step": 10141 + }, + { + "epoch": 0.8, + "learning_rate": 1.957452006413889e-06, + "loss": 0.4498, + "step": 10142 + }, + { + "epoch": 0.8, + "learning_rate": 1.955927317999844e-06, + "loss": 0.2811, + "step": 10143 + }, + { + "epoch": 0.8, + "learning_rate": 1.9544031592492763e-06, + "loss": 0.3613, + "step": 10144 + }, + { + "epoch": 0.8, + "learning_rate": 1.9528795302625515e-06, + "loss": 0.3773, + "step": 10145 + }, + { + "epoch": 0.8, + "learning_rate": 1.951356431139988e-06, + "loss": 0.3774, + "step": 10146 + }, + { + "epoch": 0.8, + "learning_rate": 1.949833861981877e-06, + "loss": 0.2824, + "step": 10147 + }, + { + "epoch": 0.8, + "learning_rate": 1.948311822888468e-06, + "loss": 0.4257, + "step": 10148 + }, + { + "epoch": 0.8, + "learning_rate": 1.9467903139599853e-06, + "loss": 0.2307, + "step": 10149 + }, + { + "epoch": 0.8, + "learning_rate": 1.945269335296611e-06, + "loss": 0.2715, + "step": 10150 + }, + { + "epoch": 0.8, + "learning_rate": 1.943748886998492e-06, + "loss": 0.3346, + "step": 10151 + }, + { + "epoch": 0.8, + "learning_rate": 1.942228969165748e-06, + "loss": 0.39, + "step": 10152 + }, + { + "epoch": 0.8, + "learning_rate": 1.940709581898453e-06, + "loss": 0.3102, + "step": 10153 + }, + { + "epoch": 0.8, + "learning_rate": 1.9391907252966522e-06, + "loss": 0.3582, + "step": 10154 + }, + { + "epoch": 0.8, + "learning_rate": 1.9376723994603574e-06, + "loss": 0.3232, + "step": 10155 + }, + { + "epoch": 0.8, + "learning_rate": 1.936154604489543e-06, + "loss": 0.3323, + "step": 10156 + }, + { + "epoch": 0.8, + "learning_rate": 1.9346373404841433e-06, + "loss": 0.3353, + "step": 10157 + }, + { + "epoch": 0.8, + "learning_rate": 1.93312060754407e-06, + "loss": 0.2937, + "step": 10158 + }, + { + "epoch": 0.8, + "learning_rate": 1.9316044057691886e-06, + "loss": 0.3082, + "step": 10159 + }, + { + "epoch": 0.8, + "learning_rate": 1.9300887352593355e-06, + "loss": 0.3295, + "step": 10160 + }, + { + "epoch": 0.8, + "learning_rate": 1.928573596114306e-06, + "loss": 0.3534, + "step": 10161 + }, + { + "epoch": 0.81, + "learning_rate": 1.9270589884338706e-06, + "loss": 0.3041, + "step": 10162 + }, + { + "epoch": 0.81, + "learning_rate": 1.9255449123177563e-06, + "loss": 0.2565, + "step": 10163 + }, + { + "epoch": 0.81, + "learning_rate": 1.924031367865655e-06, + "loss": 0.3702, + "step": 10164 + }, + { + "epoch": 0.81, + "learning_rate": 1.922518355177232e-06, + "loss": 0.2522, + "step": 10165 + }, + { + "epoch": 0.81, + "learning_rate": 1.921005874352109e-06, + "loss": 0.414, + "step": 10166 + }, + { + "epoch": 0.81, + "learning_rate": 1.9194939254898746e-06, + "loss": 0.3986, + "step": 10167 + }, + { + "epoch": 0.81, + "learning_rate": 1.917982508690085e-06, + "loss": 0.4709, + "step": 10168 + }, + { + "epoch": 0.81, + "learning_rate": 1.916471624052256e-06, + "loss": 0.402, + "step": 10169 + }, + { + "epoch": 0.81, + "learning_rate": 1.914961271675879e-06, + "loss": 0.3442, + "step": 10170 + }, + { + "epoch": 0.81, + "learning_rate": 1.9134514516603987e-06, + "loss": 0.326, + "step": 10171 + }, + { + "epoch": 0.81, + "learning_rate": 1.9119421641052294e-06, + "loss": 0.2905, + "step": 10172 + }, + { + "epoch": 0.81, + "learning_rate": 1.91043340910975e-06, + "loss": 0.3756, + "step": 10173 + }, + { + "epoch": 0.81, + "learning_rate": 1.908925186773308e-06, + "loss": 0.2288, + "step": 10174 + }, + { + "epoch": 0.81, + "learning_rate": 1.907417497195211e-06, + "loss": 0.3354, + "step": 10175 + }, + { + "epoch": 0.81, + "learning_rate": 1.9059103404747303e-06, + "loss": 0.4009, + "step": 10176 + }, + { + "epoch": 0.81, + "learning_rate": 1.9044037167111096e-06, + "loss": 0.3411, + "step": 10177 + }, + { + "epoch": 0.81, + "learning_rate": 1.9028976260035515e-06, + "loss": 0.2682, + "step": 10178 + }, + { + "epoch": 0.81, + "learning_rate": 1.901392068451221e-06, + "loss": 0.281, + "step": 10179 + }, + { + "epoch": 0.81, + "learning_rate": 1.8998870441532569e-06, + "loss": 0.3024, + "step": 10180 + }, + { + "epoch": 0.81, + "learning_rate": 1.8983825532087551e-06, + "loss": 0.3141, + "step": 10181 + }, + { + "epoch": 0.81, + "learning_rate": 1.8968785957167779e-06, + "loss": 0.3746, + "step": 10182 + }, + { + "epoch": 0.81, + "learning_rate": 1.8953751717763592e-06, + "loss": 0.283, + "step": 10183 + }, + { + "epoch": 0.81, + "learning_rate": 1.8938722814864863e-06, + "loss": 0.2674, + "step": 10184 + }, + { + "epoch": 0.81, + "learning_rate": 1.8923699249461214e-06, + "loss": 0.3943, + "step": 10185 + }, + { + "epoch": 0.81, + "learning_rate": 1.890868102254182e-06, + "loss": 0.341, + "step": 10186 + }, + { + "epoch": 0.81, + "learning_rate": 1.8893668135095611e-06, + "loss": 0.4204, + "step": 10187 + }, + { + "epoch": 0.81, + "learning_rate": 1.8878660588111108e-06, + "loss": 0.4325, + "step": 10188 + }, + { + "epoch": 0.81, + "learning_rate": 1.8863658382576444e-06, + "loss": 0.237, + "step": 10189 + }, + { + "epoch": 0.81, + "learning_rate": 1.8848661519479504e-06, + "loss": 0.2423, + "step": 10190 + }, + { + "epoch": 0.81, + "learning_rate": 1.8833669999807723e-06, + "loss": 0.3515, + "step": 10191 + }, + { + "epoch": 0.81, + "learning_rate": 1.88186838245482e-06, + "loss": 0.4092, + "step": 10192 + }, + { + "epoch": 0.81, + "learning_rate": 1.8803702994687755e-06, + "loss": 0.3721, + "step": 10193 + }, + { + "epoch": 0.81, + "learning_rate": 1.8788727511212768e-06, + "loss": 0.3617, + "step": 10194 + }, + { + "epoch": 0.81, + "learning_rate": 1.8773757375109292e-06, + "loss": 0.2681, + "step": 10195 + }, + { + "epoch": 0.81, + "learning_rate": 1.8758792587363084e-06, + "loss": 0.3408, + "step": 10196 + }, + { + "epoch": 0.81, + "learning_rate": 1.8743833148959479e-06, + "loss": 0.3189, + "step": 10197 + }, + { + "epoch": 0.81, + "learning_rate": 1.8728879060883443e-06, + "loss": 0.3039, + "step": 10198 + }, + { + "epoch": 0.81, + "learning_rate": 1.8713930324119711e-06, + "loss": 0.3761, + "step": 10199 + }, + { + "epoch": 0.81, + "learning_rate": 1.869898693965253e-06, + "loss": 0.361, + "step": 10200 + }, + { + "epoch": 0.81, + "learning_rate": 1.868404890846587e-06, + "loss": 0.3607, + "step": 10201 + }, + { + "epoch": 0.81, + "learning_rate": 1.8669116231543294e-06, + "loss": 0.2248, + "step": 10202 + }, + { + "epoch": 0.81, + "learning_rate": 1.865418890986811e-06, + "loss": 0.3339, + "step": 10203 + }, + { + "epoch": 0.81, + "learning_rate": 1.8639266944423163e-06, + "loss": 0.2136, + "step": 10204 + }, + { + "epoch": 0.81, + "learning_rate": 1.8624350336190977e-06, + "loss": 0.4078, + "step": 10205 + }, + { + "epoch": 0.81, + "learning_rate": 1.8609439086153803e-06, + "loss": 0.417, + "step": 10206 + }, + { + "epoch": 0.81, + "learning_rate": 1.859453319529343e-06, + "loss": 0.4414, + "step": 10207 + }, + { + "epoch": 0.81, + "learning_rate": 1.857963266459133e-06, + "loss": 0.3941, + "step": 10208 + }, + { + "epoch": 0.81, + "learning_rate": 1.8564737495028673e-06, + "loss": 0.3069, + "step": 10209 + }, + { + "epoch": 0.81, + "learning_rate": 1.854984768758621e-06, + "loss": 0.4573, + "step": 10210 + }, + { + "epoch": 0.81, + "learning_rate": 1.853496324324434e-06, + "loss": 0.2994, + "step": 10211 + }, + { + "epoch": 0.81, + "learning_rate": 1.8520084162983176e-06, + "loss": 0.3622, + "step": 10212 + }, + { + "epoch": 0.81, + "learning_rate": 1.8505210447782418e-06, + "loss": 0.3393, + "step": 10213 + }, + { + "epoch": 0.81, + "learning_rate": 1.8490342098621395e-06, + "loss": 0.3585, + "step": 10214 + }, + { + "epoch": 0.81, + "learning_rate": 1.8475479116479166e-06, + "loss": 0.2994, + "step": 10215 + }, + { + "epoch": 0.81, + "learning_rate": 1.8460621502334375e-06, + "loss": 0.4245, + "step": 10216 + }, + { + "epoch": 0.81, + "learning_rate": 1.8445769257165314e-06, + "loss": 0.3659, + "step": 10217 + }, + { + "epoch": 0.81, + "learning_rate": 1.8430922381949912e-06, + "loss": 0.2858, + "step": 10218 + }, + { + "epoch": 0.81, + "learning_rate": 1.84160808776658e-06, + "loss": 0.2989, + "step": 10219 + }, + { + "epoch": 0.81, + "learning_rate": 1.8401244745290214e-06, + "loss": 0.3664, + "step": 10220 + }, + { + "epoch": 0.81, + "learning_rate": 1.838641398580001e-06, + "loss": 0.365, + "step": 10221 + }, + { + "epoch": 0.81, + "learning_rate": 1.8371588600171764e-06, + "loss": 0.3149, + "step": 10222 + }, + { + "epoch": 0.81, + "learning_rate": 1.8356768589381646e-06, + "loss": 0.3916, + "step": 10223 + }, + { + "epoch": 0.81, + "learning_rate": 1.8341953954405434e-06, + "loss": 0.2544, + "step": 10224 + }, + { + "epoch": 0.81, + "learning_rate": 1.832714469621868e-06, + "loss": 0.2711, + "step": 10225 + }, + { + "epoch": 0.81, + "learning_rate": 1.8312340815796458e-06, + "loss": 0.3366, + "step": 10226 + }, + { + "epoch": 0.81, + "learning_rate": 1.8297542314113515e-06, + "loss": 0.4361, + "step": 10227 + }, + { + "epoch": 0.81, + "learning_rate": 1.82827491921443e-06, + "loss": 0.3626, + "step": 10228 + }, + { + "epoch": 0.81, + "learning_rate": 1.8267961450862859e-06, + "loss": 0.2263, + "step": 10229 + }, + { + "epoch": 0.81, + "learning_rate": 1.8253179091242868e-06, + "loss": 0.3195, + "step": 10230 + }, + { + "epoch": 0.81, + "learning_rate": 1.8238402114257714e-06, + "loss": 0.3837, + "step": 10231 + }, + { + "epoch": 0.81, + "learning_rate": 1.8223630520880365e-06, + "loss": 0.3653, + "step": 10232 + }, + { + "epoch": 0.81, + "learning_rate": 1.8208864312083462e-06, + "loss": 0.3573, + "step": 10233 + }, + { + "epoch": 0.81, + "learning_rate": 1.8194103488839265e-06, + "loss": 0.2869, + "step": 10234 + }, + { + "epoch": 0.81, + "learning_rate": 1.817934805211976e-06, + "loss": 0.3562, + "step": 10235 + }, + { + "epoch": 0.81, + "learning_rate": 1.8164598002896484e-06, + "loss": 0.2596, + "step": 10236 + }, + { + "epoch": 0.81, + "learning_rate": 1.8149853342140644e-06, + "loss": 0.3183, + "step": 10237 + }, + { + "epoch": 0.81, + "learning_rate": 1.8135114070823145e-06, + "loss": 0.2953, + "step": 10238 + }, + { + "epoch": 0.81, + "learning_rate": 1.8120380189914476e-06, + "loss": 0.2717, + "step": 10239 + }, + { + "epoch": 0.81, + "learning_rate": 1.8105651700384764e-06, + "loss": 0.3414, + "step": 10240 + }, + { + "epoch": 0.81, + "learning_rate": 1.8090928603203871e-06, + "loss": 0.3361, + "step": 10241 + }, + { + "epoch": 0.81, + "learning_rate": 1.8076210899341196e-06, + "loss": 0.2393, + "step": 10242 + }, + { + "epoch": 0.81, + "learning_rate": 1.8061498589765824e-06, + "loss": 0.3512, + "step": 10243 + }, + { + "epoch": 0.81, + "learning_rate": 1.804679167544655e-06, + "loss": 0.3301, + "step": 10244 + }, + { + "epoch": 0.81, + "learning_rate": 1.8032090157351701e-06, + "loss": 0.3543, + "step": 10245 + }, + { + "epoch": 0.81, + "learning_rate": 1.8017394036449276e-06, + "loss": 0.2832, + "step": 10246 + }, + { + "epoch": 0.81, + "learning_rate": 1.8002703313706993e-06, + "loss": 0.2833, + "step": 10247 + }, + { + "epoch": 0.81, + "learning_rate": 1.7988017990092167e-06, + "loss": 0.2705, + "step": 10248 + }, + { + "epoch": 0.81, + "learning_rate": 1.797333806657171e-06, + "loss": 0.2907, + "step": 10249 + }, + { + "epoch": 0.81, + "learning_rate": 1.7958663544112277e-06, + "loss": 0.3612, + "step": 10250 + }, + { + "epoch": 0.81, + "learning_rate": 1.794399442368009e-06, + "loss": 0.3972, + "step": 10251 + }, + { + "epoch": 0.81, + "learning_rate": 1.7929330706241023e-06, + "loss": 0.3217, + "step": 10252 + }, + { + "epoch": 0.81, + "learning_rate": 1.7914672392760645e-06, + "loss": 0.3491, + "step": 10253 + }, + { + "epoch": 0.81, + "learning_rate": 1.7900019484204135e-06, + "loss": 0.4378, + "step": 10254 + }, + { + "epoch": 0.81, + "learning_rate": 1.788537198153627e-06, + "loss": 0.4221, + "step": 10255 + }, + { + "epoch": 0.81, + "learning_rate": 1.787072988572157e-06, + "loss": 0.3116, + "step": 10256 + }, + { + "epoch": 0.81, + "learning_rate": 1.7856093197724133e-06, + "loss": 0.3566, + "step": 10257 + }, + { + "epoch": 0.81, + "learning_rate": 1.7841461918507708e-06, + "loss": 0.3454, + "step": 10258 + }, + { + "epoch": 0.81, + "learning_rate": 1.7826836049035655e-06, + "loss": 0.477, + "step": 10259 + }, + { + "epoch": 0.81, + "learning_rate": 1.7812215590271099e-06, + "loss": 0.3467, + "step": 10260 + }, + { + "epoch": 0.81, + "learning_rate": 1.7797600543176675e-06, + "loss": 0.3882, + "step": 10261 + }, + { + "epoch": 0.81, + "learning_rate": 1.7782990908714703e-06, + "loss": 0.4153, + "step": 10262 + }, + { + "epoch": 0.81, + "learning_rate": 1.7768386687847194e-06, + "loss": 0.3274, + "step": 10263 + }, + { + "epoch": 0.81, + "learning_rate": 1.7753787881535757e-06, + "loss": 0.2615, + "step": 10264 + }, + { + "epoch": 0.81, + "learning_rate": 1.7739194490741607e-06, + "loss": 0.371, + "step": 10265 + }, + { + "epoch": 0.81, + "learning_rate": 1.7724606516425724e-06, + "loss": 0.2937, + "step": 10266 + }, + { + "epoch": 0.81, + "learning_rate": 1.7710023959548617e-06, + "loss": 0.4487, + "step": 10267 + }, + { + "epoch": 0.81, + "learning_rate": 1.7695446821070438e-06, + "loss": 0.3757, + "step": 10268 + }, + { + "epoch": 0.81, + "learning_rate": 1.76808751019511e-06, + "loss": 0.309, + "step": 10269 + }, + { + "epoch": 0.81, + "learning_rate": 1.7666308803150045e-06, + "loss": 0.3393, + "step": 10270 + }, + { + "epoch": 0.81, + "learning_rate": 1.7651747925626383e-06, + "loss": 0.4164, + "step": 10271 + }, + { + "epoch": 0.81, + "learning_rate": 1.763719247033886e-06, + "loss": 0.3572, + "step": 10272 + }, + { + "epoch": 0.81, + "learning_rate": 1.762264243824594e-06, + "loss": 0.3376, + "step": 10273 + }, + { + "epoch": 0.81, + "learning_rate": 1.7608097830305637e-06, + "loss": 0.3581, + "step": 10274 + }, + { + "epoch": 0.81, + "learning_rate": 1.7593558647475627e-06, + "loss": 0.3794, + "step": 10275 + }, + { + "epoch": 0.81, + "learning_rate": 1.7579024890713282e-06, + "loss": 0.3314, + "step": 10276 + }, + { + "epoch": 0.81, + "learning_rate": 1.7564496560975574e-06, + "loss": 0.4118, + "step": 10277 + }, + { + "epoch": 0.81, + "learning_rate": 1.7549973659219077e-06, + "loss": 0.2665, + "step": 10278 + }, + { + "epoch": 0.81, + "learning_rate": 1.7535456186400123e-06, + "loss": 0.2748, + "step": 10279 + }, + { + "epoch": 0.81, + "learning_rate": 1.7520944143474584e-06, + "loss": 0.2505, + "step": 10280 + }, + { + "epoch": 0.81, + "learning_rate": 1.750643753139798e-06, + "loss": 0.3807, + "step": 10281 + }, + { + "epoch": 0.81, + "learning_rate": 1.749193635112556e-06, + "loss": 0.3905, + "step": 10282 + }, + { + "epoch": 0.81, + "learning_rate": 1.7477440603612127e-06, + "loss": 0.3531, + "step": 10283 + }, + { + "epoch": 0.81, + "learning_rate": 1.746295028981213e-06, + "loss": 0.4261, + "step": 10284 + }, + { + "epoch": 0.81, + "learning_rate": 1.7448465410679737e-06, + "loss": 0.2564, + "step": 10285 + }, + { + "epoch": 0.81, + "learning_rate": 1.7433985967168686e-06, + "loss": 0.3112, + "step": 10286 + }, + { + "epoch": 0.81, + "learning_rate": 1.7419511960232384e-06, + "loss": 0.3838, + "step": 10287 + }, + { + "epoch": 0.82, + "learning_rate": 1.7405043390823827e-06, + "loss": 0.3549, + "step": 10288 + }, + { + "epoch": 0.82, + "learning_rate": 1.7390580259895783e-06, + "loss": 0.2876, + "step": 10289 + }, + { + "epoch": 0.82, + "learning_rate": 1.7376122568400533e-06, + "loss": 0.3527, + "step": 10290 + }, + { + "epoch": 0.82, + "learning_rate": 1.7361670317290014e-06, + "loss": 0.3601, + "step": 10291 + }, + { + "epoch": 0.82, + "learning_rate": 1.7347223507515908e-06, + "loss": 0.2923, + "step": 10292 + }, + { + "epoch": 0.82, + "learning_rate": 1.7332782140029436e-06, + "loss": 0.3708, + "step": 10293 + }, + { + "epoch": 0.82, + "learning_rate": 1.7318346215781468e-06, + "loss": 0.3406, + "step": 10294 + }, + { + "epoch": 0.82, + "learning_rate": 1.7303915735722586e-06, + "loss": 0.3228, + "step": 10295 + }, + { + "epoch": 0.82, + "learning_rate": 1.7289490700802947e-06, + "loss": 0.4189, + "step": 10296 + }, + { + "epoch": 0.82, + "learning_rate": 1.727507111197233e-06, + "loss": 0.3679, + "step": 10297 + }, + { + "epoch": 0.82, + "learning_rate": 1.7260656970180268e-06, + "loss": 0.2652, + "step": 10298 + }, + { + "epoch": 0.82, + "learning_rate": 1.7246248276375832e-06, + "loss": 0.3565, + "step": 10299 + }, + { + "epoch": 0.82, + "learning_rate": 1.7231845031507732e-06, + "loss": 0.3053, + "step": 10300 + }, + { + "epoch": 0.82, + "learning_rate": 1.72174472365244e-06, + "loss": 0.42, + "step": 10301 + }, + { + "epoch": 0.82, + "learning_rate": 1.720305489237385e-06, + "loss": 0.4335, + "step": 10302 + }, + { + "epoch": 0.82, + "learning_rate": 1.718866800000375e-06, + "loss": 0.312, + "step": 10303 + }, + { + "epoch": 0.82, + "learning_rate": 1.7174286560361364e-06, + "loss": 0.4007, + "step": 10304 + }, + { + "epoch": 0.82, + "learning_rate": 1.7159910574393702e-06, + "loss": 0.3226, + "step": 10305 + }, + { + "epoch": 0.82, + "learning_rate": 1.7145540043047327e-06, + "loss": 0.378, + "step": 10306 + }, + { + "epoch": 0.82, + "learning_rate": 1.713117496726845e-06, + "loss": 0.2767, + "step": 10307 + }, + { + "epoch": 0.82, + "learning_rate": 1.711681534800298e-06, + "loss": 0.4383, + "step": 10308 + }, + { + "epoch": 0.82, + "learning_rate": 1.7102461186196418e-06, + "loss": 0.3961, + "step": 10309 + }, + { + "epoch": 0.82, + "learning_rate": 1.7088112482793872e-06, + "loss": 0.3433, + "step": 10310 + }, + { + "epoch": 0.82, + "learning_rate": 1.7073769238740213e-06, + "loss": 0.4698, + "step": 10311 + }, + { + "epoch": 0.82, + "learning_rate": 1.7059431454979825e-06, + "loss": 0.3494, + "step": 10312 + }, + { + "epoch": 0.82, + "learning_rate": 1.7045099132456766e-06, + "loss": 0.3626, + "step": 10313 + }, + { + "epoch": 0.82, + "learning_rate": 1.7030772272114803e-06, + "loss": 0.4136, + "step": 10314 + }, + { + "epoch": 0.82, + "learning_rate": 1.7016450874897273e-06, + "loss": 0.275, + "step": 10315 + }, + { + "epoch": 0.82, + "learning_rate": 1.7002134941747116e-06, + "loss": 0.3383, + "step": 10316 + }, + { + "epoch": 0.82, + "learning_rate": 1.698782447360705e-06, + "loss": 0.3057, + "step": 10317 + }, + { + "epoch": 0.82, + "learning_rate": 1.697351947141932e-06, + "loss": 0.2761, + "step": 10318 + }, + { + "epoch": 0.82, + "learning_rate": 1.6959219936125827e-06, + "loss": 0.3718, + "step": 10319 + }, + { + "epoch": 0.82, + "learning_rate": 1.6944925868668106e-06, + "loss": 0.3512, + "step": 10320 + }, + { + "epoch": 0.82, + "learning_rate": 1.6930637269987415e-06, + "loss": 0.3478, + "step": 10321 + }, + { + "epoch": 0.82, + "learning_rate": 1.691635414102455e-06, + "loss": 0.3923, + "step": 10322 + }, + { + "epoch": 0.82, + "learning_rate": 1.6902076482719987e-06, + "loss": 0.4553, + "step": 10323 + }, + { + "epoch": 0.82, + "learning_rate": 1.6887804296013854e-06, + "loss": 0.3749, + "step": 10324 + }, + { + "epoch": 0.82, + "learning_rate": 1.6873537581845866e-06, + "loss": 0.3488, + "step": 10325 + }, + { + "epoch": 0.82, + "learning_rate": 1.6859276341155483e-06, + "loss": 0.3784, + "step": 10326 + }, + { + "epoch": 0.82, + "learning_rate": 1.68450205748817e-06, + "loss": 0.4157, + "step": 10327 + }, + { + "epoch": 0.82, + "learning_rate": 1.6830770283963194e-06, + "loss": 0.3039, + "step": 10328 + }, + { + "epoch": 0.82, + "learning_rate": 1.6816525469338252e-06, + "loss": 0.2946, + "step": 10329 + }, + { + "epoch": 0.82, + "learning_rate": 1.6802286131944889e-06, + "loss": 0.2995, + "step": 10330 + }, + { + "epoch": 0.82, + "learning_rate": 1.6788052272720656e-06, + "loss": 0.2854, + "step": 10331 + }, + { + "epoch": 0.82, + "learning_rate": 1.677382389260277e-06, + "loss": 0.3684, + "step": 10332 + }, + { + "epoch": 0.82, + "learning_rate": 1.6759600992528147e-06, + "loss": 0.3097, + "step": 10333 + }, + { + "epoch": 0.82, + "learning_rate": 1.674538357343326e-06, + "loss": 0.3842, + "step": 10334 + }, + { + "epoch": 0.82, + "learning_rate": 1.6731171636254263e-06, + "loss": 0.3835, + "step": 10335 + }, + { + "epoch": 0.82, + "learning_rate": 1.6716965181926959e-06, + "loss": 0.361, + "step": 10336 + }, + { + "epoch": 0.82, + "learning_rate": 1.670276421138677e-06, + "loss": 0.3729, + "step": 10337 + }, + { + "epoch": 0.82, + "learning_rate": 1.6688568725568732e-06, + "loss": 0.4115, + "step": 10338 + }, + { + "epoch": 0.82, + "learning_rate": 1.6674378725407603e-06, + "loss": 0.3192, + "step": 10339 + }, + { + "epoch": 0.82, + "learning_rate": 1.6660194211837687e-06, + "loss": 0.3109, + "step": 10340 + }, + { + "epoch": 0.82, + "learning_rate": 1.6646015185792963e-06, + "loss": 0.3759, + "step": 10341 + }, + { + "epoch": 0.82, + "learning_rate": 1.6631841648207092e-06, + "loss": 0.3854, + "step": 10342 + }, + { + "epoch": 0.82, + "learning_rate": 1.6617673600013295e-06, + "loss": 0.3062, + "step": 10343 + }, + { + "epoch": 0.82, + "learning_rate": 1.6603511042144494e-06, + "loss": 0.284, + "step": 10344 + }, + { + "epoch": 0.82, + "learning_rate": 1.6589353975533174e-06, + "loss": 0.3639, + "step": 10345 + }, + { + "epoch": 0.82, + "learning_rate": 1.6575202401111578e-06, + "loss": 0.3559, + "step": 10346 + }, + { + "epoch": 0.82, + "learning_rate": 1.6561056319811497e-06, + "loss": 0.3893, + "step": 10347 + }, + { + "epoch": 0.82, + "learning_rate": 1.654691573256434e-06, + "loss": 0.3813, + "step": 10348 + }, + { + "epoch": 0.82, + "learning_rate": 1.653278064030126e-06, + "loss": 0.3312, + "step": 10349 + }, + { + "epoch": 0.82, + "learning_rate": 1.651865104395296e-06, + "loss": 0.4636, + "step": 10350 + }, + { + "epoch": 0.82, + "learning_rate": 1.6504526944449772e-06, + "loss": 0.3962, + "step": 10351 + }, + { + "epoch": 0.82, + "learning_rate": 1.6490408342721764e-06, + "loss": 0.2636, + "step": 10352 + }, + { + "epoch": 0.82, + "learning_rate": 1.6476295239698537e-06, + "loss": 0.3748, + "step": 10353 + }, + { + "epoch": 0.82, + "learning_rate": 1.6462187636309345e-06, + "loss": 0.3277, + "step": 10354 + }, + { + "epoch": 0.82, + "learning_rate": 1.6448085533483172e-06, + "loss": 0.4327, + "step": 10355 + }, + { + "epoch": 0.82, + "learning_rate": 1.6433988932148547e-06, + "loss": 0.3312, + "step": 10356 + }, + { + "epoch": 0.82, + "learning_rate": 1.6419897833233644e-06, + "loss": 0.3831, + "step": 10357 + }, + { + "epoch": 0.82, + "learning_rate": 1.6405812237666296e-06, + "loss": 0.3363, + "step": 10358 + }, + { + "epoch": 0.82, + "learning_rate": 1.6391732146373994e-06, + "loss": 0.3088, + "step": 10359 + }, + { + "epoch": 0.82, + "learning_rate": 1.6377657560283844e-06, + "loss": 0.2947, + "step": 10360 + }, + { + "epoch": 0.82, + "learning_rate": 1.6363588480322545e-06, + "loss": 0.3777, + "step": 10361 + }, + { + "epoch": 0.82, + "learning_rate": 1.6349524907416536e-06, + "loss": 0.3596, + "step": 10362 + }, + { + "epoch": 0.82, + "learning_rate": 1.6335466842491821e-06, + "loss": 0.272, + "step": 10363 + }, + { + "epoch": 0.82, + "learning_rate": 1.6321414286474014e-06, + "loss": 0.3955, + "step": 10364 + }, + { + "epoch": 0.82, + "learning_rate": 1.6307367240288463e-06, + "loss": 0.3796, + "step": 10365 + }, + { + "epoch": 0.82, + "learning_rate": 1.6293325704860087e-06, + "loss": 0.3149, + "step": 10366 + }, + { + "epoch": 0.82, + "learning_rate": 1.6279289681113407e-06, + "loss": 0.3472, + "step": 10367 + }, + { + "epoch": 0.82, + "learning_rate": 1.626525916997269e-06, + "loss": 0.3156, + "step": 10368 + }, + { + "epoch": 0.82, + "learning_rate": 1.6251234172361763e-06, + "loss": 0.3058, + "step": 10369 + }, + { + "epoch": 0.82, + "learning_rate": 1.623721468920405e-06, + "loss": 0.2971, + "step": 10370 + }, + { + "epoch": 0.82, + "learning_rate": 1.6223200721422739e-06, + "loss": 0.3186, + "step": 10371 + }, + { + "epoch": 0.82, + "learning_rate": 1.6209192269940555e-06, + "loss": 0.351, + "step": 10372 + }, + { + "epoch": 0.82, + "learning_rate": 1.6195189335679884e-06, + "loss": 0.3274, + "step": 10373 + }, + { + "epoch": 0.82, + "learning_rate": 1.6181191919562734e-06, + "loss": 0.4711, + "step": 10374 + }, + { + "epoch": 0.82, + "learning_rate": 1.6167200022510799e-06, + "loss": 0.2851, + "step": 10375 + }, + { + "epoch": 0.82, + "learning_rate": 1.6153213645445376e-06, + "loss": 0.3999, + "step": 10376 + }, + { + "epoch": 0.82, + "learning_rate": 1.613923278928735e-06, + "loss": 0.3799, + "step": 10377 + }, + { + "epoch": 0.82, + "learning_rate": 1.6125257454957365e-06, + "loss": 0.4959, + "step": 10378 + }, + { + "epoch": 0.82, + "learning_rate": 1.6111287643375607e-06, + "loss": 0.4206, + "step": 10379 + }, + { + "epoch": 0.82, + "learning_rate": 1.6097323355461869e-06, + "loss": 0.3561, + "step": 10380 + }, + { + "epoch": 0.82, + "learning_rate": 1.6083364592135708e-06, + "loss": 0.3039, + "step": 10381 + }, + { + "epoch": 0.82, + "learning_rate": 1.6069411354316212e-06, + "loss": 0.4248, + "step": 10382 + }, + { + "epoch": 0.82, + "learning_rate": 1.6055463642922098e-06, + "loss": 0.2318, + "step": 10383 + }, + { + "epoch": 0.82, + "learning_rate": 1.6041521458871812e-06, + "loss": 0.3111, + "step": 10384 + }, + { + "epoch": 0.82, + "learning_rate": 1.6027584803083351e-06, + "loss": 0.3581, + "step": 10385 + }, + { + "epoch": 0.82, + "learning_rate": 1.6013653676474371e-06, + "loss": 0.367, + "step": 10386 + }, + { + "epoch": 0.82, + "learning_rate": 1.5999728079962197e-06, + "loss": 0.3411, + "step": 10387 + }, + { + "epoch": 0.82, + "learning_rate": 1.5985808014463745e-06, + "loss": 0.3894, + "step": 10388 + }, + { + "epoch": 0.82, + "learning_rate": 1.5971893480895583e-06, + "loss": 0.3213, + "step": 10389 + }, + { + "epoch": 0.82, + "learning_rate": 1.5957984480173893e-06, + "loss": 0.3015, + "step": 10390 + }, + { + "epoch": 0.82, + "learning_rate": 1.5944081013214575e-06, + "loss": 0.2749, + "step": 10391 + }, + { + "epoch": 0.82, + "learning_rate": 1.593018308093306e-06, + "loss": 0.4122, + "step": 10392 + }, + { + "epoch": 0.82, + "learning_rate": 1.5916290684244452e-06, + "loss": 0.4815, + "step": 10393 + }, + { + "epoch": 0.82, + "learning_rate": 1.5902403824063539e-06, + "loss": 0.3773, + "step": 10394 + }, + { + "epoch": 0.82, + "learning_rate": 1.5888522501304682e-06, + "loss": 0.3444, + "step": 10395 + }, + { + "epoch": 0.82, + "learning_rate": 1.587464671688187e-06, + "loss": 0.3946, + "step": 10396 + }, + { + "epoch": 0.82, + "learning_rate": 1.5860776471708816e-06, + "loss": 0.3627, + "step": 10397 + }, + { + "epoch": 0.82, + "learning_rate": 1.5846911766698781e-06, + "loss": 0.3157, + "step": 10398 + }, + { + "epoch": 0.82, + "learning_rate": 1.5833052602764664e-06, + "loss": 0.3756, + "step": 10399 + }, + { + "epoch": 0.82, + "learning_rate": 1.5819198980819096e-06, + "loss": 0.2642, + "step": 10400 + }, + { + "epoch": 0.82, + "learning_rate": 1.5805350901774197e-06, + "loss": 0.3205, + "step": 10401 + }, + { + "epoch": 0.82, + "learning_rate": 1.5791508366541797e-06, + "loss": 0.3131, + "step": 10402 + }, + { + "epoch": 0.82, + "learning_rate": 1.577767137603341e-06, + "loss": 0.3313, + "step": 10403 + }, + { + "epoch": 0.82, + "learning_rate": 1.5763839931160108e-06, + "loss": 0.266, + "step": 10404 + }, + { + "epoch": 0.82, + "learning_rate": 1.5750014032832617e-06, + "loss": 0.3413, + "step": 10405 + }, + { + "epoch": 0.82, + "learning_rate": 1.5736193681961332e-06, + "loss": 0.2329, + "step": 10406 + }, + { + "epoch": 0.82, + "learning_rate": 1.5722378879456234e-06, + "loss": 0.3391, + "step": 10407 + }, + { + "epoch": 0.82, + "learning_rate": 1.5708569626226954e-06, + "loss": 0.2625, + "step": 10408 + }, + { + "epoch": 0.82, + "learning_rate": 1.5694765923182798e-06, + "loss": 0.2468, + "step": 10409 + }, + { + "epoch": 0.82, + "learning_rate": 1.5680967771232659e-06, + "loss": 0.2782, + "step": 10410 + }, + { + "epoch": 0.82, + "learning_rate": 1.5667175171285054e-06, + "loss": 0.2928, + "step": 10411 + }, + { + "epoch": 0.82, + "learning_rate": 1.5653388124248203e-06, + "loss": 0.3225, + "step": 10412 + }, + { + "epoch": 0.82, + "learning_rate": 1.5639606631029892e-06, + "loss": 0.3813, + "step": 10413 + }, + { + "epoch": 0.83, + "learning_rate": 1.5625830692537569e-06, + "loss": 0.4223, + "step": 10414 + }, + { + "epoch": 0.83, + "learning_rate": 1.561206030967828e-06, + "loss": 0.3123, + "step": 10415 + }, + { + "epoch": 0.83, + "learning_rate": 1.5598295483358804e-06, + "loss": 0.2991, + "step": 10416 + }, + { + "epoch": 0.83, + "learning_rate": 1.5584536214485457e-06, + "loss": 0.3187, + "step": 10417 + }, + { + "epoch": 0.83, + "learning_rate": 1.5570782503964188e-06, + "loss": 0.4159, + "step": 10418 + }, + { + "epoch": 0.83, + "learning_rate": 1.5557034352700672e-06, + "loss": 0.3835, + "step": 10419 + }, + { + "epoch": 0.83, + "learning_rate": 1.5543291761600133e-06, + "loss": 0.3484, + "step": 10420 + }, + { + "epoch": 0.83, + "learning_rate": 1.552955473156742e-06, + "loss": 0.3486, + "step": 10421 + }, + { + "epoch": 0.83, + "learning_rate": 1.5515823263507112e-06, + "loss": 0.3809, + "step": 10422 + }, + { + "epoch": 0.83, + "learning_rate": 1.5502097358323321e-06, + "loss": 0.2467, + "step": 10423 + }, + { + "epoch": 0.83, + "learning_rate": 1.548837701691983e-06, + "loss": 0.2482, + "step": 10424 + }, + { + "epoch": 0.83, + "learning_rate": 1.547466224020009e-06, + "loss": 0.2519, + "step": 10425 + }, + { + "epoch": 0.83, + "learning_rate": 1.5460953029067128e-06, + "loss": 0.3761, + "step": 10426 + }, + { + "epoch": 0.83, + "learning_rate": 1.5447249384423624e-06, + "loss": 0.347, + "step": 10427 + }, + { + "epoch": 0.83, + "learning_rate": 1.543355130717189e-06, + "loss": 0.2783, + "step": 10428 + }, + { + "epoch": 0.83, + "learning_rate": 1.5419858798213928e-06, + "loss": 0.3838, + "step": 10429 + }, + { + "epoch": 0.83, + "learning_rate": 1.540617185845128e-06, + "loss": 0.417, + "step": 10430 + }, + { + "epoch": 0.83, + "learning_rate": 1.5392490488785151e-06, + "loss": 0.2912, + "step": 10431 + }, + { + "epoch": 0.83, + "learning_rate": 1.537881469011645e-06, + "loss": 0.3933, + "step": 10432 + }, + { + "epoch": 0.83, + "learning_rate": 1.5365144463345627e-06, + "loss": 0.3174, + "step": 10433 + }, + { + "epoch": 0.83, + "learning_rate": 1.5351479809372772e-06, + "loss": 0.4494, + "step": 10434 + }, + { + "epoch": 0.83, + "learning_rate": 1.5337820729097697e-06, + "loss": 0.332, + "step": 10435 + }, + { + "epoch": 0.83, + "learning_rate": 1.5324167223419762e-06, + "loss": 0.4241, + "step": 10436 + }, + { + "epoch": 0.83, + "learning_rate": 1.5310519293237958e-06, + "loss": 0.3308, + "step": 10437 + }, + { + "epoch": 0.83, + "learning_rate": 1.5296876939450978e-06, + "loss": 0.3042, + "step": 10438 + }, + { + "epoch": 0.83, + "learning_rate": 1.528324016295709e-06, + "loss": 0.3652, + "step": 10439 + }, + { + "epoch": 0.83, + "learning_rate": 1.5269608964654181e-06, + "loss": 0.2761, + "step": 10440 + }, + { + "epoch": 0.83, + "learning_rate": 1.525598334543985e-06, + "loss": 0.2442, + "step": 10441 + }, + { + "epoch": 0.83, + "learning_rate": 1.524236330621125e-06, + "loss": 0.4285, + "step": 10442 + }, + { + "epoch": 0.83, + "learning_rate": 1.5228748847865205e-06, + "loss": 0.3242, + "step": 10443 + }, + { + "epoch": 0.83, + "learning_rate": 1.5215139971298131e-06, + "loss": 0.3698, + "step": 10444 + }, + { + "epoch": 0.83, + "learning_rate": 1.5201536677406147e-06, + "loss": 0.3542, + "step": 10445 + }, + { + "epoch": 0.83, + "learning_rate": 1.518793896708496e-06, + "loss": 0.2441, + "step": 10446 + }, + { + "epoch": 0.83, + "learning_rate": 1.517434684122987e-06, + "loss": 0.3038, + "step": 10447 + }, + { + "epoch": 0.83, + "learning_rate": 1.5160760300735911e-06, + "loss": 0.3217, + "step": 10448 + }, + { + "epoch": 0.83, + "learning_rate": 1.5147179346497665e-06, + "loss": 0.4435, + "step": 10449 + }, + { + "epoch": 0.83, + "learning_rate": 1.513360397940935e-06, + "loss": 0.4437, + "step": 10450 + }, + { + "epoch": 0.83, + "learning_rate": 1.5120034200364885e-06, + "loss": 0.4014, + "step": 10451 + }, + { + "epoch": 0.83, + "learning_rate": 1.5106470010257758e-06, + "loss": 0.2862, + "step": 10452 + }, + { + "epoch": 0.83, + "learning_rate": 1.509291140998107e-06, + "loss": 0.356, + "step": 10453 + }, + { + "epoch": 0.83, + "learning_rate": 1.5079358400427635e-06, + "loss": 0.3415, + "step": 10454 + }, + { + "epoch": 0.83, + "learning_rate": 1.5065810982489849e-06, + "loss": 0.3114, + "step": 10455 + }, + { + "epoch": 0.83, + "learning_rate": 1.5052269157059707e-06, + "loss": 0.2953, + "step": 10456 + }, + { + "epoch": 0.83, + "learning_rate": 1.503873292502892e-06, + "loss": 0.2538, + "step": 10457 + }, + { + "epoch": 0.83, + "learning_rate": 1.5025202287288764e-06, + "loss": 0.3714, + "step": 10458 + }, + { + "epoch": 0.83, + "learning_rate": 1.501167724473016e-06, + "loss": 0.3786, + "step": 10459 + }, + { + "epoch": 0.83, + "learning_rate": 1.499815779824365e-06, + "loss": 0.2611, + "step": 10460 + }, + { + "epoch": 0.83, + "learning_rate": 1.4984643948719469e-06, + "loss": 0.3154, + "step": 10461 + }, + { + "epoch": 0.83, + "learning_rate": 1.4971135697047422e-06, + "loss": 0.2922, + "step": 10462 + }, + { + "epoch": 0.83, + "learning_rate": 1.4957633044116925e-06, + "loss": 0.3288, + "step": 10463 + }, + { + "epoch": 0.83, + "learning_rate": 1.4944135990817121e-06, + "loss": 0.3059, + "step": 10464 + }, + { + "epoch": 0.83, + "learning_rate": 1.4930644538036709e-06, + "loss": 0.2652, + "step": 10465 + }, + { + "epoch": 0.83, + "learning_rate": 1.4917158686663992e-06, + "loss": 0.3141, + "step": 10466 + }, + { + "epoch": 0.83, + "learning_rate": 1.490367843758701e-06, + "loss": 0.3095, + "step": 10467 + }, + { + "epoch": 0.83, + "learning_rate": 1.4890203791693337e-06, + "loss": 0.3905, + "step": 10468 + }, + { + "epoch": 0.83, + "learning_rate": 1.4876734749870213e-06, + "loss": 0.2918, + "step": 10469 + }, + { + "epoch": 0.83, + "learning_rate": 1.4863271313004535e-06, + "loss": 0.3596, + "step": 10470 + }, + { + "epoch": 0.83, + "learning_rate": 1.4849813481982788e-06, + "loss": 0.4063, + "step": 10471 + }, + { + "epoch": 0.83, + "learning_rate": 1.483636125769108e-06, + "loss": 0.3299, + "step": 10472 + }, + { + "epoch": 0.83, + "learning_rate": 1.482291464101523e-06, + "loss": 0.3762, + "step": 10473 + }, + { + "epoch": 0.83, + "learning_rate": 1.480947363284061e-06, + "loss": 0.4178, + "step": 10474 + }, + { + "epoch": 0.83, + "learning_rate": 1.4796038234052235e-06, + "loss": 0.3604, + "step": 10475 + }, + { + "epoch": 0.83, + "learning_rate": 1.4782608445534741e-06, + "loss": 0.381, + "step": 10476 + }, + { + "epoch": 0.83, + "learning_rate": 1.4769184268172465e-06, + "loss": 0.3417, + "step": 10477 + }, + { + "epoch": 0.83, + "learning_rate": 1.4755765702849311e-06, + "loss": 0.4154, + "step": 10478 + }, + { + "epoch": 0.83, + "learning_rate": 1.4742352750448806e-06, + "loss": 0.3495, + "step": 10479 + }, + { + "epoch": 0.83, + "learning_rate": 1.4728945411854135e-06, + "loss": 0.4597, + "step": 10480 + }, + { + "epoch": 0.83, + "learning_rate": 1.4715543687948096e-06, + "loss": 0.3367, + "step": 10481 + }, + { + "epoch": 0.83, + "learning_rate": 1.470214757961317e-06, + "loss": 0.2748, + "step": 10482 + }, + { + "epoch": 0.83, + "learning_rate": 1.4688757087731386e-06, + "loss": 0.3359, + "step": 10483 + }, + { + "epoch": 0.83, + "learning_rate": 1.4675372213184458e-06, + "loss": 0.433, + "step": 10484 + }, + { + "epoch": 0.83, + "learning_rate": 1.4661992956853699e-06, + "loss": 0.3268, + "step": 10485 + }, + { + "epoch": 0.83, + "learning_rate": 1.4648619319620105e-06, + "loss": 0.3991, + "step": 10486 + }, + { + "epoch": 0.83, + "learning_rate": 1.463525130236424e-06, + "loss": 0.349, + "step": 10487 + }, + { + "epoch": 0.83, + "learning_rate": 1.4621888905966308e-06, + "loss": 0.3259, + "step": 10488 + }, + { + "epoch": 0.83, + "learning_rate": 1.4608532131306198e-06, + "loss": 0.438, + "step": 10489 + }, + { + "epoch": 0.83, + "learning_rate": 1.459518097926337e-06, + "loss": 0.3894, + "step": 10490 + }, + { + "epoch": 0.83, + "learning_rate": 1.4581835450716907e-06, + "loss": 0.3436, + "step": 10491 + }, + { + "epoch": 0.83, + "learning_rate": 1.4568495546545603e-06, + "loss": 0.3847, + "step": 10492 + }, + { + "epoch": 0.83, + "learning_rate": 1.4555161267627793e-06, + "loss": 0.4298, + "step": 10493 + }, + { + "epoch": 0.83, + "learning_rate": 1.4541832614841455e-06, + "loss": 0.3539, + "step": 10494 + }, + { + "epoch": 0.83, + "learning_rate": 1.4528509589064276e-06, + "loss": 0.2452, + "step": 10495 + }, + { + "epoch": 0.83, + "learning_rate": 1.4515192191173466e-06, + "loss": 0.3504, + "step": 10496 + }, + { + "epoch": 0.83, + "learning_rate": 1.45018804220459e-06, + "loss": 0.3249, + "step": 10497 + }, + { + "epoch": 0.83, + "learning_rate": 1.4488574282558143e-06, + "loss": 0.3262, + "step": 10498 + }, + { + "epoch": 0.83, + "learning_rate": 1.4475273773586319e-06, + "loss": 0.3119, + "step": 10499 + }, + { + "epoch": 0.83, + "learning_rate": 1.446197889600619e-06, + "loss": 0.3539, + "step": 10500 + }, + { + "epoch": 0.83, + "learning_rate": 1.444868965069315e-06, + "loss": 0.4093, + "step": 10501 + }, + { + "epoch": 0.83, + "learning_rate": 1.443540603852227e-06, + "loss": 0.2802, + "step": 10502 + }, + { + "epoch": 0.83, + "learning_rate": 1.4422128060368201e-06, + "loss": 0.2875, + "step": 10503 + }, + { + "epoch": 0.83, + "learning_rate": 1.4408855717105197e-06, + "loss": 0.3544, + "step": 10504 + }, + { + "epoch": 0.83, + "learning_rate": 1.4395589009607225e-06, + "loss": 0.2702, + "step": 10505 + }, + { + "epoch": 0.83, + "learning_rate": 1.4382327938747808e-06, + "loss": 0.2779, + "step": 10506 + }, + { + "epoch": 0.83, + "learning_rate": 1.4369072505400117e-06, + "loss": 0.3095, + "step": 10507 + }, + { + "epoch": 0.83, + "learning_rate": 1.4355822710436995e-06, + "loss": 0.3023, + "step": 10508 + }, + { + "epoch": 0.83, + "learning_rate": 1.4342578554730858e-06, + "loss": 0.3323, + "step": 10509 + }, + { + "epoch": 0.83, + "learning_rate": 1.4329340039153738e-06, + "loss": 0.2667, + "step": 10510 + }, + { + "epoch": 0.83, + "learning_rate": 1.4316107164577376e-06, + "loss": 0.3244, + "step": 10511 + }, + { + "epoch": 0.83, + "learning_rate": 1.430287993187307e-06, + "loss": 0.378, + "step": 10512 + }, + { + "epoch": 0.83, + "learning_rate": 1.4289658341911782e-06, + "loss": 0.2719, + "step": 10513 + }, + { + "epoch": 0.83, + "learning_rate": 1.4276442395564049e-06, + "loss": 0.3784, + "step": 10514 + }, + { + "epoch": 0.83, + "learning_rate": 1.426323209370014e-06, + "loss": 0.2881, + "step": 10515 + }, + { + "epoch": 0.83, + "learning_rate": 1.425002743718985e-06, + "loss": 0.4383, + "step": 10516 + }, + { + "epoch": 0.83, + "learning_rate": 1.4236828426902626e-06, + "loss": 0.3704, + "step": 10517 + }, + { + "epoch": 0.83, + "learning_rate": 1.4223635063707619e-06, + "loss": 0.3369, + "step": 10518 + }, + { + "epoch": 0.83, + "learning_rate": 1.421044734847351e-06, + "loss": 0.3026, + "step": 10519 + }, + { + "epoch": 0.83, + "learning_rate": 1.4197265282068618e-06, + "loss": 0.3863, + "step": 10520 + }, + { + "epoch": 0.83, + "learning_rate": 1.4184088865360978e-06, + "loss": 0.4496, + "step": 10521 + }, + { + "epoch": 0.83, + "learning_rate": 1.4170918099218166e-06, + "loss": 0.3204, + "step": 10522 + }, + { + "epoch": 0.83, + "learning_rate": 1.41577529845074e-06, + "loss": 0.4398, + "step": 10523 + }, + { + "epoch": 0.83, + "learning_rate": 1.4144593522095563e-06, + "loss": 0.3507, + "step": 10524 + }, + { + "epoch": 0.83, + "learning_rate": 1.4131439712849148e-06, + "loss": 0.3205, + "step": 10525 + }, + { + "epoch": 0.83, + "learning_rate": 1.4118291557634223e-06, + "loss": 0.4328, + "step": 10526 + }, + { + "epoch": 0.83, + "learning_rate": 1.410514905731658e-06, + "loss": 0.4305, + "step": 10527 + }, + { + "epoch": 0.83, + "learning_rate": 1.4092012212761574e-06, + "loss": 0.3708, + "step": 10528 + }, + { + "epoch": 0.83, + "learning_rate": 1.4078881024834213e-06, + "loss": 0.2158, + "step": 10529 + }, + { + "epoch": 0.83, + "learning_rate": 1.406575549439907e-06, + "loss": 0.2734, + "step": 10530 + }, + { + "epoch": 0.83, + "learning_rate": 1.4052635622320477e-06, + "loss": 0.4027, + "step": 10531 + }, + { + "epoch": 0.83, + "learning_rate": 1.4039521409462265e-06, + "loss": 0.287, + "step": 10532 + }, + { + "epoch": 0.83, + "learning_rate": 1.4026412856687931e-06, + "loss": 0.363, + "step": 10533 + }, + { + "epoch": 0.83, + "learning_rate": 1.4013309964860667e-06, + "loss": 0.3272, + "step": 10534 + }, + { + "epoch": 0.83, + "learning_rate": 1.4000212734843187e-06, + "loss": 0.2633, + "step": 10535 + }, + { + "epoch": 0.83, + "learning_rate": 1.3987121167497874e-06, + "loss": 0.2985, + "step": 10536 + }, + { + "epoch": 0.83, + "learning_rate": 1.3974035263686792e-06, + "loss": 0.2284, + "step": 10537 + }, + { + "epoch": 0.83, + "learning_rate": 1.396095502427155e-06, + "loss": 0.2549, + "step": 10538 + }, + { + "epoch": 0.83, + "learning_rate": 1.3947880450113404e-06, + "loss": 0.3367, + "step": 10539 + }, + { + "epoch": 0.84, + "learning_rate": 1.39348115420733e-06, + "loss": 0.3812, + "step": 10540 + }, + { + "epoch": 0.84, + "learning_rate": 1.392174830101174e-06, + "loss": 0.3971, + "step": 10541 + }, + { + "epoch": 0.84, + "learning_rate": 1.3908690727788842e-06, + "loss": 0.2392, + "step": 10542 + }, + { + "epoch": 0.84, + "learning_rate": 1.3895638823264447e-06, + "loss": 0.3823, + "step": 10543 + }, + { + "epoch": 0.84, + "learning_rate": 1.3882592588297917e-06, + "loss": 0.3389, + "step": 10544 + }, + { + "epoch": 0.84, + "learning_rate": 1.38695520237483e-06, + "loss": 0.233, + "step": 10545 + }, + { + "epoch": 0.84, + "learning_rate": 1.3856517130474235e-06, + "loss": 0.3553, + "step": 10546 + }, + { + "epoch": 0.84, + "learning_rate": 1.384348790933403e-06, + "loss": 0.4307, + "step": 10547 + }, + { + "epoch": 0.84, + "learning_rate": 1.3830464361185592e-06, + "loss": 0.3362, + "step": 10548 + }, + { + "epoch": 0.84, + "learning_rate": 1.3817446486886433e-06, + "loss": 0.2946, + "step": 10549 + }, + { + "epoch": 0.84, + "learning_rate": 1.3804434287293756e-06, + "loss": 0.3045, + "step": 10550 + }, + { + "epoch": 0.84, + "learning_rate": 1.3791427763264342e-06, + "loss": 0.4323, + "step": 10551 + }, + { + "epoch": 0.84, + "learning_rate": 1.3778426915654575e-06, + "loss": 0.3355, + "step": 10552 + }, + { + "epoch": 0.84, + "learning_rate": 1.3765431745320546e-06, + "loss": 0.3174, + "step": 10553 + }, + { + "epoch": 0.84, + "learning_rate": 1.3752442253117903e-06, + "loss": 0.3991, + "step": 10554 + }, + { + "epoch": 0.84, + "learning_rate": 1.373945843990192e-06, + "loss": 0.302, + "step": 10555 + }, + { + "epoch": 0.84, + "learning_rate": 1.3726480306527578e-06, + "loss": 0.2774, + "step": 10556 + }, + { + "epoch": 0.84, + "learning_rate": 1.3713507853849373e-06, + "loss": 0.4032, + "step": 10557 + }, + { + "epoch": 0.84, + "learning_rate": 1.3700541082721464e-06, + "loss": 0.3331, + "step": 10558 + }, + { + "epoch": 0.84, + "learning_rate": 1.3687579993997703e-06, + "loss": 0.419, + "step": 10559 + }, + { + "epoch": 0.84, + "learning_rate": 1.3674624588531481e-06, + "loss": 0.2634, + "step": 10560 + }, + { + "epoch": 0.84, + "learning_rate": 1.3661674867175844e-06, + "loss": 0.2641, + "step": 10561 + }, + { + "epoch": 0.84, + "learning_rate": 1.3648730830783507e-06, + "loss": 0.4362, + "step": 10562 + }, + { + "epoch": 0.84, + "learning_rate": 1.3635792480206744e-06, + "loss": 0.3362, + "step": 10563 + }, + { + "epoch": 0.84, + "learning_rate": 1.3622859816297473e-06, + "loss": 0.3493, + "step": 10564 + }, + { + "epoch": 0.84, + "learning_rate": 1.3609932839907281e-06, + "loss": 0.3093, + "step": 10565 + }, + { + "epoch": 0.84, + "learning_rate": 1.3597011551887329e-06, + "loss": 0.4282, + "step": 10566 + }, + { + "epoch": 0.84, + "learning_rate": 1.3584095953088405e-06, + "loss": 0.3181, + "step": 10567 + }, + { + "epoch": 0.84, + "learning_rate": 1.3571186044360973e-06, + "loss": 0.2797, + "step": 10568 + }, + { + "epoch": 0.84, + "learning_rate": 1.3558281826555065e-06, + "loss": 0.3707, + "step": 10569 + }, + { + "epoch": 0.84, + "learning_rate": 1.3545383300520375e-06, + "loss": 0.4279, + "step": 10570 + }, + { + "epoch": 0.84, + "learning_rate": 1.3532490467106186e-06, + "loss": 0.3558, + "step": 10571 + }, + { + "epoch": 0.84, + "learning_rate": 1.3519603327161456e-06, + "loss": 0.4063, + "step": 10572 + }, + { + "epoch": 0.84, + "learning_rate": 1.3506721881534734e-06, + "loss": 0.2538, + "step": 10573 + }, + { + "epoch": 0.84, + "learning_rate": 1.3493846131074173e-06, + "loss": 0.2626, + "step": 10574 + }, + { + "epoch": 0.84, + "learning_rate": 1.3480976076627617e-06, + "loss": 0.4668, + "step": 10575 + }, + { + "epoch": 0.84, + "learning_rate": 1.3468111719042497e-06, + "loss": 0.4082, + "step": 10576 + }, + { + "epoch": 0.84, + "learning_rate": 1.345525305916583e-06, + "loss": 0.2054, + "step": 10577 + }, + { + "epoch": 0.84, + "learning_rate": 1.3442400097844344e-06, + "loss": 0.2974, + "step": 10578 + }, + { + "epoch": 0.84, + "learning_rate": 1.342955283592432e-06, + "loss": 0.3436, + "step": 10579 + }, + { + "epoch": 0.84, + "learning_rate": 1.3416711274251671e-06, + "loss": 0.3425, + "step": 10580 + }, + { + "epoch": 0.84, + "learning_rate": 1.3403875413671997e-06, + "loss": 0.3221, + "step": 10581 + }, + { + "epoch": 0.84, + "learning_rate": 1.3391045255030444e-06, + "loss": 0.3786, + "step": 10582 + }, + { + "epoch": 0.84, + "learning_rate": 1.3378220799171815e-06, + "loss": 0.3, + "step": 10583 + }, + { + "epoch": 0.84, + "learning_rate": 1.3365402046940569e-06, + "loss": 0.3804, + "step": 10584 + }, + { + "epoch": 0.84, + "learning_rate": 1.3352588999180726e-06, + "loss": 0.3541, + "step": 10585 + }, + { + "epoch": 0.84, + "learning_rate": 1.3339781656735995e-06, + "loss": 0.2559, + "step": 10586 + }, + { + "epoch": 0.84, + "learning_rate": 1.3326980020449621e-06, + "loss": 0.2831, + "step": 10587 + }, + { + "epoch": 0.84, + "learning_rate": 1.3314184091164605e-06, + "loss": 0.2941, + "step": 10588 + }, + { + "epoch": 0.84, + "learning_rate": 1.3301393869723457e-06, + "loss": 0.4065, + "step": 10589 + }, + { + "epoch": 0.84, + "learning_rate": 1.328860935696833e-06, + "loss": 0.3475, + "step": 10590 + }, + { + "epoch": 0.84, + "learning_rate": 1.3275830553741066e-06, + "loss": 0.3014, + "step": 10591 + }, + { + "epoch": 0.84, + "learning_rate": 1.3263057460883078e-06, + "loss": 0.2264, + "step": 10592 + }, + { + "epoch": 0.84, + "learning_rate": 1.3250290079235383e-06, + "loss": 0.3168, + "step": 10593 + }, + { + "epoch": 0.84, + "learning_rate": 1.3237528409638688e-06, + "loss": 0.3347, + "step": 10594 + }, + { + "epoch": 0.84, + "learning_rate": 1.3224772452933277e-06, + "loss": 0.4263, + "step": 10595 + }, + { + "epoch": 0.84, + "learning_rate": 1.321202220995904e-06, + "loss": 0.3918, + "step": 10596 + }, + { + "epoch": 0.84, + "learning_rate": 1.3199277681555578e-06, + "loss": 0.3775, + "step": 10597 + }, + { + "epoch": 0.84, + "learning_rate": 1.3186538868562004e-06, + "loss": 0.3669, + "step": 10598 + }, + { + "epoch": 0.84, + "learning_rate": 1.3173805771817138e-06, + "loss": 0.2561, + "step": 10599 + }, + { + "epoch": 0.84, + "learning_rate": 1.3161078392159355e-06, + "loss": 0.4233, + "step": 10600 + }, + { + "epoch": 0.84, + "learning_rate": 1.3148356730426737e-06, + "loss": 0.2583, + "step": 10601 + }, + { + "epoch": 0.84, + "learning_rate": 1.3135640787456926e-06, + "loss": 0.3147, + "step": 10602 + }, + { + "epoch": 0.84, + "learning_rate": 1.312293056408719e-06, + "loss": 0.3961, + "step": 10603 + }, + { + "epoch": 0.84, + "learning_rate": 1.3110226061154462e-06, + "loss": 0.4568, + "step": 10604 + }, + { + "epoch": 0.84, + "learning_rate": 1.309752727949527e-06, + "loss": 0.2417, + "step": 10605 + }, + { + "epoch": 0.84, + "learning_rate": 1.3084834219945731e-06, + "loss": 0.2799, + "step": 10606 + }, + { + "epoch": 0.84, + "learning_rate": 1.3072146883341675e-06, + "loss": 0.4194, + "step": 10607 + }, + { + "epoch": 0.84, + "learning_rate": 1.3059465270518469e-06, + "loss": 0.3491, + "step": 10608 + }, + { + "epoch": 0.84, + "learning_rate": 1.3046789382311132e-06, + "loss": 0.2492, + "step": 10609 + }, + { + "epoch": 0.84, + "learning_rate": 1.3034119219554341e-06, + "loss": 0.2483, + "step": 10610 + }, + { + "epoch": 0.84, + "learning_rate": 1.3021454783082344e-06, + "loss": 0.2997, + "step": 10611 + }, + { + "epoch": 0.84, + "learning_rate": 1.3008796073729013e-06, + "loss": 0.365, + "step": 10612 + }, + { + "epoch": 0.84, + "learning_rate": 1.2996143092327906e-06, + "loss": 0.2266, + "step": 10613 + }, + { + "epoch": 0.84, + "learning_rate": 1.2983495839712146e-06, + "loss": 0.5668, + "step": 10614 + }, + { + "epoch": 0.84, + "learning_rate": 1.2970854316714477e-06, + "loss": 0.326, + "step": 10615 + }, + { + "epoch": 0.84, + "learning_rate": 1.2958218524167288e-06, + "loss": 0.2967, + "step": 10616 + }, + { + "epoch": 0.84, + "learning_rate": 1.2945588462902603e-06, + "loss": 0.3624, + "step": 10617 + }, + { + "epoch": 0.84, + "learning_rate": 1.2932964133752036e-06, + "loss": 0.2917, + "step": 10618 + }, + { + "epoch": 0.84, + "learning_rate": 1.292034553754683e-06, + "loss": 0.314, + "step": 10619 + }, + { + "epoch": 0.84, + "learning_rate": 1.2907732675117878e-06, + "loss": 0.4199, + "step": 10620 + }, + { + "epoch": 0.84, + "learning_rate": 1.2895125547295672e-06, + "loss": 0.3443, + "step": 10621 + }, + { + "epoch": 0.84, + "learning_rate": 1.2882524154910314e-06, + "loss": 0.3866, + "step": 10622 + }, + { + "epoch": 0.84, + "learning_rate": 1.2869928498791572e-06, + "loss": 0.3626, + "step": 10623 + }, + { + "epoch": 0.84, + "learning_rate": 1.2857338579768796e-06, + "loss": 0.245, + "step": 10624 + }, + { + "epoch": 0.84, + "learning_rate": 1.2844754398670954e-06, + "loss": 0.3584, + "step": 10625 + }, + { + "epoch": 0.84, + "learning_rate": 1.2832175956326686e-06, + "loss": 0.2861, + "step": 10626 + }, + { + "epoch": 0.84, + "learning_rate": 1.2819603253564206e-06, + "loss": 0.305, + "step": 10627 + }, + { + "epoch": 0.84, + "learning_rate": 1.280703629121135e-06, + "loss": 0.369, + "step": 10628 + }, + { + "epoch": 0.84, + "learning_rate": 1.2794475070095624e-06, + "loss": 0.4278, + "step": 10629 + }, + { + "epoch": 0.84, + "learning_rate": 1.2781919591044113e-06, + "loss": 0.3724, + "step": 10630 + }, + { + "epoch": 0.84, + "learning_rate": 1.2769369854883528e-06, + "loss": 0.3972, + "step": 10631 + }, + { + "epoch": 0.84, + "learning_rate": 1.2756825862440192e-06, + "loss": 0.3818, + "step": 10632 + }, + { + "epoch": 0.84, + "learning_rate": 1.2744287614540108e-06, + "loss": 0.3483, + "step": 10633 + }, + { + "epoch": 0.84, + "learning_rate": 1.2731755112008838e-06, + "loss": 0.3757, + "step": 10634 + }, + { + "epoch": 0.84, + "learning_rate": 1.2719228355671576e-06, + "loss": 0.2951, + "step": 10635 + }, + { + "epoch": 0.84, + "learning_rate": 1.2706707346353165e-06, + "loss": 0.2402, + "step": 10636 + }, + { + "epoch": 0.84, + "learning_rate": 1.2694192084878032e-06, + "loss": 0.354, + "step": 10637 + }, + { + "epoch": 0.84, + "learning_rate": 1.2681682572070275e-06, + "loss": 0.3551, + "step": 10638 + }, + { + "epoch": 0.84, + "learning_rate": 1.2669178808753568e-06, + "loss": 0.3005, + "step": 10639 + }, + { + "epoch": 0.84, + "learning_rate": 1.265668079575124e-06, + "loss": 0.3789, + "step": 10640 + }, + { + "epoch": 0.84, + "learning_rate": 1.264418853388618e-06, + "loss": 0.2193, + "step": 10641 + }, + { + "epoch": 0.84, + "learning_rate": 1.2631702023980997e-06, + "loss": 0.2824, + "step": 10642 + }, + { + "epoch": 0.84, + "learning_rate": 1.2619221266857851e-06, + "loss": 0.2757, + "step": 10643 + }, + { + "epoch": 0.84, + "learning_rate": 1.260674626333851e-06, + "loss": 0.3782, + "step": 10644 + }, + { + "epoch": 0.84, + "learning_rate": 1.259427701424445e-06, + "loss": 0.404, + "step": 10645 + }, + { + "epoch": 0.84, + "learning_rate": 1.2581813520396668e-06, + "loss": 0.3112, + "step": 10646 + }, + { + "epoch": 0.84, + "learning_rate": 1.256935578261581e-06, + "loss": 0.2766, + "step": 10647 + }, + { + "epoch": 0.84, + "learning_rate": 1.255690380172222e-06, + "loss": 0.3413, + "step": 10648 + }, + { + "epoch": 0.84, + "learning_rate": 1.2544457578535764e-06, + "loss": 0.4892, + "step": 10649 + }, + { + "epoch": 0.84, + "learning_rate": 1.253201711387594e-06, + "loss": 0.2457, + "step": 10650 + }, + { + "epoch": 0.84, + "learning_rate": 1.2519582408561936e-06, + "loss": 0.3437, + "step": 10651 + }, + { + "epoch": 0.84, + "learning_rate": 1.2507153463412513e-06, + "loss": 0.2739, + "step": 10652 + }, + { + "epoch": 0.84, + "learning_rate": 1.2494730279246014e-06, + "loss": 0.3219, + "step": 10653 + }, + { + "epoch": 0.84, + "learning_rate": 1.2482312856880506e-06, + "loss": 0.3197, + "step": 10654 + }, + { + "epoch": 0.84, + "learning_rate": 1.2469901197133582e-06, + "loss": 0.4678, + "step": 10655 + }, + { + "epoch": 0.84, + "learning_rate": 1.2457495300822497e-06, + "loss": 0.3644, + "step": 10656 + }, + { + "epoch": 0.84, + "learning_rate": 1.244509516876411e-06, + "loss": 0.2478, + "step": 10657 + }, + { + "epoch": 0.84, + "learning_rate": 1.2432700801774923e-06, + "loss": 0.3279, + "step": 10658 + }, + { + "epoch": 0.84, + "learning_rate": 1.2420312200671048e-06, + "loss": 0.364, + "step": 10659 + }, + { + "epoch": 0.84, + "learning_rate": 1.240792936626819e-06, + "loss": 0.3475, + "step": 10660 + }, + { + "epoch": 0.84, + "learning_rate": 1.2395552299381742e-06, + "loss": 0.3244, + "step": 10661 + }, + { + "epoch": 0.84, + "learning_rate": 1.238318100082664e-06, + "loss": 0.3126, + "step": 10662 + }, + { + "epoch": 0.84, + "learning_rate": 1.2370815471417464e-06, + "loss": 0.3963, + "step": 10663 + }, + { + "epoch": 0.84, + "learning_rate": 1.2358455711968463e-06, + "loss": 0.3158, + "step": 10664 + }, + { + "epoch": 0.84, + "learning_rate": 1.2346101723293457e-06, + "loss": 0.3255, + "step": 10665 + }, + { + "epoch": 0.84, + "learning_rate": 1.233375350620587e-06, + "loss": 0.2362, + "step": 10666 + }, + { + "epoch": 0.85, + "learning_rate": 1.2321411061518807e-06, + "loss": 0.245, + "step": 10667 + }, + { + "epoch": 0.85, + "learning_rate": 1.2309074390044939e-06, + "loss": 0.3157, + "step": 10668 + }, + { + "epoch": 0.85, + "learning_rate": 1.2296743492596587e-06, + "loss": 0.2962, + "step": 10669 + }, + { + "epoch": 0.85, + "learning_rate": 1.2284418369985651e-06, + "loss": 0.3481, + "step": 10670 + }, + { + "epoch": 0.85, + "learning_rate": 1.227209902302372e-06, + "loss": 0.3036, + "step": 10671 + }, + { + "epoch": 0.85, + "learning_rate": 1.2259785452521956e-06, + "loss": 0.3451, + "step": 10672 + }, + { + "epoch": 0.85, + "learning_rate": 1.2247477659291118e-06, + "loss": 0.3171, + "step": 10673 + }, + { + "epoch": 0.85, + "learning_rate": 1.223517564414166e-06, + "loss": 0.3245, + "step": 10674 + }, + { + "epoch": 0.85, + "learning_rate": 1.2222879407883592e-06, + "loss": 0.2979, + "step": 10675 + }, + { + "epoch": 0.85, + "learning_rate": 1.2210588951326542e-06, + "loss": 0.3407, + "step": 10676 + }, + { + "epoch": 0.85, + "learning_rate": 1.2198304275279805e-06, + "loss": 0.346, + "step": 10677 + }, + { + "epoch": 0.85, + "learning_rate": 1.2186025380552259e-06, + "loss": 0.3732, + "step": 10678 + }, + { + "epoch": 0.85, + "learning_rate": 1.2173752267952376e-06, + "loss": 0.3852, + "step": 10679 + }, + { + "epoch": 0.85, + "learning_rate": 1.2161484938288348e-06, + "loss": 0.3486, + "step": 10680 + }, + { + "epoch": 0.85, + "learning_rate": 1.214922339236788e-06, + "loss": 0.3659, + "step": 10681 + }, + { + "epoch": 0.85, + "learning_rate": 1.213696763099832e-06, + "loss": 0.3069, + "step": 10682 + }, + { + "epoch": 0.85, + "learning_rate": 1.2124717654986695e-06, + "loss": 0.3087, + "step": 10683 + }, + { + "epoch": 0.85, + "learning_rate": 1.2112473465139586e-06, + "loss": 0.3908, + "step": 10684 + }, + { + "epoch": 0.85, + "learning_rate": 1.210023506226321e-06, + "loss": 0.4491, + "step": 10685 + }, + { + "epoch": 0.85, + "learning_rate": 1.2088002447163383e-06, + "loss": 0.4822, + "step": 10686 + }, + { + "epoch": 0.85, + "learning_rate": 1.2075775620645613e-06, + "loss": 0.2937, + "step": 10687 + }, + { + "epoch": 0.85, + "learning_rate": 1.2063554583514947e-06, + "loss": 0.2986, + "step": 10688 + }, + { + "epoch": 0.85, + "learning_rate": 1.2051339336576074e-06, + "loss": 0.2959, + "step": 10689 + }, + { + "epoch": 0.85, + "learning_rate": 1.203912988063335e-06, + "loss": 0.3579, + "step": 10690 + }, + { + "epoch": 0.85, + "learning_rate": 1.2026926216490675e-06, + "loss": 0.3399, + "step": 10691 + }, + { + "epoch": 0.85, + "learning_rate": 1.2014728344951587e-06, + "loss": 0.3468, + "step": 10692 + }, + { + "epoch": 0.85, + "learning_rate": 1.2002536266819309e-06, + "loss": 0.334, + "step": 10693 + }, + { + "epoch": 0.85, + "learning_rate": 1.1990349982896598e-06, + "loss": 0.4222, + "step": 10694 + }, + { + "epoch": 0.85, + "learning_rate": 1.1978169493985836e-06, + "loss": 0.4048, + "step": 10695 + }, + { + "epoch": 0.85, + "learning_rate": 1.1965994800889113e-06, + "loss": 0.3119, + "step": 10696 + }, + { + "epoch": 0.85, + "learning_rate": 1.1953825904408033e-06, + "loss": 0.3511, + "step": 10697 + }, + { + "epoch": 0.85, + "learning_rate": 1.1941662805343846e-06, + "loss": 0.4062, + "step": 10698 + }, + { + "epoch": 0.85, + "learning_rate": 1.1929505504497464e-06, + "loss": 0.3182, + "step": 10699 + }, + { + "epoch": 0.85, + "learning_rate": 1.191735400266939e-06, + "loss": 0.4408, + "step": 10700 + }, + { + "epoch": 0.85, + "learning_rate": 1.190520830065972e-06, + "loss": 0.4695, + "step": 10701 + }, + { + "epoch": 0.85, + "learning_rate": 1.189306839926818e-06, + "loss": 0.3668, + "step": 10702 + }, + { + "epoch": 0.85, + "learning_rate": 1.1880934299294167e-06, + "loss": 0.3311, + "step": 10703 + }, + { + "epoch": 0.85, + "learning_rate": 1.1868806001536625e-06, + "loss": 0.3227, + "step": 10704 + }, + { + "epoch": 0.85, + "learning_rate": 1.185668350679413e-06, + "loss": 0.24, + "step": 10705 + }, + { + "epoch": 0.85, + "learning_rate": 1.1844566815864921e-06, + "loss": 0.3216, + "step": 10706 + }, + { + "epoch": 0.85, + "learning_rate": 1.1832455929546827e-06, + "loss": 0.2581, + "step": 10707 + }, + { + "epoch": 0.85, + "learning_rate": 1.182035084863724e-06, + "loss": 0.404, + "step": 10708 + }, + { + "epoch": 0.85, + "learning_rate": 1.1808251573933272e-06, + "loss": 0.2695, + "step": 10709 + }, + { + "epoch": 0.85, + "learning_rate": 1.1796158106231603e-06, + "loss": 0.3532, + "step": 10710 + }, + { + "epoch": 0.85, + "learning_rate": 1.1784070446328477e-06, + "loss": 0.2696, + "step": 10711 + }, + { + "epoch": 0.85, + "learning_rate": 1.177198859501989e-06, + "loss": 0.3054, + "step": 10712 + }, + { + "epoch": 0.85, + "learning_rate": 1.1759912553101316e-06, + "loss": 0.3792, + "step": 10713 + }, + { + "epoch": 0.85, + "learning_rate": 1.1747842321367886e-06, + "loss": 0.2847, + "step": 10714 + }, + { + "epoch": 0.85, + "learning_rate": 1.173577790061442e-06, + "loss": 0.3083, + "step": 10715 + }, + { + "epoch": 0.85, + "learning_rate": 1.1723719291635272e-06, + "loss": 0.3941, + "step": 10716 + }, + { + "epoch": 0.85, + "learning_rate": 1.171166649522444e-06, + "loss": 0.3727, + "step": 10717 + }, + { + "epoch": 0.85, + "learning_rate": 1.1699619512175563e-06, + "loss": 0.3519, + "step": 10718 + }, + { + "epoch": 0.85, + "learning_rate": 1.168757834328188e-06, + "loss": 0.3468, + "step": 10719 + }, + { + "epoch": 0.85, + "learning_rate": 1.1675542989336208e-06, + "loss": 0.311, + "step": 10720 + }, + { + "epoch": 0.85, + "learning_rate": 1.1663513451131047e-06, + "loss": 0.3324, + "step": 10721 + }, + { + "epoch": 0.85, + "learning_rate": 1.1651489729458487e-06, + "loss": 0.3934, + "step": 10722 + }, + { + "epoch": 0.85, + "learning_rate": 1.1639471825110205e-06, + "loss": 0.2815, + "step": 10723 + }, + { + "epoch": 0.85, + "learning_rate": 1.1627459738877557e-06, + "loss": 0.4077, + "step": 10724 + }, + { + "epoch": 0.85, + "learning_rate": 1.1615453471551462e-06, + "loss": 0.3533, + "step": 10725 + }, + { + "epoch": 0.85, + "learning_rate": 1.1603453023922473e-06, + "loss": 0.3562, + "step": 10726 + }, + { + "epoch": 0.85, + "learning_rate": 1.1591458396780753e-06, + "loss": 0.4199, + "step": 10727 + }, + { + "epoch": 0.85, + "learning_rate": 1.1579469590916125e-06, + "loss": 0.3777, + "step": 10728 + }, + { + "epoch": 0.85, + "learning_rate": 1.156748660711796e-06, + "loss": 0.419, + "step": 10729 + }, + { + "epoch": 0.85, + "learning_rate": 1.1555509446175284e-06, + "loss": 0.4242, + "step": 10730 + }, + { + "epoch": 0.85, + "learning_rate": 1.1543538108876751e-06, + "loss": 0.3895, + "step": 10731 + }, + { + "epoch": 0.85, + "learning_rate": 1.153157259601062e-06, + "loss": 0.3102, + "step": 10732 + }, + { + "epoch": 0.85, + "learning_rate": 1.1519612908364718e-06, + "loss": 0.4115, + "step": 10733 + }, + { + "epoch": 0.85, + "learning_rate": 1.1507659046726605e-06, + "loss": 0.2498, + "step": 10734 + }, + { + "epoch": 0.85, + "learning_rate": 1.1495711011883325e-06, + "loss": 0.341, + "step": 10735 + }, + { + "epoch": 0.85, + "learning_rate": 1.148376880462161e-06, + "loss": 0.3541, + "step": 10736 + }, + { + "epoch": 0.85, + "learning_rate": 1.1471832425727825e-06, + "loss": 0.3668, + "step": 10737 + }, + { + "epoch": 0.85, + "learning_rate": 1.14599018759879e-06, + "loss": 0.4202, + "step": 10738 + }, + { + "epoch": 0.85, + "learning_rate": 1.1447977156187395e-06, + "loss": 0.3409, + "step": 10739 + }, + { + "epoch": 0.85, + "learning_rate": 1.1436058267111527e-06, + "loss": 0.3013, + "step": 10740 + }, + { + "epoch": 0.85, + "learning_rate": 1.1424145209545079e-06, + "loss": 0.2987, + "step": 10741 + }, + { + "epoch": 0.85, + "learning_rate": 1.1412237984272467e-06, + "loss": 0.3197, + "step": 10742 + }, + { + "epoch": 0.85, + "learning_rate": 1.140033659207771e-06, + "loss": 0.3512, + "step": 10743 + }, + { + "epoch": 0.85, + "learning_rate": 1.1388441033744502e-06, + "loss": 0.3104, + "step": 10744 + }, + { + "epoch": 0.85, + "learning_rate": 1.1376551310056073e-06, + "loss": 0.3744, + "step": 10745 + }, + { + "epoch": 0.85, + "learning_rate": 1.1364667421795283e-06, + "loss": 0.3506, + "step": 10746 + }, + { + "epoch": 0.85, + "learning_rate": 1.1352789369744688e-06, + "loss": 0.2864, + "step": 10747 + }, + { + "epoch": 0.85, + "learning_rate": 1.134091715468636e-06, + "loss": 0.3373, + "step": 10748 + }, + { + "epoch": 0.85, + "learning_rate": 1.132905077740203e-06, + "loss": 0.3334, + "step": 10749 + }, + { + "epoch": 0.85, + "learning_rate": 1.131719023867306e-06, + "loss": 0.3068, + "step": 10750 + }, + { + "epoch": 0.85, + "learning_rate": 1.1305335539280392e-06, + "loss": 0.3783, + "step": 10751 + }, + { + "epoch": 0.85, + "learning_rate": 1.1293486680004607e-06, + "loss": 0.3004, + "step": 10752 + }, + { + "epoch": 0.85, + "learning_rate": 1.1281643661625896e-06, + "loss": 0.3985, + "step": 10753 + }, + { + "epoch": 0.85, + "learning_rate": 1.1269806484924072e-06, + "loss": 0.3357, + "step": 10754 + }, + { + "epoch": 0.85, + "learning_rate": 1.1257975150678557e-06, + "loss": 0.3671, + "step": 10755 + }, + { + "epoch": 0.85, + "learning_rate": 1.124614965966835e-06, + "loss": 0.3457, + "step": 10756 + }, + { + "epoch": 0.85, + "learning_rate": 1.1234330012672146e-06, + "loss": 0.2518, + "step": 10757 + }, + { + "epoch": 0.85, + "learning_rate": 1.1222516210468204e-06, + "loss": 0.3816, + "step": 10758 + }, + { + "epoch": 0.85, + "learning_rate": 1.121070825383438e-06, + "loss": 0.2254, + "step": 10759 + }, + { + "epoch": 0.85, + "learning_rate": 1.1198906143548216e-06, + "loss": 0.3067, + "step": 10760 + }, + { + "epoch": 0.85, + "learning_rate": 1.1187109880386794e-06, + "loss": 0.2539, + "step": 10761 + }, + { + "epoch": 0.85, + "learning_rate": 1.117531946512682e-06, + "loss": 0.3261, + "step": 10762 + }, + { + "epoch": 0.85, + "learning_rate": 1.1163534898544692e-06, + "loss": 0.263, + "step": 10763 + }, + { + "epoch": 0.85, + "learning_rate": 1.1151756181416328e-06, + "loss": 0.3014, + "step": 10764 + }, + { + "epoch": 0.85, + "learning_rate": 1.1139983314517288e-06, + "loss": 0.3084, + "step": 10765 + }, + { + "epoch": 0.85, + "learning_rate": 1.1128216298622808e-06, + "loss": 0.3245, + "step": 10766 + }, + { + "epoch": 0.85, + "learning_rate": 1.1116455134507665e-06, + "loss": 0.2871, + "step": 10767 + }, + { + "epoch": 0.85, + "learning_rate": 1.110469982294624e-06, + "loss": 0.4863, + "step": 10768 + }, + { + "epoch": 0.85, + "learning_rate": 1.1092950364712617e-06, + "loss": 0.3629, + "step": 10769 + }, + { + "epoch": 0.85, + "learning_rate": 1.1081206760580422e-06, + "loss": 0.3071, + "step": 10770 + }, + { + "epoch": 0.85, + "learning_rate": 1.1069469011322908e-06, + "loss": 0.2457, + "step": 10771 + }, + { + "epoch": 0.85, + "learning_rate": 1.1057737117712941e-06, + "loss": 0.3966, + "step": 10772 + }, + { + "epoch": 0.85, + "learning_rate": 1.1046011080523034e-06, + "loss": 0.391, + "step": 10773 + }, + { + "epoch": 0.85, + "learning_rate": 1.1034290900525279e-06, + "loss": 0.4625, + "step": 10774 + }, + { + "epoch": 0.85, + "learning_rate": 1.1022576578491372e-06, + "loss": 0.3455, + "step": 10775 + }, + { + "epoch": 0.85, + "learning_rate": 1.1010868115192696e-06, + "loss": 0.3461, + "step": 10776 + }, + { + "epoch": 0.85, + "learning_rate": 1.0999165511400157e-06, + "loss": 0.4017, + "step": 10777 + }, + { + "epoch": 0.85, + "learning_rate": 1.09874687678843e-06, + "loss": 0.3274, + "step": 10778 + }, + { + "epoch": 0.85, + "learning_rate": 1.097577788541535e-06, + "loss": 0.4006, + "step": 10779 + }, + { + "epoch": 0.85, + "learning_rate": 1.0964092864763065e-06, + "loss": 0.4247, + "step": 10780 + }, + { + "epoch": 0.85, + "learning_rate": 1.095241370669684e-06, + "loss": 0.377, + "step": 10781 + }, + { + "epoch": 0.85, + "learning_rate": 1.0940740411985718e-06, + "loss": 0.2764, + "step": 10782 + }, + { + "epoch": 0.85, + "learning_rate": 1.0929072981398313e-06, + "loss": 0.379, + "step": 10783 + }, + { + "epoch": 0.85, + "learning_rate": 1.091741141570285e-06, + "loss": 0.3096, + "step": 10784 + }, + { + "epoch": 0.85, + "learning_rate": 1.0905755715667222e-06, + "loss": 0.4137, + "step": 10785 + }, + { + "epoch": 0.85, + "learning_rate": 1.0894105882058891e-06, + "loss": 0.4326, + "step": 10786 + }, + { + "epoch": 0.85, + "learning_rate": 1.0882461915644936e-06, + "loss": 0.2565, + "step": 10787 + }, + { + "epoch": 0.85, + "learning_rate": 1.0870823817192045e-06, + "loss": 0.4269, + "step": 10788 + }, + { + "epoch": 0.85, + "learning_rate": 1.0859191587466556e-06, + "loss": 0.3749, + "step": 10789 + }, + { + "epoch": 0.85, + "learning_rate": 1.0847565227234392e-06, + "loss": 0.3637, + "step": 10790 + }, + { + "epoch": 0.85, + "learning_rate": 1.0835944737261072e-06, + "loss": 0.4546, + "step": 10791 + }, + { + "epoch": 0.85, + "learning_rate": 1.0824330118311765e-06, + "loss": 0.3089, + "step": 10792 + }, + { + "epoch": 0.86, + "learning_rate": 1.0812721371151213e-06, + "loss": 0.3541, + "step": 10793 + }, + { + "epoch": 0.86, + "learning_rate": 1.080111849654384e-06, + "loss": 0.2608, + "step": 10794 + }, + { + "epoch": 0.86, + "learning_rate": 1.078952149525362e-06, + "loss": 0.3003, + "step": 10795 + }, + { + "epoch": 0.86, + "learning_rate": 1.0777930368044143e-06, + "loss": 0.3357, + "step": 10796 + }, + { + "epoch": 0.86, + "learning_rate": 1.0766345115678633e-06, + "loss": 0.2904, + "step": 10797 + }, + { + "epoch": 0.86, + "learning_rate": 1.0754765738919947e-06, + "loss": 0.4014, + "step": 10798 + }, + { + "epoch": 0.86, + "learning_rate": 1.074319223853052e-06, + "loss": 0.3764, + "step": 10799 + }, + { + "epoch": 0.86, + "learning_rate": 1.0731624615272385e-06, + "loss": 0.4236, + "step": 10800 + }, + { + "epoch": 0.86, + "learning_rate": 1.0720062869907255e-06, + "loss": 0.324, + "step": 10801 + }, + { + "epoch": 0.86, + "learning_rate": 1.07085070031964e-06, + "loss": 0.2776, + "step": 10802 + }, + { + "epoch": 0.86, + "learning_rate": 1.06969570159007e-06, + "loss": 0.2848, + "step": 10803 + }, + { + "epoch": 0.86, + "learning_rate": 1.0685412908780702e-06, + "loss": 0.458, + "step": 10804 + }, + { + "epoch": 0.86, + "learning_rate": 1.0673874682596497e-06, + "loss": 0.3893, + "step": 10805 + }, + { + "epoch": 0.86, + "learning_rate": 1.0662342338107823e-06, + "loss": 0.2717, + "step": 10806 + }, + { + "epoch": 0.86, + "learning_rate": 1.065081587607406e-06, + "loss": 0.4913, + "step": 10807 + }, + { + "epoch": 0.86, + "learning_rate": 1.0639295297254149e-06, + "loss": 0.2943, + "step": 10808 + }, + { + "epoch": 0.86, + "learning_rate": 1.0627780602406656e-06, + "loss": 0.3794, + "step": 10809 + }, + { + "epoch": 0.86, + "learning_rate": 1.061627179228979e-06, + "loss": 0.3571, + "step": 10810 + }, + { + "epoch": 0.86, + "learning_rate": 1.0604768867661342e-06, + "loss": 0.396, + "step": 10811 + }, + { + "epoch": 0.86, + "learning_rate": 1.0593271829278718e-06, + "loss": 0.4639, + "step": 10812 + }, + { + "epoch": 0.86, + "learning_rate": 1.0581780677898924e-06, + "loss": 0.3837, + "step": 10813 + }, + { + "epoch": 0.86, + "learning_rate": 1.0570295414278642e-06, + "loss": 0.2928, + "step": 10814 + }, + { + "epoch": 0.86, + "learning_rate": 1.0558816039174102e-06, + "loss": 0.2912, + "step": 10815 + }, + { + "epoch": 0.86, + "learning_rate": 1.0547342553341144e-06, + "loss": 0.261, + "step": 10816 + }, + { + "epoch": 0.86, + "learning_rate": 1.0535874957535275e-06, + "loss": 0.3918, + "step": 10817 + }, + { + "epoch": 0.86, + "learning_rate": 1.0524413252511567e-06, + "loss": 0.2859, + "step": 10818 + }, + { + "epoch": 0.86, + "learning_rate": 1.0512957439024697e-06, + "loss": 0.3799, + "step": 10819 + }, + { + "epoch": 0.86, + "learning_rate": 1.0501507517829012e-06, + "loss": 0.2944, + "step": 10820 + }, + { + "epoch": 0.86, + "learning_rate": 1.0490063489678427e-06, + "loss": 0.2934, + "step": 10821 + }, + { + "epoch": 0.86, + "learning_rate": 1.0478625355326445e-06, + "loss": 0.3954, + "step": 10822 + }, + { + "epoch": 0.86, + "learning_rate": 1.0467193115526254e-06, + "loss": 0.282, + "step": 10823 + }, + { + "epoch": 0.86, + "learning_rate": 1.0455766771030585e-06, + "loss": 0.471, + "step": 10824 + }, + { + "epoch": 0.86, + "learning_rate": 1.0444346322591804e-06, + "loss": 0.405, + "step": 10825 + }, + { + "epoch": 0.86, + "learning_rate": 1.0432931770961907e-06, + "loss": 0.3493, + "step": 10826 + }, + { + "epoch": 0.86, + "learning_rate": 1.0421523116892496e-06, + "loss": 0.3471, + "step": 10827 + }, + { + "epoch": 0.86, + "learning_rate": 1.0410120361134767e-06, + "loss": 0.337, + "step": 10828 + }, + { + "epoch": 0.86, + "learning_rate": 1.0398723504439512e-06, + "loss": 0.3679, + "step": 10829 + }, + { + "epoch": 0.86, + "learning_rate": 1.0387332547557194e-06, + "loss": 0.3434, + "step": 10830 + }, + { + "epoch": 0.86, + "learning_rate": 1.0375947491237836e-06, + "loss": 0.2696, + "step": 10831 + }, + { + "epoch": 0.86, + "learning_rate": 1.0364568336231085e-06, + "loss": 0.3575, + "step": 10832 + }, + { + "epoch": 0.86, + "learning_rate": 1.0353195083286226e-06, + "loss": 0.2553, + "step": 10833 + }, + { + "epoch": 0.86, + "learning_rate": 1.034182773315211e-06, + "loss": 0.3833, + "step": 10834 + }, + { + "epoch": 0.86, + "learning_rate": 1.0330466286577224e-06, + "loss": 0.3914, + "step": 10835 + }, + { + "epoch": 0.86, + "learning_rate": 1.031911074430968e-06, + "loss": 0.255, + "step": 10836 + }, + { + "epoch": 0.86, + "learning_rate": 1.030776110709718e-06, + "loss": 0.4914, + "step": 10837 + }, + { + "epoch": 0.86, + "learning_rate": 1.0296417375687017e-06, + "loss": 0.313, + "step": 10838 + }, + { + "epoch": 0.86, + "learning_rate": 1.0285079550826172e-06, + "loss": 0.3399, + "step": 10839 + }, + { + "epoch": 0.86, + "learning_rate": 1.0273747633261144e-06, + "loss": 0.2928, + "step": 10840 + }, + { + "epoch": 0.86, + "learning_rate": 1.0262421623738105e-06, + "loss": 0.378, + "step": 10841 + }, + { + "epoch": 0.86, + "learning_rate": 1.0251101523002805e-06, + "loss": 0.292, + "step": 10842 + }, + { + "epoch": 0.86, + "learning_rate": 1.0239787331800632e-06, + "loss": 0.3194, + "step": 10843 + }, + { + "epoch": 0.86, + "learning_rate": 1.022847905087656e-06, + "loss": 0.2343, + "step": 10844 + }, + { + "epoch": 0.86, + "learning_rate": 1.0217176680975183e-06, + "loss": 0.3416, + "step": 10845 + }, + { + "epoch": 0.86, + "learning_rate": 1.0205880222840726e-06, + "loss": 0.4026, + "step": 10846 + }, + { + "epoch": 0.86, + "learning_rate": 1.0194589677216992e-06, + "loss": 0.3253, + "step": 10847 + }, + { + "epoch": 0.86, + "learning_rate": 1.0183305044847402e-06, + "loss": 0.3552, + "step": 10848 + }, + { + "epoch": 0.86, + "learning_rate": 1.0172026326475016e-06, + "loss": 0.2988, + "step": 10849 + }, + { + "epoch": 0.86, + "learning_rate": 1.0160753522842482e-06, + "loss": 0.3425, + "step": 10850 + }, + { + "epoch": 0.86, + "learning_rate": 1.0149486634692019e-06, + "loss": 0.4985, + "step": 10851 + }, + { + "epoch": 0.86, + "learning_rate": 1.0138225662765555e-06, + "loss": 0.336, + "step": 10852 + }, + { + "epoch": 0.86, + "learning_rate": 1.0126970607804532e-06, + "loss": 0.2693, + "step": 10853 + }, + { + "epoch": 0.86, + "learning_rate": 1.0115721470550045e-06, + "loss": 0.3137, + "step": 10854 + }, + { + "epoch": 0.86, + "learning_rate": 1.0104478251742822e-06, + "loss": 0.3977, + "step": 10855 + }, + { + "epoch": 0.86, + "learning_rate": 1.009324095212315e-06, + "loss": 0.3913, + "step": 10856 + }, + { + "epoch": 0.86, + "learning_rate": 1.0082009572430963e-06, + "loss": 0.3616, + "step": 10857 + }, + { + "epoch": 0.86, + "learning_rate": 1.0070784113405763e-06, + "loss": 0.4347, + "step": 10858 + }, + { + "epoch": 0.86, + "learning_rate": 1.005956457578675e-06, + "loss": 0.3046, + "step": 10859 + }, + { + "epoch": 0.86, + "learning_rate": 1.0048350960312637e-06, + "loss": 0.3257, + "step": 10860 + }, + { + "epoch": 0.86, + "learning_rate": 1.003714326772176e-06, + "loss": 0.2482, + "step": 10861 + }, + { + "epoch": 0.86, + "learning_rate": 1.0025941498752167e-06, + "loss": 0.379, + "step": 10862 + }, + { + "epoch": 0.86, + "learning_rate": 1.001474565414139e-06, + "loss": 0.3384, + "step": 10863 + }, + { + "epoch": 0.86, + "learning_rate": 1.0003555734626603e-06, + "loss": 0.2412, + "step": 10864 + }, + { + "epoch": 0.86, + "learning_rate": 9.992371740944663e-07, + "loss": 0.2849, + "step": 10865 + }, + { + "epoch": 0.86, + "learning_rate": 9.981193673831946e-07, + "loss": 0.2663, + "step": 10866 + }, + { + "epoch": 0.86, + "learning_rate": 9.970021534024476e-07, + "loss": 0.4248, + "step": 10867 + }, + { + "epoch": 0.86, + "learning_rate": 9.958855322257922e-07, + "loss": 0.3876, + "step": 10868 + }, + { + "epoch": 0.86, + "learning_rate": 9.94769503926748e-07, + "loss": 0.3139, + "step": 10869 + }, + { + "epoch": 0.86, + "learning_rate": 9.936540685787998e-07, + "loss": 0.2297, + "step": 10870 + }, + { + "epoch": 0.86, + "learning_rate": 9.925392262553968e-07, + "loss": 0.3353, + "step": 10871 + }, + { + "epoch": 0.86, + "learning_rate": 9.914249770299445e-07, + "loss": 0.3111, + "step": 10872 + }, + { + "epoch": 0.86, + "learning_rate": 9.903113209758098e-07, + "loss": 0.3004, + "step": 10873 + }, + { + "epoch": 0.86, + "learning_rate": 9.89198258166324e-07, + "loss": 0.3239, + "step": 10874 + }, + { + "epoch": 0.86, + "learning_rate": 9.880857886747753e-07, + "loss": 0.3583, + "step": 10875 + }, + { + "epoch": 0.86, + "learning_rate": 9.869739125744138e-07, + "loss": 0.3064, + "step": 10876 + }, + { + "epoch": 0.86, + "learning_rate": 9.858626299384532e-07, + "loss": 0.3133, + "step": 10877 + }, + { + "epoch": 0.86, + "learning_rate": 9.847519408400663e-07, + "loss": 0.2953, + "step": 10878 + }, + { + "epoch": 0.86, + "learning_rate": 9.836418453523833e-07, + "loss": 0.2356, + "step": 10879 + }, + { + "epoch": 0.86, + "learning_rate": 9.825323435485024e-07, + "loss": 0.2714, + "step": 10880 + }, + { + "epoch": 0.86, + "learning_rate": 9.814234355014774e-07, + "loss": 0.3008, + "step": 10881 + }, + { + "epoch": 0.86, + "learning_rate": 9.803151212843253e-07, + "loss": 0.4649, + "step": 10882 + }, + { + "epoch": 0.86, + "learning_rate": 9.792074009700192e-07, + "loss": 0.3706, + "step": 10883 + }, + { + "epoch": 0.86, + "learning_rate": 9.781002746315039e-07, + "loss": 0.3247, + "step": 10884 + }, + { + "epoch": 0.86, + "learning_rate": 9.769937423416741e-07, + "loss": 0.2986, + "step": 10885 + }, + { + "epoch": 0.86, + "learning_rate": 9.758878041733877e-07, + "loss": 0.3407, + "step": 10886 + }, + { + "epoch": 0.86, + "learning_rate": 9.747824601994715e-07, + "loss": 0.2733, + "step": 10887 + }, + { + "epoch": 0.86, + "learning_rate": 9.73677710492703e-07, + "loss": 0.3357, + "step": 10888 + }, + { + "epoch": 0.86, + "learning_rate": 9.725735551258241e-07, + "loss": 0.1986, + "step": 10889 + }, + { + "epoch": 0.86, + "learning_rate": 9.7146999417154e-07, + "loss": 0.3942, + "step": 10890 + }, + { + "epoch": 0.86, + "learning_rate": 9.703670277025158e-07, + "loss": 0.3534, + "step": 10891 + }, + { + "epoch": 0.86, + "learning_rate": 9.69264655791372e-07, + "loss": 0.3111, + "step": 10892 + }, + { + "epoch": 0.86, + "learning_rate": 9.681628785107e-07, + "loss": 0.3124, + "step": 10893 + }, + { + "epoch": 0.86, + "learning_rate": 9.670616959330437e-07, + "loss": 0.3589, + "step": 10894 + }, + { + "epoch": 0.86, + "learning_rate": 9.659611081309095e-07, + "loss": 0.3545, + "step": 10895 + }, + { + "epoch": 0.86, + "learning_rate": 9.648611151767683e-07, + "loss": 0.2947, + "step": 10896 + }, + { + "epoch": 0.86, + "learning_rate": 9.637617171430492e-07, + "loss": 0.3234, + "step": 10897 + }, + { + "epoch": 0.86, + "learning_rate": 9.626629141021414e-07, + "loss": 0.3652, + "step": 10898 + }, + { + "epoch": 0.86, + "learning_rate": 9.615647061263933e-07, + "loss": 0.3116, + "step": 10899 + }, + { + "epoch": 0.86, + "learning_rate": 9.604670932881211e-07, + "loss": 0.421, + "step": 10900 + }, + { + "epoch": 0.86, + "learning_rate": 9.593700756595958e-07, + "loss": 0.3657, + "step": 10901 + }, + { + "epoch": 0.86, + "learning_rate": 9.582736533130488e-07, + "loss": 0.3892, + "step": 10902 + }, + { + "epoch": 0.86, + "learning_rate": 9.571778263206767e-07, + "loss": 0.3554, + "step": 10903 + }, + { + "epoch": 0.86, + "learning_rate": 9.560825947546337e-07, + "loss": 0.2464, + "step": 10904 + }, + { + "epoch": 0.86, + "learning_rate": 9.549879586870336e-07, + "loss": 0.4151, + "step": 10905 + }, + { + "epoch": 0.86, + "learning_rate": 9.538939181899565e-07, + "loss": 0.4167, + "step": 10906 + }, + { + "epoch": 0.86, + "learning_rate": 9.528004733354379e-07, + "loss": 0.4386, + "step": 10907 + }, + { + "epoch": 0.86, + "learning_rate": 9.517076241954737e-07, + "loss": 0.2991, + "step": 10908 + }, + { + "epoch": 0.86, + "learning_rate": 9.506153708420263e-07, + "loss": 0.3169, + "step": 10909 + }, + { + "epoch": 0.86, + "learning_rate": 9.495237133470148e-07, + "loss": 0.3264, + "step": 10910 + }, + { + "epoch": 0.86, + "learning_rate": 9.484326517823173e-07, + "loss": 0.3438, + "step": 10911 + }, + { + "epoch": 0.86, + "learning_rate": 9.473421862197751e-07, + "loss": 0.2556, + "step": 10912 + }, + { + "epoch": 0.86, + "learning_rate": 9.462523167311943e-07, + "loss": 0.3574, + "step": 10913 + }, + { + "epoch": 0.86, + "learning_rate": 9.45163043388333e-07, + "loss": 0.2974, + "step": 10914 + }, + { + "epoch": 0.86, + "learning_rate": 9.440743662629149e-07, + "loss": 0.326, + "step": 10915 + }, + { + "epoch": 0.86, + "learning_rate": 9.429862854266281e-07, + "loss": 0.366, + "step": 10916 + }, + { + "epoch": 0.86, + "learning_rate": 9.418988009511143e-07, + "loss": 0.3858, + "step": 10917 + }, + { + "epoch": 0.86, + "learning_rate": 9.408119129079774e-07, + "loss": 0.2968, + "step": 10918 + }, + { + "epoch": 0.87, + "learning_rate": 9.397256213687877e-07, + "loss": 0.4682, + "step": 10919 + }, + { + "epoch": 0.87, + "learning_rate": 9.386399264050705e-07, + "loss": 0.351, + "step": 10920 + }, + { + "epoch": 0.87, + "learning_rate": 9.375548280883129e-07, + "loss": 0.3541, + "step": 10921 + }, + { + "epoch": 0.87, + "learning_rate": 9.364703264899655e-07, + "loss": 0.2342, + "step": 10922 + }, + { + "epoch": 0.87, + "learning_rate": 9.353864216814356e-07, + "loss": 0.2545, + "step": 10923 + }, + { + "epoch": 0.87, + "learning_rate": 9.34303113734093e-07, + "loss": 0.3238, + "step": 10924 + }, + { + "epoch": 0.87, + "learning_rate": 9.332204027192693e-07, + "loss": 0.3226, + "step": 10925 + }, + { + "epoch": 0.87, + "learning_rate": 9.321382887082564e-07, + "loss": 0.375, + "step": 10926 + }, + { + "epoch": 0.87, + "learning_rate": 9.310567717723063e-07, + "loss": 0.3335, + "step": 10927 + }, + { + "epoch": 0.87, + "learning_rate": 9.299758519826274e-07, + "loss": 0.3147, + "step": 10928 + }, + { + "epoch": 0.87, + "learning_rate": 9.288955294103996e-07, + "loss": 0.3166, + "step": 10929 + }, + { + "epoch": 0.87, + "learning_rate": 9.278158041267526e-07, + "loss": 0.2234, + "step": 10930 + }, + { + "epoch": 0.87, + "learning_rate": 9.267366762027818e-07, + "loss": 0.2373, + "step": 10931 + }, + { + "epoch": 0.87, + "learning_rate": 9.256581457095437e-07, + "loss": 0.2868, + "step": 10932 + }, + { + "epoch": 0.87, + "learning_rate": 9.245802127180547e-07, + "loss": 0.3618, + "step": 10933 + }, + { + "epoch": 0.87, + "learning_rate": 9.235028772992883e-07, + "loss": 0.4306, + "step": 10934 + }, + { + "epoch": 0.87, + "learning_rate": 9.224261395241862e-07, + "loss": 0.2813, + "step": 10935 + }, + { + "epoch": 0.87, + "learning_rate": 9.213499994636443e-07, + "loss": 0.4093, + "step": 10936 + }, + { + "epoch": 0.87, + "learning_rate": 9.202744571885191e-07, + "loss": 0.4162, + "step": 10937 + }, + { + "epoch": 0.87, + "learning_rate": 9.19199512769634e-07, + "loss": 0.3817, + "step": 10938 + }, + { + "epoch": 0.87, + "learning_rate": 9.181251662777668e-07, + "loss": 0.3413, + "step": 10939 + }, + { + "epoch": 0.87, + "learning_rate": 9.170514177836565e-07, + "loss": 0.3625, + "step": 10940 + }, + { + "epoch": 0.87, + "learning_rate": 9.159782673580075e-07, + "loss": 0.2477, + "step": 10941 + }, + { + "epoch": 0.87, + "learning_rate": 9.149057150714802e-07, + "loss": 0.3308, + "step": 10942 + }, + { + "epoch": 0.87, + "learning_rate": 9.138337609946979e-07, + "loss": 0.3491, + "step": 10943 + }, + { + "epoch": 0.87, + "learning_rate": 9.127624051982398e-07, + "loss": 0.3579, + "step": 10944 + }, + { + "epoch": 0.87, + "learning_rate": 9.116916477526539e-07, + "loss": 0.2761, + "step": 10945 + }, + { + "epoch": 0.87, + "learning_rate": 9.106214887284437e-07, + "loss": 0.3744, + "step": 10946 + }, + { + "epoch": 0.87, + "learning_rate": 9.095519281960729e-07, + "loss": 0.3534, + "step": 10947 + }, + { + "epoch": 0.87, + "learning_rate": 9.084829662259665e-07, + "loss": 0.3202, + "step": 10948 + }, + { + "epoch": 0.87, + "learning_rate": 9.0741460288851e-07, + "loss": 0.491, + "step": 10949 + }, + { + "epoch": 0.87, + "learning_rate": 9.06346838254053e-07, + "loss": 0.3074, + "step": 10950 + }, + { + "epoch": 0.87, + "learning_rate": 9.052796723929002e-07, + "loss": 0.2744, + "step": 10951 + }, + { + "epoch": 0.87, + "learning_rate": 9.042131053753211e-07, + "loss": 0.2465, + "step": 10952 + }, + { + "epoch": 0.87, + "learning_rate": 9.031471372715405e-07, + "loss": 0.3648, + "step": 10953 + }, + { + "epoch": 0.87, + "learning_rate": 9.020817681517513e-07, + "loss": 0.2994, + "step": 10954 + }, + { + "epoch": 0.87, + "learning_rate": 9.010169980861005e-07, + "loss": 0.3744, + "step": 10955 + }, + { + "epoch": 0.87, + "learning_rate": 8.999528271446989e-07, + "loss": 0.2741, + "step": 10956 + }, + { + "epoch": 0.87, + "learning_rate": 8.988892553976169e-07, + "loss": 0.2594, + "step": 10957 + }, + { + "epoch": 0.87, + "learning_rate": 8.978262829148876e-07, + "loss": 0.3447, + "step": 10958 + }, + { + "epoch": 0.87, + "learning_rate": 8.96763909766497e-07, + "loss": 0.3104, + "step": 10959 + }, + { + "epoch": 0.87, + "learning_rate": 8.957021360224039e-07, + "loss": 0.3507, + "step": 10960 + }, + { + "epoch": 0.87, + "learning_rate": 8.946409617525175e-07, + "loss": 0.3595, + "step": 10961 + }, + { + "epoch": 0.87, + "learning_rate": 8.935803870267101e-07, + "loss": 0.4249, + "step": 10962 + }, + { + "epoch": 0.87, + "learning_rate": 8.925204119148189e-07, + "loss": 0.2835, + "step": 10963 + }, + { + "epoch": 0.87, + "learning_rate": 8.914610364866361e-07, + "loss": 0.3751, + "step": 10964 + }, + { + "epoch": 0.87, + "learning_rate": 8.904022608119145e-07, + "loss": 0.3225, + "step": 10965 + }, + { + "epoch": 0.87, + "learning_rate": 8.89344084960374e-07, + "loss": 0.2792, + "step": 10966 + }, + { + "epoch": 0.87, + "learning_rate": 8.882865090016868e-07, + "loss": 0.3226, + "step": 10967 + }, + { + "epoch": 0.87, + "learning_rate": 8.872295330054915e-07, + "loss": 0.3531, + "step": 10968 + }, + { + "epoch": 0.87, + "learning_rate": 8.861731570413801e-07, + "loss": 0.3418, + "step": 10969 + }, + { + "epoch": 0.87, + "learning_rate": 8.85117381178916e-07, + "loss": 0.3575, + "step": 10970 + }, + { + "epoch": 0.87, + "learning_rate": 8.840622054876147e-07, + "loss": 0.2415, + "step": 10971 + }, + { + "epoch": 0.87, + "learning_rate": 8.830076300369517e-07, + "loss": 0.2551, + "step": 10972 + }, + { + "epoch": 0.87, + "learning_rate": 8.819536548963703e-07, + "loss": 0.2716, + "step": 10973 + }, + { + "epoch": 0.87, + "learning_rate": 8.809002801352673e-07, + "loss": 0.3015, + "step": 10974 + }, + { + "epoch": 0.87, + "learning_rate": 8.798475058230005e-07, + "loss": 0.3039, + "step": 10975 + }, + { + "epoch": 0.87, + "learning_rate": 8.787953320288945e-07, + "loss": 0.4087, + "step": 10976 + }, + { + "epoch": 0.87, + "learning_rate": 8.777437588222271e-07, + "loss": 0.3183, + "step": 10977 + }, + { + "epoch": 0.87, + "learning_rate": 8.766927862722374e-07, + "loss": 0.3629, + "step": 10978 + }, + { + "epoch": 0.87, + "learning_rate": 8.756424144481313e-07, + "loss": 0.3179, + "step": 10979 + }, + { + "epoch": 0.87, + "learning_rate": 8.745926434190688e-07, + "loss": 0.2327, + "step": 10980 + }, + { + "epoch": 0.87, + "learning_rate": 8.735434732541704e-07, + "loss": 0.3219, + "step": 10981 + }, + { + "epoch": 0.87, + "learning_rate": 8.724949040225217e-07, + "loss": 0.3071, + "step": 10982 + }, + { + "epoch": 0.87, + "learning_rate": 8.714469357931654e-07, + "loss": 0.252, + "step": 10983 + }, + { + "epoch": 0.87, + "learning_rate": 8.703995686351041e-07, + "loss": 0.3679, + "step": 10984 + }, + { + "epoch": 0.87, + "learning_rate": 8.693528026173015e-07, + "loss": 0.3661, + "step": 10985 + }, + { + "epoch": 0.87, + "learning_rate": 8.683066378086846e-07, + "loss": 0.262, + "step": 10986 + }, + { + "epoch": 0.87, + "learning_rate": 8.672610742781363e-07, + "loss": 0.3771, + "step": 10987 + }, + { + "epoch": 0.87, + "learning_rate": 8.662161120945e-07, + "loss": 0.405, + "step": 10988 + }, + { + "epoch": 0.87, + "learning_rate": 8.651717513265867e-07, + "loss": 0.3612, + "step": 10989 + }, + { + "epoch": 0.87, + "learning_rate": 8.641279920431589e-07, + "loss": 0.3288, + "step": 10990 + }, + { + "epoch": 0.87, + "learning_rate": 8.630848343129417e-07, + "loss": 0.2716, + "step": 10991 + }, + { + "epoch": 0.87, + "learning_rate": 8.620422782046268e-07, + "loss": 0.3166, + "step": 10992 + }, + { + "epoch": 0.87, + "learning_rate": 8.61000323786858e-07, + "loss": 0.3769, + "step": 10993 + }, + { + "epoch": 0.87, + "learning_rate": 8.599589711282419e-07, + "loss": 0.4456, + "step": 10994 + }, + { + "epoch": 0.87, + "learning_rate": 8.589182202973512e-07, + "loss": 0.2857, + "step": 10995 + }, + { + "epoch": 0.87, + "learning_rate": 8.578780713627111e-07, + "loss": 0.3031, + "step": 10996 + }, + { + "epoch": 0.87, + "learning_rate": 8.568385243928112e-07, + "loss": 0.3145, + "step": 10997 + }, + { + "epoch": 0.87, + "learning_rate": 8.55799579456098e-07, + "loss": 0.2993, + "step": 10998 + }, + { + "epoch": 0.87, + "learning_rate": 8.547612366209856e-07, + "loss": 0.3129, + "step": 10999 + }, + { + "epoch": 0.87, + "learning_rate": 8.537234959558416e-07, + "loss": 0.3163, + "step": 11000 + }, + { + "epoch": 0.87, + "learning_rate": 8.526863575289945e-07, + "loss": 0.2676, + "step": 11001 + }, + { + "epoch": 0.87, + "learning_rate": 8.516498214087387e-07, + "loss": 0.3905, + "step": 11002 + }, + { + "epoch": 0.87, + "learning_rate": 8.50613887663323e-07, + "loss": 0.2991, + "step": 11003 + }, + { + "epoch": 0.87, + "learning_rate": 8.495785563609571e-07, + "loss": 0.4124, + "step": 11004 + }, + { + "epoch": 0.87, + "learning_rate": 8.485438275698154e-07, + "loss": 0.303, + "step": 11005 + }, + { + "epoch": 0.87, + "learning_rate": 8.475097013580292e-07, + "loss": 0.4597, + "step": 11006 + }, + { + "epoch": 0.87, + "learning_rate": 8.46476177793688e-07, + "loss": 0.3355, + "step": 11007 + }, + { + "epoch": 0.87, + "learning_rate": 8.454432569448489e-07, + "loss": 0.3242, + "step": 11008 + }, + { + "epoch": 0.87, + "learning_rate": 8.444109388795218e-07, + "loss": 0.3718, + "step": 11009 + }, + { + "epoch": 0.87, + "learning_rate": 8.43379223665679e-07, + "loss": 0.3497, + "step": 11010 + }, + { + "epoch": 0.87, + "learning_rate": 8.423481113712573e-07, + "loss": 0.419, + "step": 11011 + }, + { + "epoch": 0.87, + "learning_rate": 8.413176020641489e-07, + "loss": 0.3635, + "step": 11012 + }, + { + "epoch": 0.87, + "learning_rate": 8.402876958122075e-07, + "loss": 0.3411, + "step": 11013 + }, + { + "epoch": 0.87, + "learning_rate": 8.392583926832454e-07, + "loss": 0.2928, + "step": 11014 + }, + { + "epoch": 0.87, + "learning_rate": 8.382296927450417e-07, + "loss": 0.3585, + "step": 11015 + }, + { + "epoch": 0.87, + "learning_rate": 8.37201596065329e-07, + "loss": 0.3347, + "step": 11016 + }, + { + "epoch": 0.87, + "learning_rate": 8.361741027118009e-07, + "loss": 0.3415, + "step": 11017 + }, + { + "epoch": 0.87, + "learning_rate": 8.351472127521166e-07, + "loss": 0.3451, + "step": 11018 + }, + { + "epoch": 0.87, + "learning_rate": 8.341209262538896e-07, + "loss": 0.2968, + "step": 11019 + }, + { + "epoch": 0.87, + "learning_rate": 8.330952432846939e-07, + "loss": 0.3246, + "step": 11020 + }, + { + "epoch": 0.87, + "learning_rate": 8.320701639120709e-07, + "loss": 0.3767, + "step": 11021 + }, + { + "epoch": 0.87, + "learning_rate": 8.310456882035145e-07, + "loss": 0.3432, + "step": 11022 + }, + { + "epoch": 0.87, + "learning_rate": 8.300218162264783e-07, + "loss": 0.4205, + "step": 11023 + }, + { + "epoch": 0.87, + "learning_rate": 8.289985480483864e-07, + "loss": 0.4526, + "step": 11024 + }, + { + "epoch": 0.87, + "learning_rate": 8.279758837366103e-07, + "loss": 0.4085, + "step": 11025 + }, + { + "epoch": 0.87, + "learning_rate": 8.269538233584884e-07, + "loss": 0.3259, + "step": 11026 + }, + { + "epoch": 0.87, + "learning_rate": 8.259323669813202e-07, + "loss": 0.3088, + "step": 11027 + }, + { + "epoch": 0.87, + "learning_rate": 8.24911514672363e-07, + "loss": 0.3264, + "step": 11028 + }, + { + "epoch": 0.87, + "learning_rate": 8.23891266498833e-07, + "loss": 0.3002, + "step": 11029 + }, + { + "epoch": 0.87, + "learning_rate": 8.228716225279121e-07, + "loss": 0.2139, + "step": 11030 + }, + { + "epoch": 0.87, + "learning_rate": 8.218525828267377e-07, + "loss": 0.272, + "step": 11031 + }, + { + "epoch": 0.87, + "learning_rate": 8.208341474624071e-07, + "loss": 0.3692, + "step": 11032 + }, + { + "epoch": 0.87, + "learning_rate": 8.198163165019812e-07, + "loss": 0.4437, + "step": 11033 + }, + { + "epoch": 0.87, + "learning_rate": 8.187990900124787e-07, + "loss": 0.2907, + "step": 11034 + }, + { + "epoch": 0.87, + "learning_rate": 8.177824680608781e-07, + "loss": 0.3234, + "step": 11035 + }, + { + "epoch": 0.87, + "learning_rate": 8.167664507141215e-07, + "loss": 0.4217, + "step": 11036 + }, + { + "epoch": 0.87, + "learning_rate": 8.157510380391065e-07, + "loss": 0.4118, + "step": 11037 + }, + { + "epoch": 0.87, + "learning_rate": 8.14736230102694e-07, + "loss": 0.339, + "step": 11038 + }, + { + "epoch": 0.87, + "learning_rate": 8.137220269717028e-07, + "loss": 0.3039, + "step": 11039 + }, + { + "epoch": 0.87, + "learning_rate": 8.127084287129161e-07, + "loss": 0.4195, + "step": 11040 + }, + { + "epoch": 0.87, + "learning_rate": 8.116954353930728e-07, + "loss": 0.4061, + "step": 11041 + }, + { + "epoch": 0.87, + "learning_rate": 8.106830470788729e-07, + "loss": 0.2787, + "step": 11042 + }, + { + "epoch": 0.87, + "learning_rate": 8.096712638369797e-07, + "loss": 0.2662, + "step": 11043 + }, + { + "epoch": 0.87, + "learning_rate": 8.086600857340121e-07, + "loss": 0.3028, + "step": 11044 + }, + { + "epoch": 0.88, + "learning_rate": 8.076495128365502e-07, + "loss": 0.265, + "step": 11045 + }, + { + "epoch": 0.88, + "learning_rate": 8.066395452111387e-07, + "loss": 0.3454, + "step": 11046 + }, + { + "epoch": 0.88, + "learning_rate": 8.056301829242785e-07, + "loss": 0.3411, + "step": 11047 + }, + { + "epoch": 0.88, + "learning_rate": 8.046214260424279e-07, + "loss": 0.2532, + "step": 11048 + }, + { + "epoch": 0.88, + "learning_rate": 8.036132746320125e-07, + "loss": 0.3357, + "step": 11049 + }, + { + "epoch": 0.88, + "learning_rate": 8.026057287594136e-07, + "loss": 0.4342, + "step": 11050 + }, + { + "epoch": 0.88, + "learning_rate": 8.015987884909692e-07, + "loss": 0.3526, + "step": 11051 + }, + { + "epoch": 0.88, + "learning_rate": 8.005924538929877e-07, + "loss": 0.3852, + "step": 11052 + }, + { + "epoch": 0.88, + "learning_rate": 7.99586725031728e-07, + "loss": 0.4093, + "step": 11053 + }, + { + "epoch": 0.88, + "learning_rate": 7.985816019734127e-07, + "loss": 0.3168, + "step": 11054 + }, + { + "epoch": 0.88, + "learning_rate": 7.975770847842234e-07, + "loss": 0.3667, + "step": 11055 + }, + { + "epoch": 0.88, + "learning_rate": 7.965731735303051e-07, + "loss": 0.3061, + "step": 11056 + }, + { + "epoch": 0.88, + "learning_rate": 7.955698682777601e-07, + "loss": 0.3393, + "step": 11057 + }, + { + "epoch": 0.88, + "learning_rate": 7.945671690926471e-07, + "loss": 0.2841, + "step": 11058 + }, + { + "epoch": 0.88, + "learning_rate": 7.935650760409952e-07, + "loss": 0.433, + "step": 11059 + }, + { + "epoch": 0.88, + "learning_rate": 7.925635891887839e-07, + "loss": 0.3599, + "step": 11060 + }, + { + "epoch": 0.88, + "learning_rate": 7.915627086019561e-07, + "loss": 0.3252, + "step": 11061 + }, + { + "epoch": 0.88, + "learning_rate": 7.905624343464169e-07, + "loss": 0.2937, + "step": 11062 + }, + { + "epoch": 0.88, + "learning_rate": 7.895627664880278e-07, + "loss": 0.3373, + "step": 11063 + }, + { + "epoch": 0.88, + "learning_rate": 7.88563705092612e-07, + "loss": 0.2612, + "step": 11064 + }, + { + "epoch": 0.88, + "learning_rate": 7.875652502259545e-07, + "loss": 0.3355, + "step": 11065 + }, + { + "epoch": 0.88, + "learning_rate": 7.865674019537983e-07, + "loss": 0.2933, + "step": 11066 + }, + { + "epoch": 0.88, + "learning_rate": 7.855701603418442e-07, + "loss": 0.3493, + "step": 11067 + }, + { + "epoch": 0.88, + "learning_rate": 7.845735254557608e-07, + "loss": 0.2581, + "step": 11068 + }, + { + "epoch": 0.88, + "learning_rate": 7.835774973611687e-07, + "loss": 0.37, + "step": 11069 + }, + { + "epoch": 0.88, + "learning_rate": 7.825820761236514e-07, + "loss": 0.4263, + "step": 11070 + }, + { + "epoch": 0.88, + "learning_rate": 7.815872618087506e-07, + "loss": 0.3177, + "step": 11071 + }, + { + "epoch": 0.88, + "learning_rate": 7.805930544819751e-07, + "loss": 0.3331, + "step": 11072 + }, + { + "epoch": 0.88, + "learning_rate": 7.795994542087859e-07, + "loss": 0.4438, + "step": 11073 + }, + { + "epoch": 0.88, + "learning_rate": 7.786064610546051e-07, + "loss": 0.3195, + "step": 11074 + }, + { + "epoch": 0.88, + "learning_rate": 7.776140750848205e-07, + "loss": 0.4427, + "step": 11075 + }, + { + "epoch": 0.88, + "learning_rate": 7.766222963647729e-07, + "loss": 0.3431, + "step": 11076 + }, + { + "epoch": 0.88, + "learning_rate": 7.756311249597659e-07, + "loss": 0.2799, + "step": 11077 + }, + { + "epoch": 0.88, + "learning_rate": 7.746405609350661e-07, + "loss": 0.2257, + "step": 11078 + }, + { + "epoch": 0.88, + "learning_rate": 7.736506043558956e-07, + "loss": 0.3754, + "step": 11079 + }, + { + "epoch": 0.88, + "learning_rate": 7.726612552874368e-07, + "loss": 0.4141, + "step": 11080 + }, + { + "epoch": 0.88, + "learning_rate": 7.716725137948366e-07, + "loss": 0.3395, + "step": 11081 + }, + { + "epoch": 0.88, + "learning_rate": 7.706843799431985e-07, + "loss": 0.3689, + "step": 11082 + }, + { + "epoch": 0.88, + "learning_rate": 7.696968537975847e-07, + "loss": 0.3616, + "step": 11083 + }, + { + "epoch": 0.88, + "learning_rate": 7.687099354230177e-07, + "loss": 0.3817, + "step": 11084 + }, + { + "epoch": 0.88, + "learning_rate": 7.677236248844855e-07, + "loss": 0.3505, + "step": 11085 + }, + { + "epoch": 0.88, + "learning_rate": 7.667379222469295e-07, + "loss": 0.3871, + "step": 11086 + }, + { + "epoch": 0.88, + "learning_rate": 7.657528275752524e-07, + "loss": 0.3331, + "step": 11087 + }, + { + "epoch": 0.88, + "learning_rate": 7.647683409343198e-07, + "loss": 0.397, + "step": 11088 + }, + { + "epoch": 0.88, + "learning_rate": 7.637844623889557e-07, + "loss": 0.3517, + "step": 11089 + }, + { + "epoch": 0.88, + "learning_rate": 7.628011920039414e-07, + "loss": 0.3447, + "step": 11090 + }, + { + "epoch": 0.88, + "learning_rate": 7.618185298440239e-07, + "loss": 0.2698, + "step": 11091 + }, + { + "epoch": 0.88, + "learning_rate": 7.608364759739039e-07, + "loss": 0.2943, + "step": 11092 + }, + { + "epoch": 0.88, + "learning_rate": 7.598550304582453e-07, + "loss": 0.336, + "step": 11093 + }, + { + "epoch": 0.88, + "learning_rate": 7.588741933616728e-07, + "loss": 0.4004, + "step": 11094 + }, + { + "epoch": 0.88, + "learning_rate": 7.578939647487705e-07, + "loss": 0.3138, + "step": 11095 + }, + { + "epoch": 0.88, + "learning_rate": 7.569143446840776e-07, + "loss": 0.4177, + "step": 11096 + }, + { + "epoch": 0.88, + "learning_rate": 7.559353332321029e-07, + "loss": 0.3008, + "step": 11097 + }, + { + "epoch": 0.88, + "learning_rate": 7.549569304573057e-07, + "loss": 0.3898, + "step": 11098 + }, + { + "epoch": 0.88, + "learning_rate": 7.539791364241111e-07, + "loss": 0.33, + "step": 11099 + }, + { + "epoch": 0.88, + "learning_rate": 7.530019511969e-07, + "loss": 0.3652, + "step": 11100 + }, + { + "epoch": 0.88, + "learning_rate": 7.520253748400175e-07, + "loss": 0.2832, + "step": 11101 + }, + { + "epoch": 0.88, + "learning_rate": 7.510494074177666e-07, + "loss": 0.2935, + "step": 11102 + }, + { + "epoch": 0.88, + "learning_rate": 7.500740489944092e-07, + "loss": 0.4179, + "step": 11103 + }, + { + "epoch": 0.88, + "learning_rate": 7.490992996341662e-07, + "loss": 0.2836, + "step": 11104 + }, + { + "epoch": 0.88, + "learning_rate": 7.481251594012218e-07, + "loss": 0.369, + "step": 11105 + }, + { + "epoch": 0.88, + "learning_rate": 7.471516283597191e-07, + "loss": 0.2722, + "step": 11106 + }, + { + "epoch": 0.88, + "learning_rate": 7.461787065737602e-07, + "loss": 0.263, + "step": 11107 + }, + { + "epoch": 0.88, + "learning_rate": 7.452063941074073e-07, + "loss": 0.4026, + "step": 11108 + }, + { + "epoch": 0.88, + "learning_rate": 7.442346910246801e-07, + "loss": 0.4228, + "step": 11109 + }, + { + "epoch": 0.88, + "learning_rate": 7.432635973895652e-07, + "loss": 0.3579, + "step": 11110 + }, + { + "epoch": 0.88, + "learning_rate": 7.422931132660005e-07, + "loss": 0.5135, + "step": 11111 + }, + { + "epoch": 0.88, + "learning_rate": 7.413232387178882e-07, + "loss": 0.3199, + "step": 11112 + }, + { + "epoch": 0.88, + "learning_rate": 7.403539738090914e-07, + "loss": 0.3812, + "step": 11113 + }, + { + "epoch": 0.88, + "learning_rate": 7.393853186034316e-07, + "loss": 0.3856, + "step": 11114 + }, + { + "epoch": 0.88, + "learning_rate": 7.384172731646877e-07, + "loss": 0.4115, + "step": 11115 + }, + { + "epoch": 0.88, + "learning_rate": 7.374498375566042e-07, + "loss": 0.3942, + "step": 11116 + }, + { + "epoch": 0.88, + "learning_rate": 7.364830118428801e-07, + "loss": 0.392, + "step": 11117 + }, + { + "epoch": 0.88, + "learning_rate": 7.355167960871745e-07, + "loss": 0.4333, + "step": 11118 + }, + { + "epoch": 0.88, + "learning_rate": 7.345511903531122e-07, + "loss": 0.3574, + "step": 11119 + }, + { + "epoch": 0.88, + "learning_rate": 7.335861947042711e-07, + "loss": 0.3035, + "step": 11120 + }, + { + "epoch": 0.88, + "learning_rate": 7.326218092041903e-07, + "loss": 0.2396, + "step": 11121 + }, + { + "epoch": 0.88, + "learning_rate": 7.316580339163736e-07, + "loss": 0.4423, + "step": 11122 + }, + { + "epoch": 0.88, + "learning_rate": 7.306948689042792e-07, + "loss": 0.2973, + "step": 11123 + }, + { + "epoch": 0.88, + "learning_rate": 7.297323142313262e-07, + "loss": 0.3209, + "step": 11124 + }, + { + "epoch": 0.88, + "learning_rate": 7.287703699608928e-07, + "loss": 0.3663, + "step": 11125 + }, + { + "epoch": 0.88, + "learning_rate": 7.278090361563228e-07, + "loss": 0.3301, + "step": 11126 + }, + { + "epoch": 0.88, + "learning_rate": 7.268483128809122e-07, + "loss": 0.3469, + "step": 11127 + }, + { + "epoch": 0.88, + "learning_rate": 7.258882001979184e-07, + "loss": 0.3356, + "step": 11128 + }, + { + "epoch": 0.88, + "learning_rate": 7.24928698170565e-07, + "loss": 0.36, + "step": 11129 + }, + { + "epoch": 0.88, + "learning_rate": 7.239698068620272e-07, + "loss": 0.3534, + "step": 11130 + }, + { + "epoch": 0.88, + "learning_rate": 7.230115263354431e-07, + "loss": 0.301, + "step": 11131 + }, + { + "epoch": 0.88, + "learning_rate": 7.220538566539137e-07, + "loss": 0.3524, + "step": 11132 + }, + { + "epoch": 0.88, + "learning_rate": 7.21096797880495e-07, + "loss": 0.3607, + "step": 11133 + }, + { + "epoch": 0.88, + "learning_rate": 7.201403500782034e-07, + "loss": 0.3388, + "step": 11134 + }, + { + "epoch": 0.88, + "learning_rate": 7.191845133100195e-07, + "loss": 0.3916, + "step": 11135 + }, + { + "epoch": 0.88, + "learning_rate": 7.182292876388785e-07, + "loss": 0.2693, + "step": 11136 + }, + { + "epoch": 0.88, + "learning_rate": 7.17274673127677e-07, + "loss": 0.3622, + "step": 11137 + }, + { + "epoch": 0.88, + "learning_rate": 7.163206698392744e-07, + "loss": 0.3608, + "step": 11138 + }, + { + "epoch": 0.88, + "learning_rate": 7.153672778364851e-07, + "loss": 0.295, + "step": 11139 + }, + { + "epoch": 0.88, + "learning_rate": 7.144144971820855e-07, + "loss": 0.4151, + "step": 11140 + }, + { + "epoch": 0.88, + "learning_rate": 7.134623279388098e-07, + "loss": 0.3874, + "step": 11141 + }, + { + "epoch": 0.88, + "learning_rate": 7.12510770169359e-07, + "loss": 0.311, + "step": 11142 + }, + { + "epoch": 0.88, + "learning_rate": 7.115598239363842e-07, + "loss": 0.3562, + "step": 11143 + }, + { + "epoch": 0.88, + "learning_rate": 7.106094893025006e-07, + "loss": 0.5186, + "step": 11144 + }, + { + "epoch": 0.88, + "learning_rate": 7.096597663302862e-07, + "loss": 0.36, + "step": 11145 + }, + { + "epoch": 0.88, + "learning_rate": 7.087106550822731e-07, + "loss": 0.3418, + "step": 11146 + }, + { + "epoch": 0.88, + "learning_rate": 7.077621556209557e-07, + "loss": 0.2383, + "step": 11147 + }, + { + "epoch": 0.88, + "learning_rate": 7.068142680087909e-07, + "loss": 0.4193, + "step": 11148 + }, + { + "epoch": 0.88, + "learning_rate": 7.058669923081896e-07, + "loss": 0.3564, + "step": 11149 + }, + { + "epoch": 0.88, + "learning_rate": 7.049203285815253e-07, + "loss": 0.2923, + "step": 11150 + }, + { + "epoch": 0.88, + "learning_rate": 7.03974276891134e-07, + "loss": 0.3598, + "step": 11151 + }, + { + "epoch": 0.88, + "learning_rate": 7.030288372993066e-07, + "loss": 0.3, + "step": 11152 + }, + { + "epoch": 0.88, + "learning_rate": 7.020840098682968e-07, + "loss": 0.4084, + "step": 11153 + }, + { + "epoch": 0.88, + "learning_rate": 7.011397946603138e-07, + "loss": 0.324, + "step": 11154 + }, + { + "epoch": 0.88, + "learning_rate": 7.001961917375344e-07, + "loss": 0.3372, + "step": 11155 + }, + { + "epoch": 0.88, + "learning_rate": 6.992532011620878e-07, + "loss": 0.3675, + "step": 11156 + }, + { + "epoch": 0.88, + "learning_rate": 6.983108229960633e-07, + "loss": 0.3071, + "step": 11157 + }, + { + "epoch": 0.88, + "learning_rate": 6.973690573015168e-07, + "loss": 0.5485, + "step": 11158 + }, + { + "epoch": 0.88, + "learning_rate": 6.964279041404553e-07, + "loss": 0.3648, + "step": 11159 + }, + { + "epoch": 0.88, + "learning_rate": 6.954873635748493e-07, + "loss": 0.3526, + "step": 11160 + }, + { + "epoch": 0.88, + "learning_rate": 6.945474356666326e-07, + "loss": 0.3549, + "step": 11161 + }, + { + "epoch": 0.88, + "learning_rate": 6.936081204776913e-07, + "loss": 0.3413, + "step": 11162 + }, + { + "epoch": 0.88, + "learning_rate": 6.926694180698734e-07, + "loss": 0.4473, + "step": 11163 + }, + { + "epoch": 0.88, + "learning_rate": 6.917313285049931e-07, + "loss": 0.2944, + "step": 11164 + }, + { + "epoch": 0.88, + "learning_rate": 6.907938518448154e-07, + "loss": 0.2115, + "step": 11165 + }, + { + "epoch": 0.88, + "learning_rate": 6.898569881510686e-07, + "loss": 0.318, + "step": 11166 + }, + { + "epoch": 0.88, + "learning_rate": 6.889207374854434e-07, + "loss": 0.2682, + "step": 11167 + }, + { + "epoch": 0.88, + "learning_rate": 6.879850999095849e-07, + "loss": 0.2411, + "step": 11168 + }, + { + "epoch": 0.88, + "learning_rate": 6.870500754851017e-07, + "loss": 0.3844, + "step": 11169 + }, + { + "epoch": 0.88, + "learning_rate": 6.861156642735578e-07, + "loss": 0.3637, + "step": 11170 + }, + { + "epoch": 0.89, + "learning_rate": 6.851818663364839e-07, + "loss": 0.2991, + "step": 11171 + }, + { + "epoch": 0.89, + "learning_rate": 6.842486817353633e-07, + "loss": 0.3423, + "step": 11172 + }, + { + "epoch": 0.89, + "learning_rate": 6.833161105316421e-07, + "loss": 0.3202, + "step": 11173 + }, + { + "epoch": 0.89, + "learning_rate": 6.823841527867259e-07, + "loss": 0.4396, + "step": 11174 + }, + { + "epoch": 0.89, + "learning_rate": 6.814528085619809e-07, + "loss": 0.3117, + "step": 11175 + }, + { + "epoch": 0.89, + "learning_rate": 6.805220779187293e-07, + "loss": 0.3989, + "step": 11176 + }, + { + "epoch": 0.89, + "learning_rate": 6.795919609182566e-07, + "loss": 0.3016, + "step": 11177 + }, + { + "epoch": 0.89, + "learning_rate": 6.78662457621807e-07, + "loss": 0.2552, + "step": 11178 + }, + { + "epoch": 0.89, + "learning_rate": 6.777335680905817e-07, + "loss": 0.3795, + "step": 11179 + }, + { + "epoch": 0.89, + "learning_rate": 6.768052923857482e-07, + "loss": 0.3216, + "step": 11180 + }, + { + "epoch": 0.89, + "learning_rate": 6.758776305684245e-07, + "loss": 0.2908, + "step": 11181 + }, + { + "epoch": 0.89, + "learning_rate": 6.749505826996927e-07, + "loss": 0.288, + "step": 11182 + }, + { + "epoch": 0.89, + "learning_rate": 6.740241488405963e-07, + "loss": 0.3954, + "step": 11183 + }, + { + "epoch": 0.89, + "learning_rate": 6.730983290521365e-07, + "loss": 0.4099, + "step": 11184 + }, + { + "epoch": 0.89, + "learning_rate": 6.721731233952722e-07, + "loss": 0.3267, + "step": 11185 + }, + { + "epoch": 0.89, + "learning_rate": 6.712485319309258e-07, + "loss": 0.3057, + "step": 11186 + }, + { + "epoch": 0.89, + "learning_rate": 6.703245547199777e-07, + "loss": 0.3455, + "step": 11187 + }, + { + "epoch": 0.89, + "learning_rate": 6.694011918232635e-07, + "loss": 0.3339, + "step": 11188 + }, + { + "epoch": 0.89, + "learning_rate": 6.684784433015867e-07, + "loss": 0.4427, + "step": 11189 + }, + { + "epoch": 0.89, + "learning_rate": 6.675563092157044e-07, + "loss": 0.3448, + "step": 11190 + }, + { + "epoch": 0.89, + "learning_rate": 6.666347896263326e-07, + "loss": 0.3706, + "step": 11191 + }, + { + "epoch": 0.89, + "learning_rate": 6.657138845941524e-07, + "loss": 0.3363, + "step": 11192 + }, + { + "epoch": 0.89, + "learning_rate": 6.64793594179799e-07, + "loss": 0.3749, + "step": 11193 + }, + { + "epoch": 0.89, + "learning_rate": 6.638739184438681e-07, + "loss": 0.3854, + "step": 11194 + }, + { + "epoch": 0.89, + "learning_rate": 6.629548574469169e-07, + "loss": 0.3294, + "step": 11195 + }, + { + "epoch": 0.89, + "learning_rate": 6.620364112494627e-07, + "loss": 0.3543, + "step": 11196 + }, + { + "epoch": 0.89, + "learning_rate": 6.611185799119791e-07, + "loss": 0.3719, + "step": 11197 + }, + { + "epoch": 0.89, + "learning_rate": 6.602013634949001e-07, + "loss": 0.2856, + "step": 11198 + }, + { + "epoch": 0.89, + "learning_rate": 6.592847620586217e-07, + "loss": 0.2891, + "step": 11199 + }, + { + "epoch": 0.89, + "learning_rate": 6.583687756634982e-07, + "loss": 0.4416, + "step": 11200 + }, + { + "epoch": 0.89, + "learning_rate": 6.574534043698399e-07, + "loss": 0.2748, + "step": 11201 + }, + { + "epoch": 0.89, + "learning_rate": 6.565386482379221e-07, + "loss": 0.3483, + "step": 11202 + }, + { + "epoch": 0.89, + "learning_rate": 6.556245073279777e-07, + "loss": 0.3744, + "step": 11203 + }, + { + "epoch": 0.89, + "learning_rate": 6.547109817001951e-07, + "loss": 0.3685, + "step": 11204 + }, + { + "epoch": 0.89, + "learning_rate": 6.537980714147285e-07, + "loss": 0.3848, + "step": 11205 + }, + { + "epoch": 0.89, + "learning_rate": 6.528857765316887e-07, + "loss": 0.2942, + "step": 11206 + }, + { + "epoch": 0.89, + "learning_rate": 6.519740971111432e-07, + "loss": 0.3421, + "step": 11207 + }, + { + "epoch": 0.89, + "learning_rate": 6.510630332131262e-07, + "loss": 0.3263, + "step": 11208 + }, + { + "epoch": 0.89, + "learning_rate": 6.501525848976231e-07, + "loss": 0.2687, + "step": 11209 + }, + { + "epoch": 0.89, + "learning_rate": 6.492427522245836e-07, + "loss": 0.416, + "step": 11210 + }, + { + "epoch": 0.89, + "learning_rate": 6.483335352539144e-07, + "loss": 0.2244, + "step": 11211 + }, + { + "epoch": 0.89, + "learning_rate": 6.474249340454874e-07, + "loss": 0.3404, + "step": 11212 + }, + { + "epoch": 0.89, + "learning_rate": 6.46516948659125e-07, + "loss": 0.3768, + "step": 11213 + }, + { + "epoch": 0.89, + "learning_rate": 6.456095791546147e-07, + "loss": 0.2961, + "step": 11214 + }, + { + "epoch": 0.89, + "learning_rate": 6.447028255917054e-07, + "loss": 0.3162, + "step": 11215 + }, + { + "epoch": 0.89, + "learning_rate": 6.437966880300995e-07, + "loss": 0.2611, + "step": 11216 + }, + { + "epoch": 0.89, + "learning_rate": 6.428911665294601e-07, + "loss": 0.239, + "step": 11217 + }, + { + "epoch": 0.89, + "learning_rate": 6.419862611494165e-07, + "loss": 0.349, + "step": 11218 + }, + { + "epoch": 0.89, + "learning_rate": 6.410819719495498e-07, + "loss": 0.4022, + "step": 11219 + }, + { + "epoch": 0.89, + "learning_rate": 6.401782989894012e-07, + "loss": 0.3268, + "step": 11220 + }, + { + "epoch": 0.89, + "learning_rate": 6.392752423284765e-07, + "loss": 0.3572, + "step": 11221 + }, + { + "epoch": 0.89, + "learning_rate": 6.383728020262359e-07, + "loss": 0.3785, + "step": 11222 + }, + { + "epoch": 0.89, + "learning_rate": 6.374709781420995e-07, + "loss": 0.381, + "step": 11223 + }, + { + "epoch": 0.89, + "learning_rate": 6.365697707354512e-07, + "loss": 0.3539, + "step": 11224 + }, + { + "epoch": 0.89, + "learning_rate": 6.3566917986563e-07, + "loss": 0.2841, + "step": 11225 + }, + { + "epoch": 0.89, + "learning_rate": 6.347692055919353e-07, + "loss": 0.3008, + "step": 11226 + }, + { + "epoch": 0.89, + "learning_rate": 6.338698479736227e-07, + "loss": 0.345, + "step": 11227 + }, + { + "epoch": 0.89, + "learning_rate": 6.329711070699162e-07, + "loss": 0.293, + "step": 11228 + }, + { + "epoch": 0.89, + "learning_rate": 6.320729829399918e-07, + "loss": 0.4797, + "step": 11229 + }, + { + "epoch": 0.89, + "learning_rate": 6.311754756429833e-07, + "loss": 0.3468, + "step": 11230 + }, + { + "epoch": 0.89, + "learning_rate": 6.302785852379911e-07, + "loss": 0.3533, + "step": 11231 + }, + { + "epoch": 0.89, + "learning_rate": 6.293823117840703e-07, + "loss": 0.3123, + "step": 11232 + }, + { + "epoch": 0.89, + "learning_rate": 6.284866553402347e-07, + "loss": 0.29, + "step": 11233 + }, + { + "epoch": 0.89, + "learning_rate": 6.275916159654616e-07, + "loss": 0.3046, + "step": 11234 + }, + { + "epoch": 0.89, + "learning_rate": 6.266971937186827e-07, + "loss": 0.4302, + "step": 11235 + }, + { + "epoch": 0.89, + "learning_rate": 6.258033886587911e-07, + "loss": 0.2668, + "step": 11236 + }, + { + "epoch": 0.89, + "learning_rate": 6.249102008446418e-07, + "loss": 0.2926, + "step": 11237 + }, + { + "epoch": 0.89, + "learning_rate": 6.240176303350453e-07, + "loss": 0.4042, + "step": 11238 + }, + { + "epoch": 0.89, + "learning_rate": 6.231256771887739e-07, + "loss": 0.3289, + "step": 11239 + }, + { + "epoch": 0.89, + "learning_rate": 6.222343414645571e-07, + "loss": 0.4492, + "step": 11240 + }, + { + "epoch": 0.89, + "learning_rate": 6.213436232210868e-07, + "loss": 0.3848, + "step": 11241 + }, + { + "epoch": 0.89, + "learning_rate": 6.204535225170116e-07, + "loss": 0.4132, + "step": 11242 + }, + { + "epoch": 0.89, + "learning_rate": 6.195640394109393e-07, + "loss": 0.3514, + "step": 11243 + }, + { + "epoch": 0.89, + "learning_rate": 6.186751739614405e-07, + "loss": 0.3507, + "step": 11244 + }, + { + "epoch": 0.89, + "learning_rate": 6.177869262270419e-07, + "loss": 0.3461, + "step": 11245 + }, + { + "epoch": 0.89, + "learning_rate": 6.168992962662279e-07, + "loss": 0.4006, + "step": 11246 + }, + { + "epoch": 0.89, + "learning_rate": 6.160122841374482e-07, + "loss": 0.435, + "step": 11247 + }, + { + "epoch": 0.89, + "learning_rate": 6.151258898991064e-07, + "loss": 0.4181, + "step": 11248 + }, + { + "epoch": 0.89, + "learning_rate": 6.142401136095666e-07, + "loss": 0.4354, + "step": 11249 + }, + { + "epoch": 0.89, + "learning_rate": 6.133549553271556e-07, + "loss": 0.2621, + "step": 11250 + }, + { + "epoch": 0.89, + "learning_rate": 6.124704151101546e-07, + "loss": 0.3485, + "step": 11251 + }, + { + "epoch": 0.89, + "learning_rate": 6.115864930168058e-07, + "loss": 0.3415, + "step": 11252 + }, + { + "epoch": 0.89, + "learning_rate": 6.107031891053139e-07, + "loss": 0.4024, + "step": 11253 + }, + { + "epoch": 0.89, + "learning_rate": 6.098205034338378e-07, + "loss": 0.303, + "step": 11254 + }, + { + "epoch": 0.89, + "learning_rate": 6.089384360605e-07, + "loss": 0.3837, + "step": 11255 + }, + { + "epoch": 0.89, + "learning_rate": 6.080569870433773e-07, + "loss": 0.3162, + "step": 11256 + }, + { + "epoch": 0.89, + "learning_rate": 6.071761564405121e-07, + "loss": 0.3656, + "step": 11257 + }, + { + "epoch": 0.89, + "learning_rate": 6.062959443099014e-07, + "loss": 0.4609, + "step": 11258 + }, + { + "epoch": 0.89, + "learning_rate": 6.054163507095035e-07, + "loss": 0.406, + "step": 11259 + }, + { + "epoch": 0.89, + "learning_rate": 6.04537375697235e-07, + "loss": 0.293, + "step": 11260 + }, + { + "epoch": 0.89, + "learning_rate": 6.036590193309711e-07, + "loss": 0.3266, + "step": 11261 + }, + { + "epoch": 0.89, + "learning_rate": 6.027812816685497e-07, + "loss": 0.2914, + "step": 11262 + }, + { + "epoch": 0.89, + "learning_rate": 6.019041627677635e-07, + "loss": 0.3206, + "step": 11263 + }, + { + "epoch": 0.89, + "learning_rate": 6.010276626863687e-07, + "loss": 0.3233, + "step": 11264 + }, + { + "epoch": 0.89, + "learning_rate": 6.001517814820757e-07, + "loss": 0.3812, + "step": 11265 + }, + { + "epoch": 0.89, + "learning_rate": 5.992765192125594e-07, + "loss": 0.4169, + "step": 11266 + }, + { + "epoch": 0.89, + "learning_rate": 5.984018759354515e-07, + "loss": 0.3942, + "step": 11267 + }, + { + "epoch": 0.89, + "learning_rate": 5.975278517083405e-07, + "loss": 0.3842, + "step": 11268 + }, + { + "epoch": 0.89, + "learning_rate": 5.966544465887803e-07, + "loss": 0.2733, + "step": 11269 + }, + { + "epoch": 0.89, + "learning_rate": 5.957816606342792e-07, + "loss": 0.307, + "step": 11270 + }, + { + "epoch": 0.89, + "learning_rate": 5.949094939023037e-07, + "loss": 0.3261, + "step": 11271 + }, + { + "epoch": 0.89, + "learning_rate": 5.940379464502854e-07, + "loss": 0.3036, + "step": 11272 + }, + { + "epoch": 0.89, + "learning_rate": 5.931670183356097e-07, + "loss": 0.4555, + "step": 11273 + }, + { + "epoch": 0.89, + "learning_rate": 5.922967096156218e-07, + "loss": 0.2828, + "step": 11274 + }, + { + "epoch": 0.89, + "learning_rate": 5.914270203476291e-07, + "loss": 0.4357, + "step": 11275 + }, + { + "epoch": 0.89, + "learning_rate": 5.90557950588897e-07, + "loss": 0.2549, + "step": 11276 + }, + { + "epoch": 0.89, + "learning_rate": 5.896895003966463e-07, + "loss": 0.313, + "step": 11277 + }, + { + "epoch": 0.89, + "learning_rate": 5.888216698280646e-07, + "loss": 0.2554, + "step": 11278 + }, + { + "epoch": 0.89, + "learning_rate": 5.879544589402919e-07, + "loss": 0.3335, + "step": 11279 + }, + { + "epoch": 0.89, + "learning_rate": 5.870878677904302e-07, + "loss": 0.4568, + "step": 11280 + }, + { + "epoch": 0.89, + "learning_rate": 5.862218964355382e-07, + "loss": 0.3635, + "step": 11281 + }, + { + "epoch": 0.89, + "learning_rate": 5.853565449326404e-07, + "loss": 0.4179, + "step": 11282 + }, + { + "epoch": 0.89, + "learning_rate": 5.844918133387134e-07, + "loss": 0.3524, + "step": 11283 + }, + { + "epoch": 0.89, + "learning_rate": 5.836277017106951e-07, + "loss": 0.31, + "step": 11284 + }, + { + "epoch": 0.89, + "learning_rate": 5.827642101054854e-07, + "loss": 0.413, + "step": 11285 + }, + { + "epoch": 0.89, + "learning_rate": 5.819013385799388e-07, + "loss": 0.3638, + "step": 11286 + }, + { + "epoch": 0.89, + "learning_rate": 5.810390871908711e-07, + "loss": 0.4041, + "step": 11287 + }, + { + "epoch": 0.89, + "learning_rate": 5.801774559950591e-07, + "loss": 0.2884, + "step": 11288 + }, + { + "epoch": 0.89, + "learning_rate": 5.793164450492372e-07, + "loss": 0.3964, + "step": 11289 + }, + { + "epoch": 0.89, + "learning_rate": 5.784560544100959e-07, + "loss": 0.3699, + "step": 11290 + }, + { + "epoch": 0.89, + "learning_rate": 5.775962841342919e-07, + "loss": 0.3451, + "step": 11291 + }, + { + "epoch": 0.89, + "learning_rate": 5.767371342784345e-07, + "loss": 0.2879, + "step": 11292 + }, + { + "epoch": 0.89, + "learning_rate": 5.758786048990939e-07, + "loss": 0.3269, + "step": 11293 + }, + { + "epoch": 0.89, + "learning_rate": 5.750206960528027e-07, + "loss": 0.306, + "step": 11294 + }, + { + "epoch": 0.89, + "learning_rate": 5.741634077960479e-07, + "loss": 0.3899, + "step": 11295 + }, + { + "epoch": 0.89, + "learning_rate": 5.733067401852788e-07, + "loss": 0.3174, + "step": 11296 + }, + { + "epoch": 0.89, + "learning_rate": 5.724506932769014e-07, + "loss": 0.3065, + "step": 11297 + }, + { + "epoch": 0.9, + "learning_rate": 5.71595267127284e-07, + "loss": 0.2087, + "step": 11298 + }, + { + "epoch": 0.9, + "learning_rate": 5.707404617927526e-07, + "loss": 0.3254, + "step": 11299 + }, + { + "epoch": 0.9, + "learning_rate": 5.698862773295888e-07, + "loss": 0.3522, + "step": 11300 + }, + { + "epoch": 0.9, + "learning_rate": 5.69032713794041e-07, + "loss": 0.4151, + "step": 11301 + }, + { + "epoch": 0.9, + "learning_rate": 5.681797712423099e-07, + "loss": 0.2315, + "step": 11302 + }, + { + "epoch": 0.9, + "learning_rate": 5.673274497305559e-07, + "loss": 0.3056, + "step": 11303 + }, + { + "epoch": 0.9, + "learning_rate": 5.664757493149042e-07, + "loss": 0.4119, + "step": 11304 + }, + { + "epoch": 0.9, + "learning_rate": 5.656246700514323e-07, + "loss": 0.4212, + "step": 11305 + }, + { + "epoch": 0.9, + "learning_rate": 5.647742119961797e-07, + "loss": 0.3783, + "step": 11306 + }, + { + "epoch": 0.9, + "learning_rate": 5.639243752051482e-07, + "loss": 0.2513, + "step": 11307 + }, + { + "epoch": 0.9, + "learning_rate": 5.630751597342921e-07, + "loss": 0.3094, + "step": 11308 + }, + { + "epoch": 0.9, + "learning_rate": 5.622265656395276e-07, + "loss": 0.4205, + "step": 11309 + }, + { + "epoch": 0.9, + "learning_rate": 5.613785929767335e-07, + "loss": 0.3972, + "step": 11310 + }, + { + "epoch": 0.9, + "learning_rate": 5.605312418017439e-07, + "loss": 0.4563, + "step": 11311 + }, + { + "epoch": 0.9, + "learning_rate": 5.59684512170352e-07, + "loss": 0.2731, + "step": 11312 + }, + { + "epoch": 0.9, + "learning_rate": 5.588384041383089e-07, + "loss": 0.2951, + "step": 11313 + }, + { + "epoch": 0.9, + "learning_rate": 5.579929177613308e-07, + "loss": 0.4905, + "step": 11314 + }, + { + "epoch": 0.9, + "learning_rate": 5.571480530950879e-07, + "loss": 0.3124, + "step": 11315 + }, + { + "epoch": 0.9, + "learning_rate": 5.563038101952067e-07, + "loss": 0.3666, + "step": 11316 + }, + { + "epoch": 0.9, + "learning_rate": 5.554601891172817e-07, + "loss": 0.2576, + "step": 11317 + }, + { + "epoch": 0.9, + "learning_rate": 5.546171899168595e-07, + "loss": 0.415, + "step": 11318 + }, + { + "epoch": 0.9, + "learning_rate": 5.537748126494446e-07, + "loss": 0.3965, + "step": 11319 + }, + { + "epoch": 0.9, + "learning_rate": 5.529330573705083e-07, + "loss": 0.2957, + "step": 11320 + }, + { + "epoch": 0.9, + "learning_rate": 5.520919241354728e-07, + "loss": 0.2932, + "step": 11321 + }, + { + "epoch": 0.9, + "learning_rate": 5.512514129997227e-07, + "loss": 0.4173, + "step": 11322 + }, + { + "epoch": 0.9, + "learning_rate": 5.504115240186048e-07, + "loss": 0.273, + "step": 11323 + }, + { + "epoch": 0.9, + "learning_rate": 5.495722572474183e-07, + "loss": 0.4487, + "step": 11324 + }, + { + "epoch": 0.9, + "learning_rate": 5.487336127414267e-07, + "loss": 0.353, + "step": 11325 + }, + { + "epoch": 0.9, + "learning_rate": 5.478955905558491e-07, + "loss": 0.4051, + "step": 11326 + }, + { + "epoch": 0.9, + "learning_rate": 5.470581907458672e-07, + "loss": 0.3001, + "step": 11327 + }, + { + "epoch": 0.9, + "learning_rate": 5.462214133666189e-07, + "loss": 0.2564, + "step": 11328 + }, + { + "epoch": 0.9, + "learning_rate": 5.453852584732e-07, + "loss": 0.2642, + "step": 11329 + }, + { + "epoch": 0.9, + "learning_rate": 5.4454972612067e-07, + "loss": 0.3955, + "step": 11330 + }, + { + "epoch": 0.9, + "learning_rate": 5.437148163640449e-07, + "loss": 0.4932, + "step": 11331 + }, + { + "epoch": 0.9, + "learning_rate": 5.428805292582973e-07, + "loss": 0.4038, + "step": 11332 + }, + { + "epoch": 0.9, + "learning_rate": 5.420468648583621e-07, + "loss": 0.3334, + "step": 11333 + }, + { + "epoch": 0.9, + "learning_rate": 5.412138232191333e-07, + "loss": 0.3529, + "step": 11334 + }, + { + "epoch": 0.9, + "learning_rate": 5.403814043954592e-07, + "loss": 0.3166, + "step": 11335 + }, + { + "epoch": 0.9, + "learning_rate": 5.39549608442157e-07, + "loss": 0.2578, + "step": 11336 + }, + { + "epoch": 0.9, + "learning_rate": 5.387184354139896e-07, + "loss": 0.2062, + "step": 11337 + }, + { + "epoch": 0.9, + "learning_rate": 5.378878853656877e-07, + "loss": 0.2972, + "step": 11338 + }, + { + "epoch": 0.9, + "learning_rate": 5.370579583519409e-07, + "loss": 0.3722, + "step": 11339 + }, + { + "epoch": 0.9, + "learning_rate": 5.362286544273942e-07, + "loss": 0.3519, + "step": 11340 + }, + { + "epoch": 0.9, + "learning_rate": 5.353999736466531e-07, + "loss": 0.262, + "step": 11341 + }, + { + "epoch": 0.9, + "learning_rate": 5.345719160642848e-07, + "loss": 0.3114, + "step": 11342 + }, + { + "epoch": 0.9, + "learning_rate": 5.337444817348103e-07, + "loss": 0.2667, + "step": 11343 + }, + { + "epoch": 0.9, + "learning_rate": 5.329176707127115e-07, + "loss": 0.3299, + "step": 11344 + }, + { + "epoch": 0.9, + "learning_rate": 5.320914830524337e-07, + "loss": 0.2674, + "step": 11345 + }, + { + "epoch": 0.9, + "learning_rate": 5.312659188083746e-07, + "loss": 0.3126, + "step": 11346 + }, + { + "epoch": 0.9, + "learning_rate": 5.304409780348919e-07, + "loss": 0.3057, + "step": 11347 + }, + { + "epoch": 0.9, + "learning_rate": 5.296166607863085e-07, + "loss": 0.392, + "step": 11348 + }, + { + "epoch": 0.9, + "learning_rate": 5.287929671168989e-07, + "loss": 0.3131, + "step": 11349 + }, + { + "epoch": 0.9, + "learning_rate": 5.279698970809011e-07, + "loss": 0.3253, + "step": 11350 + }, + { + "epoch": 0.9, + "learning_rate": 5.271474507325058e-07, + "loss": 0.3122, + "step": 11351 + }, + { + "epoch": 0.9, + "learning_rate": 5.263256281258733e-07, + "loss": 0.3124, + "step": 11352 + }, + { + "epoch": 0.9, + "learning_rate": 5.255044293151135e-07, + "loss": 0.3641, + "step": 11353 + }, + { + "epoch": 0.9, + "learning_rate": 5.246838543542964e-07, + "loss": 0.2936, + "step": 11354 + }, + { + "epoch": 0.9, + "learning_rate": 5.23863903297458e-07, + "loss": 0.3514, + "step": 11355 + }, + { + "epoch": 0.9, + "learning_rate": 5.230445761985836e-07, + "loss": 0.3797, + "step": 11356 + }, + { + "epoch": 0.9, + "learning_rate": 5.222258731116237e-07, + "loss": 0.3552, + "step": 11357 + }, + { + "epoch": 0.9, + "learning_rate": 5.214077940904872e-07, + "loss": 0.4179, + "step": 11358 + }, + { + "epoch": 0.9, + "learning_rate": 5.205903391890387e-07, + "loss": 0.3788, + "step": 11359 + }, + { + "epoch": 0.9, + "learning_rate": 5.197735084611033e-07, + "loss": 0.2914, + "step": 11360 + }, + { + "epoch": 0.9, + "learning_rate": 5.189573019604676e-07, + "loss": 0.3652, + "step": 11361 + }, + { + "epoch": 0.9, + "learning_rate": 5.181417197408733e-07, + "loss": 0.4108, + "step": 11362 + }, + { + "epoch": 0.9, + "learning_rate": 5.173267618560229e-07, + "loss": 0.3996, + "step": 11363 + }, + { + "epoch": 0.9, + "learning_rate": 5.165124283595779e-07, + "loss": 0.2416, + "step": 11364 + }, + { + "epoch": 0.9, + "learning_rate": 5.156987193051577e-07, + "loss": 0.3956, + "step": 11365 + }, + { + "epoch": 0.9, + "learning_rate": 5.148856347463416e-07, + "loss": 0.4484, + "step": 11366 + }, + { + "epoch": 0.9, + "learning_rate": 5.140731747366656e-07, + "loss": 0.3995, + "step": 11367 + }, + { + "epoch": 0.9, + "learning_rate": 5.132613393296293e-07, + "loss": 0.2753, + "step": 11368 + }, + { + "epoch": 0.9, + "learning_rate": 5.124501285786865e-07, + "loss": 0.3906, + "step": 11369 + }, + { + "epoch": 0.9, + "learning_rate": 5.1163954253725e-07, + "loss": 0.3113, + "step": 11370 + }, + { + "epoch": 0.9, + "learning_rate": 5.108295812586961e-07, + "loss": 0.3232, + "step": 11371 + }, + { + "epoch": 0.9, + "learning_rate": 5.100202447963553e-07, + "loss": 0.4707, + "step": 11372 + }, + { + "epoch": 0.9, + "learning_rate": 5.092115332035163e-07, + "loss": 0.3884, + "step": 11373 + }, + { + "epoch": 0.9, + "learning_rate": 5.084034465334342e-07, + "loss": 0.3506, + "step": 11374 + }, + { + "epoch": 0.9, + "learning_rate": 5.07595984839313e-07, + "loss": 0.341, + "step": 11375 + }, + { + "epoch": 0.9, + "learning_rate": 5.067891481743203e-07, + "loss": 0.32, + "step": 11376 + }, + { + "epoch": 0.9, + "learning_rate": 5.059829365915859e-07, + "loss": 0.4593, + "step": 11377 + }, + { + "epoch": 0.9, + "learning_rate": 5.051773501441926e-07, + "loss": 0.4358, + "step": 11378 + }, + { + "epoch": 0.9, + "learning_rate": 5.043723888851837e-07, + "loss": 0.3956, + "step": 11379 + }, + { + "epoch": 0.9, + "learning_rate": 5.035680528675635e-07, + "loss": 0.4623, + "step": 11380 + }, + { + "epoch": 0.9, + "learning_rate": 5.027643421442929e-07, + "loss": 0.2829, + "step": 11381 + }, + { + "epoch": 0.9, + "learning_rate": 5.01961256768293e-07, + "loss": 0.3257, + "step": 11382 + }, + { + "epoch": 0.9, + "learning_rate": 5.011587967924414e-07, + "loss": 0.2921, + "step": 11383 + }, + { + "epoch": 0.9, + "learning_rate": 5.003569622695792e-07, + "loss": 0.3277, + "step": 11384 + }, + { + "epoch": 0.9, + "learning_rate": 4.99555753252502e-07, + "loss": 0.3583, + "step": 11385 + }, + { + "epoch": 0.9, + "learning_rate": 4.987551697939629e-07, + "loss": 0.4257, + "step": 11386 + }, + { + "epoch": 0.9, + "learning_rate": 4.979552119466802e-07, + "loss": 0.3032, + "step": 11387 + }, + { + "epoch": 0.9, + "learning_rate": 4.971558797633258e-07, + "loss": 0.3999, + "step": 11388 + }, + { + "epoch": 0.9, + "learning_rate": 4.963571732965311e-07, + "loss": 0.3144, + "step": 11389 + }, + { + "epoch": 0.9, + "learning_rate": 4.955590925988896e-07, + "loss": 0.3366, + "step": 11390 + }, + { + "epoch": 0.9, + "learning_rate": 4.947616377229492e-07, + "loss": 0.3165, + "step": 11391 + }, + { + "epoch": 0.9, + "learning_rate": 4.939648087212168e-07, + "loss": 0.3978, + "step": 11392 + }, + { + "epoch": 0.9, + "learning_rate": 4.931686056461626e-07, + "loss": 0.3128, + "step": 11393 + }, + { + "epoch": 0.9, + "learning_rate": 4.923730285502126e-07, + "loss": 0.3964, + "step": 11394 + }, + { + "epoch": 0.9, + "learning_rate": 4.915780774857504e-07, + "loss": 0.4333, + "step": 11395 + }, + { + "epoch": 0.9, + "learning_rate": 4.907837525051196e-07, + "loss": 0.2787, + "step": 11396 + }, + { + "epoch": 0.9, + "learning_rate": 4.89990053660624e-07, + "loss": 0.4344, + "step": 11397 + }, + { + "epoch": 0.9, + "learning_rate": 4.891969810045239e-07, + "loss": 0.3895, + "step": 11398 + }, + { + "epoch": 0.9, + "learning_rate": 4.884045345890387e-07, + "loss": 0.3341, + "step": 11399 + }, + { + "epoch": 0.9, + "learning_rate": 4.87612714466349e-07, + "loss": 0.3355, + "step": 11400 + }, + { + "epoch": 0.9, + "learning_rate": 4.868215206885918e-07, + "loss": 0.321, + "step": 11401 + }, + { + "epoch": 0.9, + "learning_rate": 4.860309533078611e-07, + "loss": 0.3097, + "step": 11402 + }, + { + "epoch": 0.9, + "learning_rate": 4.852410123762164e-07, + "loss": 0.438, + "step": 11403 + }, + { + "epoch": 0.9, + "learning_rate": 4.844516979456671e-07, + "loss": 0.3916, + "step": 11404 + }, + { + "epoch": 0.9, + "learning_rate": 4.836630100681872e-07, + "loss": 0.2626, + "step": 11405 + }, + { + "epoch": 0.9, + "learning_rate": 4.828749487957097e-07, + "loss": 0.4684, + "step": 11406 + }, + { + "epoch": 0.9, + "learning_rate": 4.82087514180124e-07, + "loss": 0.2799, + "step": 11407 + }, + { + "epoch": 0.9, + "learning_rate": 4.813007062732756e-07, + "loss": 0.2893, + "step": 11408 + }, + { + "epoch": 0.9, + "learning_rate": 4.805145251269772e-07, + "loss": 0.2501, + "step": 11409 + }, + { + "epoch": 0.9, + "learning_rate": 4.797289707929919e-07, + "loss": 0.3186, + "step": 11410 + }, + { + "epoch": 0.9, + "learning_rate": 4.789440433230452e-07, + "loss": 0.3082, + "step": 11411 + }, + { + "epoch": 0.9, + "learning_rate": 4.781597427688189e-07, + "loss": 0.3525, + "step": 11412 + }, + { + "epoch": 0.9, + "learning_rate": 4.773760691819596e-07, + "loss": 0.3071, + "step": 11413 + }, + { + "epoch": 0.9, + "learning_rate": 4.765930226140658e-07, + "loss": 0.3358, + "step": 11414 + }, + { + "epoch": 0.9, + "learning_rate": 4.7581060311669757e-07, + "loss": 0.3336, + "step": 11415 + }, + { + "epoch": 0.9, + "learning_rate": 4.7502881074137476e-07, + "loss": 0.3571, + "step": 11416 + }, + { + "epoch": 0.9, + "learning_rate": 4.742476455395706e-07, + "loss": 0.3202, + "step": 11417 + }, + { + "epoch": 0.9, + "learning_rate": 4.734671075627262e-07, + "loss": 0.3015, + "step": 11418 + }, + { + "epoch": 0.9, + "learning_rate": 4.726871968622337e-07, + "loss": 0.3626, + "step": 11419 + }, + { + "epoch": 0.9, + "learning_rate": 4.7190791348944777e-07, + "loss": 0.2948, + "step": 11420 + }, + { + "epoch": 0.9, + "learning_rate": 4.711292574956772e-07, + "loss": 0.289, + "step": 11421 + }, + { + "epoch": 0.9, + "learning_rate": 4.7035122893219653e-07, + "loss": 0.319, + "step": 11422 + }, + { + "epoch": 0.9, + "learning_rate": 4.695738278502338e-07, + "loss": 0.3458, + "step": 11423 + }, + { + "epoch": 0.91, + "learning_rate": 4.6879705430097566e-07, + "loss": 0.2575, + "step": 11424 + }, + { + "epoch": 0.91, + "learning_rate": 4.6802090833557136e-07, + "loss": 0.4024, + "step": 11425 + }, + { + "epoch": 0.91, + "learning_rate": 4.6724539000512546e-07, + "loss": 0.2007, + "step": 11426 + }, + { + "epoch": 0.91, + "learning_rate": 4.6647049936070054e-07, + "loss": 0.333, + "step": 11427 + }, + { + "epoch": 0.91, + "learning_rate": 4.656962364533224e-07, + "loss": 0.2626, + "step": 11428 + }, + { + "epoch": 0.91, + "learning_rate": 4.649226013339703e-07, + "loss": 0.3398, + "step": 11429 + }, + { + "epoch": 0.91, + "learning_rate": 4.641495940535845e-07, + "loss": 0.2962, + "step": 11430 + }, + { + "epoch": 0.91, + "learning_rate": 4.633772146630655e-07, + "loss": 0.3674, + "step": 11431 + }, + { + "epoch": 0.91, + "learning_rate": 4.626054632132693e-07, + "loss": 0.4311, + "step": 11432 + }, + { + "epoch": 0.91, + "learning_rate": 4.6183433975501067e-07, + "loss": 0.345, + "step": 11433 + }, + { + "epoch": 0.91, + "learning_rate": 4.61063844339068e-07, + "loss": 0.3084, + "step": 11434 + }, + { + "epoch": 0.91, + "learning_rate": 4.6029397701617296e-07, + "loss": 0.4026, + "step": 11435 + }, + { + "epoch": 0.91, + "learning_rate": 4.595247378370171e-07, + "loss": 0.4222, + "step": 11436 + }, + { + "epoch": 0.91, + "learning_rate": 4.5875612685225e-07, + "loss": 0.2897, + "step": 11437 + }, + { + "epoch": 0.91, + "learning_rate": 4.5798814411248336e-07, + "loss": 0.3442, + "step": 11438 + }, + { + "epoch": 0.91, + "learning_rate": 4.5722078966828455e-07, + "loss": 0.3739, + "step": 11439 + }, + { + "epoch": 0.91, + "learning_rate": 4.5645406357017865e-07, + "loss": 0.3343, + "step": 11440 + }, + { + "epoch": 0.91, + "learning_rate": 4.5568796586865304e-07, + "loss": 0.323, + "step": 11441 + }, + { + "epoch": 0.91, + "learning_rate": 4.5492249661415077e-07, + "loss": 0.3881, + "step": 11442 + }, + { + "epoch": 0.91, + "learning_rate": 4.541576558570726e-07, + "loss": 0.351, + "step": 11443 + }, + { + "epoch": 0.91, + "learning_rate": 4.533934436477827e-07, + "loss": 0.3588, + "step": 11444 + }, + { + "epoch": 0.91, + "learning_rate": 4.526298600365997e-07, + "loss": 0.2933, + "step": 11445 + }, + { + "epoch": 0.91, + "learning_rate": 4.5186690507379894e-07, + "loss": 0.278, + "step": 11446 + }, + { + "epoch": 0.91, + "learning_rate": 4.5110457880962246e-07, + "loss": 0.2881, + "step": 11447 + }, + { + "epoch": 0.91, + "learning_rate": 4.503428812942623e-07, + "loss": 0.3573, + "step": 11448 + }, + { + "epoch": 0.91, + "learning_rate": 4.495818125778717e-07, + "loss": 0.3919, + "step": 11449 + }, + { + "epoch": 0.91, + "learning_rate": 4.488213727105672e-07, + "loss": 0.3253, + "step": 11450 + }, + { + "epoch": 0.91, + "learning_rate": 4.4806156174241776e-07, + "loss": 0.2969, + "step": 11451 + }, + { + "epoch": 0.91, + "learning_rate": 4.4730237972345326e-07, + "loss": 0.2072, + "step": 11452 + }, + { + "epoch": 0.91, + "learning_rate": 4.465438267036604e-07, + "loss": 0.4086, + "step": 11453 + }, + { + "epoch": 0.91, + "learning_rate": 4.4578590273299027e-07, + "loss": 0.2709, + "step": 11454 + }, + { + "epoch": 0.91, + "learning_rate": 4.4502860786134747e-07, + "loss": 0.3398, + "step": 11455 + }, + { + "epoch": 0.91, + "learning_rate": 4.4427194213859216e-07, + "loss": 0.3787, + "step": 11456 + }, + { + "epoch": 0.91, + "learning_rate": 4.435159056145533e-07, + "loss": 0.3348, + "step": 11457 + }, + { + "epoch": 0.91, + "learning_rate": 4.427604983390077e-07, + "loss": 0.3398, + "step": 11458 + }, + { + "epoch": 0.91, + "learning_rate": 4.420057203616956e-07, + "loss": 0.4297, + "step": 11459 + }, + { + "epoch": 0.91, + "learning_rate": 4.4125157173231847e-07, + "loss": 0.233, + "step": 11460 + }, + { + "epoch": 0.91, + "learning_rate": 4.40498052500532e-07, + "loss": 0.355, + "step": 11461 + }, + { + "epoch": 0.91, + "learning_rate": 4.397451627159499e-07, + "loss": 0.2922, + "step": 11462 + }, + { + "epoch": 0.91, + "learning_rate": 4.389929024281492e-07, + "loss": 0.3856, + "step": 11463 + }, + { + "epoch": 0.91, + "learning_rate": 4.382412716866602e-07, + "loss": 0.3362, + "step": 11464 + }, + { + "epoch": 0.91, + "learning_rate": 4.374902705409745e-07, + "loss": 0.3239, + "step": 11465 + }, + { + "epoch": 0.91, + "learning_rate": 4.367398990405447e-07, + "loss": 0.3526, + "step": 11466 + }, + { + "epoch": 0.91, + "learning_rate": 4.359901572347758e-07, + "loss": 0.3134, + "step": 11467 + }, + { + "epoch": 0.91, + "learning_rate": 4.3524104517303714e-07, + "loss": 0.238, + "step": 11468 + }, + { + "epoch": 0.91, + "learning_rate": 4.3449256290465035e-07, + "loss": 0.4064, + "step": 11469 + }, + { + "epoch": 0.91, + "learning_rate": 4.3374471047890497e-07, + "loss": 0.3134, + "step": 11470 + }, + { + "epoch": 0.91, + "learning_rate": 4.329974879450394e-07, + "loss": 0.416, + "step": 11471 + }, + { + "epoch": 0.91, + "learning_rate": 4.3225089535225415e-07, + "loss": 0.3565, + "step": 11472 + }, + { + "epoch": 0.91, + "learning_rate": 4.3150493274971227e-07, + "loss": 0.3645, + "step": 11473 + }, + { + "epoch": 0.91, + "learning_rate": 4.3075960018652995e-07, + "loss": 0.3852, + "step": 11474 + }, + { + "epoch": 0.91, + "learning_rate": 4.300148977117824e-07, + "loss": 0.3864, + "step": 11475 + }, + { + "epoch": 0.91, + "learning_rate": 4.2927082537450705e-07, + "loss": 0.2641, + "step": 11476 + }, + { + "epoch": 0.91, + "learning_rate": 4.285273832236969e-07, + "loss": 0.2194, + "step": 11477 + }, + { + "epoch": 0.91, + "learning_rate": 4.277845713083018e-07, + "loss": 0.3662, + "step": 11478 + }, + { + "epoch": 0.91, + "learning_rate": 4.2704238967723574e-07, + "loss": 0.3145, + "step": 11479 + }, + { + "epoch": 0.91, + "learning_rate": 4.2630083837936654e-07, + "loss": 0.2971, + "step": 11480 + }, + { + "epoch": 0.91, + "learning_rate": 4.2555991746352054e-07, + "loss": 0.3663, + "step": 11481 + }, + { + "epoch": 0.91, + "learning_rate": 4.2481962697848323e-07, + "loss": 0.4088, + "step": 11482 + }, + { + "epoch": 0.91, + "learning_rate": 4.240799669730034e-07, + "loss": 0.3215, + "step": 11483 + }, + { + "epoch": 0.91, + "learning_rate": 4.2334093749577975e-07, + "loss": 0.3443, + "step": 11484 + }, + { + "epoch": 0.91, + "learning_rate": 4.226025385954746e-07, + "loss": 0.3072, + "step": 11485 + }, + { + "epoch": 0.91, + "learning_rate": 4.218647703207113e-07, + "loss": 0.2754, + "step": 11486 + }, + { + "epoch": 0.91, + "learning_rate": 4.211276327200642e-07, + "loss": 0.3135, + "step": 11487 + }, + { + "epoch": 0.91, + "learning_rate": 4.203911258420712e-07, + "loss": 0.3465, + "step": 11488 + }, + { + "epoch": 0.91, + "learning_rate": 4.196552497352302e-07, + "loss": 0.2638, + "step": 11489 + }, + { + "epoch": 0.91, + "learning_rate": 4.189200044479924e-07, + "loss": 0.3703, + "step": 11490 + }, + { + "epoch": 0.91, + "learning_rate": 4.1818539002877024e-07, + "loss": 0.3984, + "step": 11491 + }, + { + "epoch": 0.91, + "learning_rate": 4.174514065259383e-07, + "loss": 0.3081, + "step": 11492 + }, + { + "epoch": 0.91, + "learning_rate": 4.167180539878213e-07, + "loss": 0.284, + "step": 11493 + }, + { + "epoch": 0.91, + "learning_rate": 4.1598533246270833e-07, + "loss": 0.3355, + "step": 11494 + }, + { + "epoch": 0.91, + "learning_rate": 4.152532419988453e-07, + "loss": 0.4341, + "step": 11495 + }, + { + "epoch": 0.91, + "learning_rate": 4.145217826444392e-07, + "loss": 0.4302, + "step": 11496 + }, + { + "epoch": 0.91, + "learning_rate": 4.1379095444764926e-07, + "loss": 0.4009, + "step": 11497 + }, + { + "epoch": 0.91, + "learning_rate": 4.130607574566003e-07, + "loss": 0.4427, + "step": 11498 + }, + { + "epoch": 0.91, + "learning_rate": 4.1233119171937065e-07, + "loss": 0.3487, + "step": 11499 + }, + { + "epoch": 0.91, + "learning_rate": 4.116022572839984e-07, + "loss": 0.334, + "step": 11500 + }, + { + "epoch": 0.91, + "learning_rate": 4.1087395419848186e-07, + "loss": 0.3252, + "step": 11501 + }, + { + "epoch": 0.91, + "learning_rate": 4.10146282510776e-07, + "loss": 0.3318, + "step": 11502 + }, + { + "epoch": 0.91, + "learning_rate": 4.094192422687926e-07, + "loss": 0.2432, + "step": 11503 + }, + { + "epoch": 0.91, + "learning_rate": 4.0869283352040656e-07, + "loss": 0.4293, + "step": 11504 + }, + { + "epoch": 0.91, + "learning_rate": 4.079670563134475e-07, + "loss": 0.299, + "step": 11505 + }, + { + "epoch": 0.91, + "learning_rate": 4.072419106957026e-07, + "loss": 0.3444, + "step": 11506 + }, + { + "epoch": 0.91, + "learning_rate": 4.065173967149205e-07, + "loss": 0.2582, + "step": 11507 + }, + { + "epoch": 0.91, + "learning_rate": 4.057935144188074e-07, + "loss": 0.2545, + "step": 11508 + }, + { + "epoch": 0.91, + "learning_rate": 4.0507026385502747e-07, + "loss": 0.3376, + "step": 11509 + }, + { + "epoch": 0.91, + "learning_rate": 4.043476450712014e-07, + "loss": 0.3282, + "step": 11510 + }, + { + "epoch": 0.91, + "learning_rate": 4.036256581149123e-07, + "loss": 0.4305, + "step": 11511 + }, + { + "epoch": 0.91, + "learning_rate": 4.0290430303369876e-07, + "loss": 0.3323, + "step": 11512 + }, + { + "epoch": 0.91, + "learning_rate": 4.021835798750584e-07, + "loss": 0.4596, + "step": 11513 + }, + { + "epoch": 0.91, + "learning_rate": 4.0146348868644767e-07, + "loss": 0.3945, + "step": 11514 + }, + { + "epoch": 0.91, + "learning_rate": 4.0074402951528204e-07, + "loss": 0.2587, + "step": 11515 + }, + { + "epoch": 0.91, + "learning_rate": 4.000252024089313e-07, + "loss": 0.2585, + "step": 11516 + }, + { + "epoch": 0.91, + "learning_rate": 3.9930700741473093e-07, + "loss": 0.4487, + "step": 11517 + }, + { + "epoch": 0.91, + "learning_rate": 3.985894445799676e-07, + "loss": 0.4101, + "step": 11518 + }, + { + "epoch": 0.91, + "learning_rate": 3.978725139518891e-07, + "loss": 0.3197, + "step": 11519 + }, + { + "epoch": 0.91, + "learning_rate": 3.9715621557770535e-07, + "loss": 0.3434, + "step": 11520 + }, + { + "epoch": 0.91, + "learning_rate": 3.9644054950457753e-07, + "loss": 0.4126, + "step": 11521 + }, + { + "epoch": 0.91, + "learning_rate": 3.9572551577963135e-07, + "loss": 0.4224, + "step": 11522 + }, + { + "epoch": 0.91, + "learning_rate": 3.9501111444994576e-07, + "loss": 0.3349, + "step": 11523 + }, + { + "epoch": 0.91, + "learning_rate": 3.9429734556256205e-07, + "loss": 0.4454, + "step": 11524 + }, + { + "epoch": 0.91, + "learning_rate": 3.9358420916447927e-07, + "loss": 0.3969, + "step": 11525 + }, + { + "epoch": 0.91, + "learning_rate": 3.9287170530265206e-07, + "loss": 0.3631, + "step": 11526 + }, + { + "epoch": 0.91, + "learning_rate": 3.9215983402399736e-07, + "loss": 0.2957, + "step": 11527 + }, + { + "epoch": 0.91, + "learning_rate": 3.914485953753888e-07, + "loss": 0.2347, + "step": 11528 + }, + { + "epoch": 0.91, + "learning_rate": 3.907379894036545e-07, + "loss": 0.448, + "step": 11529 + }, + { + "epoch": 0.91, + "learning_rate": 3.9002801615558805e-07, + "loss": 0.4525, + "step": 11530 + }, + { + "epoch": 0.91, + "learning_rate": 3.893186756779366e-07, + "loss": 0.3844, + "step": 11531 + }, + { + "epoch": 0.91, + "learning_rate": 3.886099680174049e-07, + "loss": 0.3259, + "step": 11532 + }, + { + "epoch": 0.91, + "learning_rate": 3.879018932206624e-07, + "loss": 0.3473, + "step": 11533 + }, + { + "epoch": 0.91, + "learning_rate": 3.871944513343284e-07, + "loss": 0.3887, + "step": 11534 + }, + { + "epoch": 0.91, + "learning_rate": 3.864876424049857e-07, + "loss": 0.375, + "step": 11535 + }, + { + "epoch": 0.91, + "learning_rate": 3.857814664791748e-07, + "loss": 0.2714, + "step": 11536 + }, + { + "epoch": 0.91, + "learning_rate": 3.8507592360339407e-07, + "loss": 0.4141, + "step": 11537 + }, + { + "epoch": 0.91, + "learning_rate": 3.843710138240997e-07, + "loss": 0.3234, + "step": 11538 + }, + { + "epoch": 0.91, + "learning_rate": 3.8366673718770564e-07, + "loss": 0.2506, + "step": 11539 + }, + { + "epoch": 0.91, + "learning_rate": 3.8296309374058704e-07, + "loss": 0.3222, + "step": 11540 + }, + { + "epoch": 0.91, + "learning_rate": 3.8226008352907464e-07, + "loss": 0.2802, + "step": 11541 + }, + { + "epoch": 0.91, + "learning_rate": 3.815577065994569e-07, + "loss": 0.18, + "step": 11542 + }, + { + "epoch": 0.91, + "learning_rate": 3.8085596299798465e-07, + "loss": 0.4598, + "step": 11543 + }, + { + "epoch": 0.91, + "learning_rate": 3.801548527708621e-07, + "loss": 0.3214, + "step": 11544 + }, + { + "epoch": 0.91, + "learning_rate": 3.794543759642544e-07, + "loss": 0.2872, + "step": 11545 + }, + { + "epoch": 0.91, + "learning_rate": 3.7875453262428584e-07, + "loss": 0.3456, + "step": 11546 + }, + { + "epoch": 0.91, + "learning_rate": 3.7805532279703625e-07, + "loss": 0.2847, + "step": 11547 + }, + { + "epoch": 0.91, + "learning_rate": 3.773567465285455e-07, + "loss": 0.3713, + "step": 11548 + }, + { + "epoch": 0.91, + "learning_rate": 3.7665880386481226e-07, + "loss": 0.3774, + "step": 11549 + }, + { + "epoch": 0.92, + "learning_rate": 3.759614948517931e-07, + "loss": 0.3269, + "step": 11550 + }, + { + "epoch": 0.92, + "learning_rate": 3.7526481953539915e-07, + "loss": 0.3242, + "step": 11551 + }, + { + "epoch": 0.92, + "learning_rate": 3.74568777961507e-07, + "loss": 0.3681, + "step": 11552 + }, + { + "epoch": 0.92, + "learning_rate": 3.7387337017594674e-07, + "loss": 0.2631, + "step": 11553 + }, + { + "epoch": 0.92, + "learning_rate": 3.7317859622450714e-07, + "loss": 0.3018, + "step": 11554 + }, + { + "epoch": 0.92, + "learning_rate": 3.7248445615293506e-07, + "loss": 0.3842, + "step": 11555 + }, + { + "epoch": 0.92, + "learning_rate": 3.7179095000693723e-07, + "loss": 0.3327, + "step": 11556 + }, + { + "epoch": 0.92, + "learning_rate": 3.710980778321771e-07, + "loss": 0.3379, + "step": 11557 + }, + { + "epoch": 0.92, + "learning_rate": 3.70405839674276e-07, + "loss": 0.3062, + "step": 11558 + }, + { + "epoch": 0.92, + "learning_rate": 3.697142355788175e-07, + "loss": 0.3749, + "step": 11559 + }, + { + "epoch": 0.92, + "learning_rate": 3.6902326559133836e-07, + "loss": 0.3217, + "step": 11560 + }, + { + "epoch": 0.92, + "learning_rate": 3.683329297573346e-07, + "loss": 0.3393, + "step": 11561 + }, + { + "epoch": 0.92, + "learning_rate": 3.6764322812226416e-07, + "loss": 0.2781, + "step": 11562 + }, + { + "epoch": 0.92, + "learning_rate": 3.669541607315397e-07, + "loss": 0.3455, + "step": 11563 + }, + { + "epoch": 0.92, + "learning_rate": 3.6626572763053034e-07, + "loss": 0.3987, + "step": 11564 + }, + { + "epoch": 0.92, + "learning_rate": 3.6557792886457e-07, + "loss": 0.3516, + "step": 11565 + }, + { + "epoch": 0.92, + "learning_rate": 3.6489076447894456e-07, + "loss": 0.3613, + "step": 11566 + }, + { + "epoch": 0.92, + "learning_rate": 3.642042345189023e-07, + "loss": 0.4027, + "step": 11567 + }, + { + "epoch": 0.92, + "learning_rate": 3.6351833902964485e-07, + "loss": 0.3906, + "step": 11568 + }, + { + "epoch": 0.92, + "learning_rate": 3.6283307805633714e-07, + "loss": 0.3645, + "step": 11569 + }, + { + "epoch": 0.92, + "learning_rate": 3.6214845164410205e-07, + "loss": 0.3196, + "step": 11570 + }, + { + "epoch": 0.92, + "learning_rate": 3.614644598380157e-07, + "loss": 0.4127, + "step": 11571 + }, + { + "epoch": 0.92, + "learning_rate": 3.607811026831176e-07, + "loss": 0.423, + "step": 11572 + }, + { + "epoch": 0.92, + "learning_rate": 3.600983802244007e-07, + "loss": 0.3461, + "step": 11573 + }, + { + "epoch": 0.92, + "learning_rate": 3.594162925068234e-07, + "loss": 0.2725, + "step": 11574 + }, + { + "epoch": 0.92, + "learning_rate": 3.587348395752954e-07, + "loss": 0.5053, + "step": 11575 + }, + { + "epoch": 0.92, + "learning_rate": 3.5805402147468746e-07, + "loss": 0.3769, + "step": 11576 + }, + { + "epoch": 0.92, + "learning_rate": 3.573738382498271e-07, + "loss": 0.3648, + "step": 11577 + }, + { + "epoch": 0.92, + "learning_rate": 3.566942899455039e-07, + "loss": 0.3771, + "step": 11578 + }, + { + "epoch": 0.92, + "learning_rate": 3.5601537660646e-07, + "loss": 0.3777, + "step": 11579 + }, + { + "epoch": 0.92, + "learning_rate": 3.553370982773985e-07, + "loss": 0.3207, + "step": 11580 + }, + { + "epoch": 0.92, + "learning_rate": 3.546594550029836e-07, + "loss": 0.3238, + "step": 11581 + }, + { + "epoch": 0.92, + "learning_rate": 3.53982446827833e-07, + "loss": 0.244, + "step": 11582 + }, + { + "epoch": 0.92, + "learning_rate": 3.533060737965244e-07, + "loss": 0.2592, + "step": 11583 + }, + { + "epoch": 0.92, + "learning_rate": 3.526303359535932e-07, + "loss": 0.313, + "step": 11584 + }, + { + "epoch": 0.92, + "learning_rate": 3.519552333435361e-07, + "loss": 0.2862, + "step": 11585 + }, + { + "epoch": 0.92, + "learning_rate": 3.5128076601080087e-07, + "loss": 0.3183, + "step": 11586 + }, + { + "epoch": 0.92, + "learning_rate": 3.5060693399980194e-07, + "loss": 0.39, + "step": 11587 + }, + { + "epoch": 0.92, + "learning_rate": 3.499337373549072e-07, + "loss": 0.2972, + "step": 11588 + }, + { + "epoch": 0.92, + "learning_rate": 3.4926117612044117e-07, + "loss": 0.4211, + "step": 11589 + }, + { + "epoch": 0.92, + "learning_rate": 3.485892503406907e-07, + "loss": 0.3813, + "step": 11590 + }, + { + "epoch": 0.92, + "learning_rate": 3.4791796005989917e-07, + "loss": 0.3087, + "step": 11591 + }, + { + "epoch": 0.92, + "learning_rate": 3.4724730532226693e-07, + "loss": 0.3715, + "step": 11592 + }, + { + "epoch": 0.92, + "learning_rate": 3.4657728617195295e-07, + "loss": 0.4016, + "step": 11593 + }, + { + "epoch": 0.92, + "learning_rate": 3.459079026530754e-07, + "loss": 0.2264, + "step": 11594 + }, + { + "epoch": 0.92, + "learning_rate": 3.4523915480971113e-07, + "loss": 0.2143, + "step": 11595 + }, + { + "epoch": 0.92, + "learning_rate": 3.445710426858906e-07, + "loss": 0.3246, + "step": 11596 + }, + { + "epoch": 0.92, + "learning_rate": 3.439035663256096e-07, + "loss": 0.2536, + "step": 11597 + }, + { + "epoch": 0.92, + "learning_rate": 3.4323672577281754e-07, + "loss": 0.3375, + "step": 11598 + }, + { + "epoch": 0.92, + "learning_rate": 3.425705210714192e-07, + "loss": 0.3043, + "step": 11599 + }, + { + "epoch": 0.92, + "learning_rate": 3.419049522652851e-07, + "loss": 0.4295, + "step": 11600 + }, + { + "epoch": 0.92, + "learning_rate": 3.412400193982379e-07, + "loss": 0.2557, + "step": 11601 + }, + { + "epoch": 0.92, + "learning_rate": 3.4057572251405936e-07, + "loss": 0.3263, + "step": 11602 + }, + { + "epoch": 0.92, + "learning_rate": 3.3991206165649213e-07, + "loss": 0.2582, + "step": 11603 + }, + { + "epoch": 0.92, + "learning_rate": 3.392490368692347e-07, + "loss": 0.3434, + "step": 11604 + }, + { + "epoch": 0.92, + "learning_rate": 3.385866481959432e-07, + "loss": 0.4292, + "step": 11605 + }, + { + "epoch": 0.92, + "learning_rate": 3.379248956802328e-07, + "loss": 0.3758, + "step": 11606 + }, + { + "epoch": 0.92, + "learning_rate": 3.3726377936567856e-07, + "loss": 0.2419, + "step": 11607 + }, + { + "epoch": 0.92, + "learning_rate": 3.3660329929580904e-07, + "loss": 0.3142, + "step": 11608 + }, + { + "epoch": 0.92, + "learning_rate": 3.3594345551411503e-07, + "loss": 0.3919, + "step": 11609 + }, + { + "epoch": 0.92, + "learning_rate": 3.352842480640439e-07, + "loss": 0.2617, + "step": 11610 + }, + { + "epoch": 0.92, + "learning_rate": 3.346256769890022e-07, + "loss": 0.3078, + "step": 11611 + }, + { + "epoch": 0.92, + "learning_rate": 3.3396774233235173e-07, + "loss": 0.3123, + "step": 11612 + }, + { + "epoch": 0.92, + "learning_rate": 3.333104441374158e-07, + "loss": 0.4089, + "step": 11613 + }, + { + "epoch": 0.92, + "learning_rate": 3.32653782447474e-07, + "loss": 0.3747, + "step": 11614 + }, + { + "epoch": 0.92, + "learning_rate": 3.319977573057642e-07, + "loss": 0.3544, + "step": 11615 + }, + { + "epoch": 0.92, + "learning_rate": 3.313423687554829e-07, + "loss": 0.5045, + "step": 11616 + }, + { + "epoch": 0.92, + "learning_rate": 3.3068761683978434e-07, + "loss": 0.2535, + "step": 11617 + }, + { + "epoch": 0.92, + "learning_rate": 3.3003350160177974e-07, + "loss": 0.3323, + "step": 11618 + }, + { + "epoch": 0.92, + "learning_rate": 3.293800230845412e-07, + "loss": 0.2745, + "step": 11619 + }, + { + "epoch": 0.92, + "learning_rate": 3.287271813310955e-07, + "loss": 0.3605, + "step": 11620 + }, + { + "epoch": 0.92, + "learning_rate": 3.280749763844293e-07, + "loss": 0.375, + "step": 11621 + }, + { + "epoch": 0.92, + "learning_rate": 3.274234082874872e-07, + "loss": 0.3686, + "step": 11622 + }, + { + "epoch": 0.92, + "learning_rate": 3.267724770831737e-07, + "loss": 0.3476, + "step": 11623 + }, + { + "epoch": 0.92, + "learning_rate": 3.2612218281434794e-07, + "loss": 0.2777, + "step": 11624 + }, + { + "epoch": 0.92, + "learning_rate": 3.254725255238267e-07, + "loss": 0.5198, + "step": 11625 + }, + { + "epoch": 0.92, + "learning_rate": 3.2482350525439023e-07, + "loss": 0.2957, + "step": 11626 + }, + { + "epoch": 0.92, + "learning_rate": 3.241751220487721e-07, + "loss": 0.4522, + "step": 11627 + }, + { + "epoch": 0.92, + "learning_rate": 3.235273759496638e-07, + "loss": 0.3259, + "step": 11628 + }, + { + "epoch": 0.92, + "learning_rate": 3.2288026699971884e-07, + "loss": 0.1901, + "step": 11629 + }, + { + "epoch": 0.92, + "learning_rate": 3.222337952415455e-07, + "loss": 0.2677, + "step": 11630 + }, + { + "epoch": 0.92, + "learning_rate": 3.215879607177086e-07, + "loss": 0.3505, + "step": 11631 + }, + { + "epoch": 0.92, + "learning_rate": 3.2094276347073626e-07, + "loss": 0.4793, + "step": 11632 + }, + { + "epoch": 0.92, + "learning_rate": 3.2029820354311014e-07, + "loss": 0.3729, + "step": 11633 + }, + { + "epoch": 0.92, + "learning_rate": 3.196542809772707e-07, + "loss": 0.3598, + "step": 11634 + }, + { + "epoch": 0.92, + "learning_rate": 3.1901099581561846e-07, + "loss": 0.3771, + "step": 11635 + }, + { + "epoch": 0.92, + "learning_rate": 3.183683481005106e-07, + "loss": 0.3036, + "step": 11636 + }, + { + "epoch": 0.92, + "learning_rate": 3.1772633787426233e-07, + "loss": 0.292, + "step": 11637 + }, + { + "epoch": 0.92, + "learning_rate": 3.1708496517914523e-07, + "loss": 0.4238, + "step": 11638 + }, + { + "epoch": 0.92, + "learning_rate": 3.1644423005739335e-07, + "loss": 0.3217, + "step": 11639 + }, + { + "epoch": 0.92, + "learning_rate": 3.15804132551194e-07, + "loss": 0.3099, + "step": 11640 + }, + { + "epoch": 0.92, + "learning_rate": 3.151646727026947e-07, + "loss": 0.3607, + "step": 11641 + }, + { + "epoch": 0.92, + "learning_rate": 3.1452585055400167e-07, + "loss": 0.3256, + "step": 11642 + }, + { + "epoch": 0.92, + "learning_rate": 3.138876661471779e-07, + "loss": 0.2827, + "step": 11643 + }, + { + "epoch": 0.92, + "learning_rate": 3.1325011952424435e-07, + "loss": 0.3441, + "step": 11644 + }, + { + "epoch": 0.92, + "learning_rate": 3.1261321072718063e-07, + "loss": 0.4465, + "step": 11645 + }, + { + "epoch": 0.92, + "learning_rate": 3.1197693979792556e-07, + "loss": 0.3487, + "step": 11646 + }, + { + "epoch": 0.92, + "learning_rate": 3.1134130677837103e-07, + "loss": 0.4117, + "step": 11647 + }, + { + "epoch": 0.92, + "learning_rate": 3.107063117103759e-07, + "loss": 0.3025, + "step": 11648 + }, + { + "epoch": 0.92, + "learning_rate": 3.100719546357467e-07, + "loss": 0.3015, + "step": 11649 + }, + { + "epoch": 0.92, + "learning_rate": 3.0943823559625217e-07, + "loss": 0.3972, + "step": 11650 + }, + { + "epoch": 0.92, + "learning_rate": 3.088051546336246e-07, + "loss": 0.4694, + "step": 11651 + }, + { + "epoch": 0.92, + "learning_rate": 3.08172711789545e-07, + "loss": 0.3672, + "step": 11652 + }, + { + "epoch": 0.92, + "learning_rate": 3.0754090710565785e-07, + "loss": 0.4418, + "step": 11653 + }, + { + "epoch": 0.92, + "learning_rate": 3.069097406235666e-07, + "loss": 0.511, + "step": 11654 + }, + { + "epoch": 0.92, + "learning_rate": 3.0627921238482794e-07, + "loss": 0.3405, + "step": 11655 + }, + { + "epoch": 0.92, + "learning_rate": 3.056493224309587e-07, + "loss": 0.3881, + "step": 11656 + }, + { + "epoch": 0.92, + "learning_rate": 3.0502007080343675e-07, + "loss": 0.3236, + "step": 11657 + }, + { + "epoch": 0.92, + "learning_rate": 3.043914575436946e-07, + "loss": 0.3485, + "step": 11658 + }, + { + "epoch": 0.92, + "learning_rate": 3.0376348269312017e-07, + "loss": 0.3, + "step": 11659 + }, + { + "epoch": 0.92, + "learning_rate": 3.031361462930671e-07, + "loss": 0.2664, + "step": 11660 + }, + { + "epoch": 0.92, + "learning_rate": 3.025094483848401e-07, + "loss": 0.3022, + "step": 11661 + }, + { + "epoch": 0.92, + "learning_rate": 3.0188338900970505e-07, + "loss": 0.4007, + "step": 11662 + }, + { + "epoch": 0.92, + "learning_rate": 3.0125796820888343e-07, + "loss": 0.3305, + "step": 11663 + }, + { + "epoch": 0.92, + "learning_rate": 3.0063318602355787e-07, + "loss": 0.3656, + "step": 11664 + }, + { + "epoch": 0.92, + "learning_rate": 3.000090424948665e-07, + "loss": 0.3938, + "step": 11665 + }, + { + "epoch": 0.92, + "learning_rate": 2.993855376639054e-07, + "loss": 0.4178, + "step": 11666 + }, + { + "epoch": 0.92, + "learning_rate": 2.987626715717318e-07, + "loss": 0.473, + "step": 11667 + }, + { + "epoch": 0.92, + "learning_rate": 2.9814044425935605e-07, + "loss": 0.2983, + "step": 11668 + }, + { + "epoch": 0.92, + "learning_rate": 2.9751885576774887e-07, + "loss": 0.3872, + "step": 11669 + }, + { + "epoch": 0.92, + "learning_rate": 2.9689790613784073e-07, + "loss": 0.3717, + "step": 11670 + }, + { + "epoch": 0.92, + "learning_rate": 2.962775954105179e-07, + "loss": 0.2776, + "step": 11671 + }, + { + "epoch": 0.92, + "learning_rate": 2.9565792362662213e-07, + "loss": 0.2503, + "step": 11672 + }, + { + "epoch": 0.92, + "learning_rate": 2.9503889082695967e-07, + "loss": 0.3741, + "step": 11673 + }, + { + "epoch": 0.92, + "learning_rate": 2.9442049705228794e-07, + "loss": 0.3097, + "step": 11674 + }, + { + "epoch": 0.92, + "learning_rate": 2.938027423433254e-07, + "loss": 0.239, + "step": 11675 + }, + { + "epoch": 0.93, + "learning_rate": 2.931856267407507e-07, + "loss": 0.3157, + "step": 11676 + }, + { + "epoch": 0.93, + "learning_rate": 2.9256915028519575e-07, + "loss": 0.3759, + "step": 11677 + }, + { + "epoch": 0.93, + "learning_rate": 2.919533130172536e-07, + "loss": 0.35, + "step": 11678 + }, + { + "epoch": 0.93, + "learning_rate": 2.913381149774719e-07, + "loss": 0.2461, + "step": 11679 + }, + { + "epoch": 0.93, + "learning_rate": 2.907235562063615e-07, + "loss": 0.3628, + "step": 11680 + }, + { + "epoch": 0.93, + "learning_rate": 2.9010963674438674e-07, + "loss": 0.4231, + "step": 11681 + }, + { + "epoch": 0.93, + "learning_rate": 2.8949635663197087e-07, + "loss": 0.2851, + "step": 11682 + }, + { + "epoch": 0.93, + "learning_rate": 2.8888371590949703e-07, + "loss": 0.3082, + "step": 11683 + }, + { + "epoch": 0.93, + "learning_rate": 2.882717146173031e-07, + "loss": 0.3448, + "step": 11684 + }, + { + "epoch": 0.93, + "learning_rate": 2.8766035279568563e-07, + "loss": 0.3649, + "step": 11685 + }, + { + "epoch": 0.93, + "learning_rate": 2.8704963048490243e-07, + "loss": 0.3233, + "step": 11686 + }, + { + "epoch": 0.93, + "learning_rate": 2.864395477251658e-07, + "loss": 0.3513, + "step": 11687 + }, + { + "epoch": 0.93, + "learning_rate": 2.858301045566447e-07, + "loss": 0.3288, + "step": 11688 + }, + { + "epoch": 0.93, + "learning_rate": 2.8522130101947045e-07, + "loss": 0.2511, + "step": 11689 + }, + { + "epoch": 0.93, + "learning_rate": 2.8461313715372976e-07, + "loss": 0.381, + "step": 11690 + }, + { + "epoch": 0.93, + "learning_rate": 2.8400561299946503e-07, + "loss": 0.362, + "step": 11691 + }, + { + "epoch": 0.93, + "learning_rate": 2.8339872859668103e-07, + "loss": 0.3384, + "step": 11692 + }, + { + "epoch": 0.93, + "learning_rate": 2.82792483985338e-07, + "loss": 0.3846, + "step": 11693 + }, + { + "epoch": 0.93, + "learning_rate": 2.8218687920535395e-07, + "loss": 0.3181, + "step": 11694 + }, + { + "epoch": 0.93, + "learning_rate": 2.8158191429660364e-07, + "loss": 0.3638, + "step": 11695 + }, + { + "epoch": 0.93, + "learning_rate": 2.8097758929892196e-07, + "loss": 0.2576, + "step": 11696 + }, + { + "epoch": 0.93, + "learning_rate": 2.803739042521025e-07, + "loss": 0.3227, + "step": 11697 + }, + { + "epoch": 0.93, + "learning_rate": 2.7977085919589253e-07, + "loss": 0.3963, + "step": 11698 + }, + { + "epoch": 0.93, + "learning_rate": 2.791684541700013e-07, + "loss": 0.3538, + "step": 11699 + }, + { + "epoch": 0.93, + "learning_rate": 2.785666892140937e-07, + "loss": 0.3389, + "step": 11700 + }, + { + "epoch": 0.93, + "learning_rate": 2.7796556436779144e-07, + "loss": 0.3022, + "step": 11701 + }, + { + "epoch": 0.93, + "learning_rate": 2.773650796706795e-07, + "loss": 0.299, + "step": 11702 + }, + { + "epoch": 0.93, + "learning_rate": 2.7676523516229404e-07, + "loss": 0.2919, + "step": 11703 + }, + { + "epoch": 0.93, + "learning_rate": 2.7616603088213126e-07, + "loss": 0.2706, + "step": 11704 + }, + { + "epoch": 0.93, + "learning_rate": 2.755674668696495e-07, + "loss": 0.3859, + "step": 11705 + }, + { + "epoch": 0.93, + "learning_rate": 2.749695431642574e-07, + "loss": 0.2895, + "step": 11706 + }, + { + "epoch": 0.93, + "learning_rate": 2.743722598053278e-07, + "loss": 0.3838, + "step": 11707 + }, + { + "epoch": 0.93, + "learning_rate": 2.737756168321881e-07, + "loss": 0.3584, + "step": 11708 + }, + { + "epoch": 0.93, + "learning_rate": 2.7317961428412475e-07, + "loss": 0.3963, + "step": 11709 + }, + { + "epoch": 0.93, + "learning_rate": 2.7258425220038077e-07, + "loss": 0.4228, + "step": 11710 + }, + { + "epoch": 0.93, + "learning_rate": 2.719895306201581e-07, + "loss": 0.3055, + "step": 11711 + }, + { + "epoch": 0.93, + "learning_rate": 2.7139544958261765e-07, + "loss": 0.2924, + "step": 11712 + }, + { + "epoch": 0.93, + "learning_rate": 2.7080200912687484e-07, + "loss": 0.3537, + "step": 11713 + }, + { + "epoch": 0.93, + "learning_rate": 2.702092092920061e-07, + "loss": 0.378, + "step": 11714 + }, + { + "epoch": 0.93, + "learning_rate": 2.6961705011704475e-07, + "loss": 0.4392, + "step": 11715 + }, + { + "epoch": 0.93, + "learning_rate": 2.6902553164098065e-07, + "loss": 0.394, + "step": 11716 + }, + { + "epoch": 0.93, + "learning_rate": 2.684346539027616e-07, + "loss": 0.3761, + "step": 11717 + }, + { + "epoch": 0.93, + "learning_rate": 2.6784441694129747e-07, + "loss": 0.3345, + "step": 11718 + }, + { + "epoch": 0.93, + "learning_rate": 2.672548207954495e-07, + "loss": 0.3235, + "step": 11719 + }, + { + "epoch": 0.93, + "learning_rate": 2.6666586550403884e-07, + "loss": 0.445, + "step": 11720 + }, + { + "epoch": 0.93, + "learning_rate": 2.6607755110584886e-07, + "loss": 0.4057, + "step": 11721 + }, + { + "epoch": 0.93, + "learning_rate": 2.654898776396164e-07, + "loss": 0.3921, + "step": 11722 + }, + { + "epoch": 0.93, + "learning_rate": 2.64902845144035e-07, + "loss": 0.2917, + "step": 11723 + }, + { + "epoch": 0.93, + "learning_rate": 2.6431645365775806e-07, + "loss": 0.3328, + "step": 11724 + }, + { + "epoch": 0.93, + "learning_rate": 2.637307032193992e-07, + "loss": 0.4322, + "step": 11725 + }, + { + "epoch": 0.93, + "learning_rate": 2.6314559386752423e-07, + "loss": 0.2794, + "step": 11726 + }, + { + "epoch": 0.93, + "learning_rate": 2.6256112564066236e-07, + "loss": 0.3299, + "step": 11727 + }, + { + "epoch": 0.93, + "learning_rate": 2.6197729857729617e-07, + "loss": 0.2591, + "step": 11728 + }, + { + "epoch": 0.93, + "learning_rate": 2.613941127158681e-07, + "loss": 0.3821, + "step": 11729 + }, + { + "epoch": 0.93, + "learning_rate": 2.608115680947787e-07, + "loss": 0.2495, + "step": 11730 + }, + { + "epoch": 0.93, + "learning_rate": 2.602296647523861e-07, + "loss": 0.3706, + "step": 11731 + }, + { + "epoch": 0.93, + "learning_rate": 2.596484027270041e-07, + "loss": 0.358, + "step": 11732 + }, + { + "epoch": 0.93, + "learning_rate": 2.5906778205690876e-07, + "loss": 0.2955, + "step": 11733 + }, + { + "epoch": 0.93, + "learning_rate": 2.5848780278032836e-07, + "loss": 0.3014, + "step": 11734 + }, + { + "epoch": 0.93, + "learning_rate": 2.579084649354546e-07, + "loss": 0.349, + "step": 11735 + }, + { + "epoch": 0.93, + "learning_rate": 2.5732976856043034e-07, + "loss": 0.2587, + "step": 11736 + }, + { + "epoch": 0.93, + "learning_rate": 2.5675171369336284e-07, + "loss": 0.279, + "step": 11737 + }, + { + "epoch": 0.93, + "learning_rate": 2.5617430037231495e-07, + "loss": 0.4973, + "step": 11738 + }, + { + "epoch": 0.93, + "learning_rate": 2.5559752863530295e-07, + "loss": 0.2975, + "step": 11739 + }, + { + "epoch": 0.93, + "learning_rate": 2.550213985203076e-07, + "loss": 0.2443, + "step": 11740 + }, + { + "epoch": 0.93, + "learning_rate": 2.54445910065263e-07, + "loss": 0.5825, + "step": 11741 + }, + { + "epoch": 0.93, + "learning_rate": 2.538710633080621e-07, + "loss": 0.2654, + "step": 11742 + }, + { + "epoch": 0.93, + "learning_rate": 2.5329685828655803e-07, + "loss": 0.2661, + "step": 11743 + }, + { + "epoch": 0.93, + "learning_rate": 2.527232950385572e-07, + "loss": 0.3758, + "step": 11744 + }, + { + "epoch": 0.93, + "learning_rate": 2.521503736018249e-07, + "loss": 0.2787, + "step": 11745 + }, + { + "epoch": 0.93, + "learning_rate": 2.5157809401408775e-07, + "loss": 0.3367, + "step": 11746 + }, + { + "epoch": 0.93, + "learning_rate": 2.510064563130277e-07, + "loss": 0.5051, + "step": 11747 + }, + { + "epoch": 0.93, + "learning_rate": 2.5043546053628245e-07, + "loss": 0.401, + "step": 11748 + }, + { + "epoch": 0.93, + "learning_rate": 2.498651067214497e-07, + "loss": 0.3376, + "step": 11749 + }, + { + "epoch": 0.93, + "learning_rate": 2.4929539490608614e-07, + "loss": 0.3189, + "step": 11750 + }, + { + "epoch": 0.93, + "learning_rate": 2.487263251277028e-07, + "loss": 0.4611, + "step": 11751 + }, + { + "epoch": 0.93, + "learning_rate": 2.481578974237697e-07, + "loss": 0.2737, + "step": 11752 + }, + { + "epoch": 0.93, + "learning_rate": 2.475901118317181e-07, + "loss": 0.4264, + "step": 11753 + }, + { + "epoch": 0.93, + "learning_rate": 2.4702296838893134e-07, + "loss": 0.3213, + "step": 11754 + }, + { + "epoch": 0.93, + "learning_rate": 2.464564671327529e-07, + "loss": 0.2517, + "step": 11755 + }, + { + "epoch": 0.93, + "learning_rate": 2.4589060810048635e-07, + "loss": 0.4419, + "step": 11756 + }, + { + "epoch": 0.93, + "learning_rate": 2.453253913293896e-07, + "loss": 0.3833, + "step": 11757 + }, + { + "epoch": 0.93, + "learning_rate": 2.447608168566784e-07, + "loss": 0.2836, + "step": 11758 + }, + { + "epoch": 0.93, + "learning_rate": 2.441968847195286e-07, + "loss": 0.2736, + "step": 11759 + }, + { + "epoch": 0.93, + "learning_rate": 2.4363359495507166e-07, + "loss": 0.3382, + "step": 11760 + }, + { + "epoch": 0.93, + "learning_rate": 2.430709476003978e-07, + "loss": 0.287, + "step": 11761 + }, + { + "epoch": 0.93, + "learning_rate": 2.425089426925553e-07, + "loss": 0.3048, + "step": 11762 + }, + { + "epoch": 0.93, + "learning_rate": 2.419475802685489e-07, + "loss": 0.3489, + "step": 11763 + }, + { + "epoch": 0.93, + "learning_rate": 2.413868603653413e-07, + "loss": 0.2669, + "step": 11764 + }, + { + "epoch": 0.93, + "learning_rate": 2.4082678301985297e-07, + "loss": 0.2986, + "step": 11765 + }, + { + "epoch": 0.93, + "learning_rate": 2.402673482689633e-07, + "loss": 0.349, + "step": 11766 + }, + { + "epoch": 0.93, + "learning_rate": 2.3970855614950827e-07, + "loss": 0.5069, + "step": 11767 + }, + { + "epoch": 0.93, + "learning_rate": 2.3915040669828084e-07, + "loss": 0.2991, + "step": 11768 + }, + { + "epoch": 0.93, + "learning_rate": 2.385928999520326e-07, + "loss": 0.4161, + "step": 11769 + }, + { + "epoch": 0.93, + "learning_rate": 2.3803603594747427e-07, + "loss": 0.4035, + "step": 11770 + }, + { + "epoch": 0.93, + "learning_rate": 2.374798147212698e-07, + "loss": 0.2354, + "step": 11771 + }, + { + "epoch": 0.93, + "learning_rate": 2.3692423631004658e-07, + "loss": 0.3413, + "step": 11772 + }, + { + "epoch": 0.93, + "learning_rate": 2.3636930075038534e-07, + "loss": 0.3375, + "step": 11773 + }, + { + "epoch": 0.93, + "learning_rate": 2.3581500807882462e-07, + "loss": 0.3348, + "step": 11774 + }, + { + "epoch": 0.93, + "learning_rate": 2.3526135833186527e-07, + "loss": 0.2816, + "step": 11775 + }, + { + "epoch": 0.93, + "learning_rate": 2.3470835154595918e-07, + "loss": 0.3961, + "step": 11776 + }, + { + "epoch": 0.93, + "learning_rate": 2.3415598775752057e-07, + "loss": 0.2876, + "step": 11777 + }, + { + "epoch": 0.93, + "learning_rate": 2.3360426700292038e-07, + "loss": 0.3331, + "step": 11778 + }, + { + "epoch": 0.93, + "learning_rate": 2.330531893184873e-07, + "loss": 0.346, + "step": 11779 + }, + { + "epoch": 0.93, + "learning_rate": 2.3250275474050565e-07, + "loss": 0.274, + "step": 11780 + }, + { + "epoch": 0.93, + "learning_rate": 2.3195296330521756e-07, + "loss": 0.3279, + "step": 11781 + }, + { + "epoch": 0.93, + "learning_rate": 2.3140381504882736e-07, + "loss": 0.2136, + "step": 11782 + }, + { + "epoch": 0.93, + "learning_rate": 2.3085531000749285e-07, + "loss": 0.3006, + "step": 11783 + }, + { + "epoch": 0.93, + "learning_rate": 2.3030744821732953e-07, + "loss": 0.2777, + "step": 11784 + }, + { + "epoch": 0.93, + "learning_rate": 2.297602297144119e-07, + "loss": 0.3766, + "step": 11785 + }, + { + "epoch": 0.93, + "learning_rate": 2.2921365453477229e-07, + "loss": 0.3083, + "step": 11786 + }, + { + "epoch": 0.93, + "learning_rate": 2.286677227143985e-07, + "loss": 0.2939, + "step": 11787 + }, + { + "epoch": 0.93, + "learning_rate": 2.2812243428923964e-07, + "loss": 0.3919, + "step": 11788 + }, + { + "epoch": 0.93, + "learning_rate": 2.2757778929519914e-07, + "loss": 0.2999, + "step": 11789 + }, + { + "epoch": 0.93, + "learning_rate": 2.2703378776813833e-07, + "loss": 0.4328, + "step": 11790 + }, + { + "epoch": 0.93, + "learning_rate": 2.2649042974387858e-07, + "loss": 0.2964, + "step": 11791 + }, + { + "epoch": 0.93, + "learning_rate": 2.259477152581979e-07, + "loss": 0.3273, + "step": 11792 + }, + { + "epoch": 0.93, + "learning_rate": 2.2540564434682998e-07, + "loss": 0.3541, + "step": 11793 + }, + { + "epoch": 0.93, + "learning_rate": 2.2486421704546623e-07, + "loss": 0.3538, + "step": 11794 + }, + { + "epoch": 0.93, + "learning_rate": 2.2432343338976038e-07, + "loss": 0.3717, + "step": 11795 + }, + { + "epoch": 0.93, + "learning_rate": 2.2378329341531946e-07, + "loss": 0.3129, + "step": 11796 + }, + { + "epoch": 0.93, + "learning_rate": 2.2324379715770728e-07, + "loss": 0.3536, + "step": 11797 + }, + { + "epoch": 0.93, + "learning_rate": 2.2270494465244874e-07, + "loss": 0.2823, + "step": 11798 + }, + { + "epoch": 0.93, + "learning_rate": 2.2216673593502437e-07, + "loss": 0.2901, + "step": 11799 + }, + { + "epoch": 0.93, + "learning_rate": 2.2162917104087245e-07, + "loss": 0.3755, + "step": 11800 + }, + { + "epoch": 0.93, + "learning_rate": 2.2109225000538915e-07, + "loss": 0.4441, + "step": 11801 + }, + { + "epoch": 0.93, + "learning_rate": 2.2055597286392838e-07, + "loss": 0.286, + "step": 11802 + }, + { + "epoch": 0.94, + "learning_rate": 2.200203396517997e-07, + "loss": 0.301, + "step": 11803 + }, + { + "epoch": 0.94, + "learning_rate": 2.19485350404276e-07, + "loss": 0.3412, + "step": 11804 + }, + { + "epoch": 0.94, + "learning_rate": 2.1895100515658019e-07, + "loss": 0.4043, + "step": 11805 + }, + { + "epoch": 0.94, + "learning_rate": 2.1841730394389527e-07, + "loss": 0.4151, + "step": 11806 + }, + { + "epoch": 0.94, + "learning_rate": 2.1788424680136756e-07, + "loss": 0.2842, + "step": 11807 + }, + { + "epoch": 0.94, + "learning_rate": 2.173518337640923e-07, + "loss": 0.3538, + "step": 11808 + }, + { + "epoch": 0.94, + "learning_rate": 2.1682006486712703e-07, + "loss": 0.2886, + "step": 11809 + }, + { + "epoch": 0.94, + "learning_rate": 2.1628894014548819e-07, + "loss": 0.3993, + "step": 11810 + }, + { + "epoch": 0.94, + "learning_rate": 2.1575845963414555e-07, + "loss": 0.36, + "step": 11811 + }, + { + "epoch": 0.94, + "learning_rate": 2.1522862336803008e-07, + "loss": 0.3347, + "step": 11812 + }, + { + "epoch": 0.94, + "learning_rate": 2.146994313820283e-07, + "loss": 0.2824, + "step": 11813 + }, + { + "epoch": 0.94, + "learning_rate": 2.141708837109846e-07, + "loss": 0.3095, + "step": 11814 + }, + { + "epoch": 0.94, + "learning_rate": 2.136429803897022e-07, + "loss": 0.4379, + "step": 11815 + }, + { + "epoch": 0.94, + "learning_rate": 2.1311572145294114e-07, + "loss": 0.3865, + "step": 11816 + }, + { + "epoch": 0.94, + "learning_rate": 2.1258910693541802e-07, + "loss": 0.2476, + "step": 11817 + }, + { + "epoch": 0.94, + "learning_rate": 2.1206313687180845e-07, + "loss": 0.445, + "step": 11818 + }, + { + "epoch": 0.94, + "learning_rate": 2.1153781129674367e-07, + "loss": 0.2497, + "step": 11819 + }, + { + "epoch": 0.94, + "learning_rate": 2.1101313024481595e-07, + "loss": 0.3517, + "step": 11820 + }, + { + "epoch": 0.94, + "learning_rate": 2.1048909375057103e-07, + "loss": 0.4294, + "step": 11821 + }, + { + "epoch": 0.94, + "learning_rate": 2.0996570184851572e-07, + "loss": 0.2793, + "step": 11822 + }, + { + "epoch": 0.94, + "learning_rate": 2.0944295457311247e-07, + "loss": 0.4086, + "step": 11823 + }, + { + "epoch": 0.94, + "learning_rate": 2.0892085195878154e-07, + "loss": 0.412, + "step": 11824 + }, + { + "epoch": 0.94, + "learning_rate": 2.0839939403989984e-07, + "loss": 0.2418, + "step": 11825 + }, + { + "epoch": 0.94, + "learning_rate": 2.078785808508055e-07, + "loss": 0.468, + "step": 11826 + }, + { + "epoch": 0.94, + "learning_rate": 2.0735841242578992e-07, + "loss": 0.2857, + "step": 11827 + }, + { + "epoch": 0.94, + "learning_rate": 2.068388887991013e-07, + "loss": 0.2975, + "step": 11828 + }, + { + "epoch": 0.94, + "learning_rate": 2.0632001000495228e-07, + "loss": 0.3571, + "step": 11829 + }, + { + "epoch": 0.94, + "learning_rate": 2.0580177607750663e-07, + "loss": 0.3448, + "step": 11830 + }, + { + "epoch": 0.94, + "learning_rate": 2.0528418705088592e-07, + "loss": 0.3735, + "step": 11831 + }, + { + "epoch": 0.94, + "learning_rate": 2.0476724295917294e-07, + "loss": 0.4129, + "step": 11832 + }, + { + "epoch": 0.94, + "learning_rate": 2.04250943836406e-07, + "loss": 0.2834, + "step": 11833 + }, + { + "epoch": 0.94, + "learning_rate": 2.0373528971658009e-07, + "loss": 0.3244, + "step": 11834 + }, + { + "epoch": 0.94, + "learning_rate": 2.0322028063364806e-07, + "loss": 0.3979, + "step": 11835 + }, + { + "epoch": 0.94, + "learning_rate": 2.0270591662152173e-07, + "loss": 0.3357, + "step": 11836 + }, + { + "epoch": 0.94, + "learning_rate": 2.0219219771406952e-07, + "loss": 0.3396, + "step": 11837 + }, + { + "epoch": 0.94, + "learning_rate": 2.0167912394511657e-07, + "loss": 0.4665, + "step": 11838 + }, + { + "epoch": 0.94, + "learning_rate": 2.01166695348447e-07, + "loss": 0.4584, + "step": 11839 + }, + { + "epoch": 0.94, + "learning_rate": 2.0065491195780163e-07, + "loss": 0.4089, + "step": 11840 + }, + { + "epoch": 0.94, + "learning_rate": 2.00143773806879e-07, + "loss": 0.4239, + "step": 11841 + }, + { + "epoch": 0.94, + "learning_rate": 1.9963328092933444e-07, + "loss": 0.34, + "step": 11842 + }, + { + "epoch": 0.94, + "learning_rate": 1.9912343335878326e-07, + "loss": 0.4061, + "step": 11843 + }, + { + "epoch": 0.94, + "learning_rate": 1.9861423112879308e-07, + "loss": 0.2628, + "step": 11844 + }, + { + "epoch": 0.94, + "learning_rate": 1.9810567427289596e-07, + "loss": 0.2885, + "step": 11845 + }, + { + "epoch": 0.94, + "learning_rate": 1.9759776282457731e-07, + "loss": 0.3492, + "step": 11846 + }, + { + "epoch": 0.94, + "learning_rate": 1.970904968172771e-07, + "loss": 0.3196, + "step": 11847 + }, + { + "epoch": 0.94, + "learning_rate": 1.965838762844019e-07, + "loss": 0.3619, + "step": 11848 + }, + { + "epoch": 0.94, + "learning_rate": 1.9607790125930614e-07, + "loss": 0.4205, + "step": 11849 + }, + { + "epoch": 0.94, + "learning_rate": 1.9557257177530763e-07, + "loss": 0.4101, + "step": 11850 + }, + { + "epoch": 0.94, + "learning_rate": 1.9506788786567865e-07, + "loss": 0.3581, + "step": 11851 + }, + { + "epoch": 0.94, + "learning_rate": 1.9456384956365149e-07, + "loss": 0.3686, + "step": 11852 + }, + { + "epoch": 0.94, + "learning_rate": 1.9406045690241404e-07, + "loss": 0.2948, + "step": 11853 + }, + { + "epoch": 0.94, + "learning_rate": 1.935577099151109e-07, + "loss": 0.2695, + "step": 11854 + }, + { + "epoch": 0.94, + "learning_rate": 1.9305560863484896e-07, + "loss": 0.3987, + "step": 11855 + }, + { + "epoch": 0.94, + "learning_rate": 1.9255415309468618e-07, + "loss": 0.3763, + "step": 11856 + }, + { + "epoch": 0.94, + "learning_rate": 1.920533433276417e-07, + "loss": 0.3581, + "step": 11857 + }, + { + "epoch": 0.94, + "learning_rate": 1.9155317936669248e-07, + "loss": 0.3356, + "step": 11858 + }, + { + "epoch": 0.94, + "learning_rate": 1.910536612447711e-07, + "loss": 0.4097, + "step": 11859 + }, + { + "epoch": 0.94, + "learning_rate": 1.9055478899476788e-07, + "loss": 0.3218, + "step": 11860 + }, + { + "epoch": 0.94, + "learning_rate": 1.900565626495332e-07, + "loss": 0.4581, + "step": 11861 + }, + { + "epoch": 0.94, + "learning_rate": 1.8955898224187086e-07, + "loss": 0.2684, + "step": 11862 + }, + { + "epoch": 0.94, + "learning_rate": 1.890620478045435e-07, + "loss": 0.3749, + "step": 11863 + }, + { + "epoch": 0.94, + "learning_rate": 1.8856575937027388e-07, + "loss": 0.3001, + "step": 11864 + }, + { + "epoch": 0.94, + "learning_rate": 1.8807011697174027e-07, + "loss": 0.2684, + "step": 11865 + }, + { + "epoch": 0.94, + "learning_rate": 1.8757512064157658e-07, + "loss": 0.3446, + "step": 11866 + }, + { + "epoch": 0.94, + "learning_rate": 1.870807704123756e-07, + "loss": 0.4606, + "step": 11867 + }, + { + "epoch": 0.94, + "learning_rate": 1.8658706631669133e-07, + "loss": 0.2566, + "step": 11868 + }, + { + "epoch": 0.94, + "learning_rate": 1.8609400838702884e-07, + "loss": 0.3273, + "step": 11869 + }, + { + "epoch": 0.94, + "learning_rate": 1.856015966558533e-07, + "loss": 0.2845, + "step": 11870 + }, + { + "epoch": 0.94, + "learning_rate": 1.8510983115558988e-07, + "loss": 0.3022, + "step": 11871 + }, + { + "epoch": 0.94, + "learning_rate": 1.8461871191861825e-07, + "loss": 0.3068, + "step": 11872 + }, + { + "epoch": 0.94, + "learning_rate": 1.8412823897727473e-07, + "loss": 0.4241, + "step": 11873 + }, + { + "epoch": 0.94, + "learning_rate": 1.8363841236385571e-07, + "loss": 0.2321, + "step": 11874 + }, + { + "epoch": 0.94, + "learning_rate": 1.8314923211061542e-07, + "loss": 0.2779, + "step": 11875 + }, + { + "epoch": 0.94, + "learning_rate": 1.826606982497603e-07, + "loss": 0.2645, + "step": 11876 + }, + { + "epoch": 0.94, + "learning_rate": 1.8217281081346238e-07, + "loss": 0.4018, + "step": 11877 + }, + { + "epoch": 0.94, + "learning_rate": 1.8168556983384377e-07, + "loss": 0.3601, + "step": 11878 + }, + { + "epoch": 0.94, + "learning_rate": 1.811989753429877e-07, + "loss": 0.3427, + "step": 11879 + }, + { + "epoch": 0.94, + "learning_rate": 1.8071302737293294e-07, + "loss": 0.3797, + "step": 11880 + }, + { + "epoch": 0.94, + "learning_rate": 1.802277259556784e-07, + "loss": 0.298, + "step": 11881 + }, + { + "epoch": 0.94, + "learning_rate": 1.7974307112317957e-07, + "loss": 0.3198, + "step": 11882 + }, + { + "epoch": 0.94, + "learning_rate": 1.7925906290734653e-07, + "loss": 0.2956, + "step": 11883 + }, + { + "epoch": 0.94, + "learning_rate": 1.787757013400504e-07, + "loss": 0.2855, + "step": 11884 + }, + { + "epoch": 0.94, + "learning_rate": 1.7829298645311688e-07, + "loss": 0.4363, + "step": 11885 + }, + { + "epoch": 0.94, + "learning_rate": 1.7781091827833164e-07, + "loss": 0.3112, + "step": 11886 + }, + { + "epoch": 0.94, + "learning_rate": 1.7732949684743593e-07, + "loss": 0.3897, + "step": 11887 + }, + { + "epoch": 0.94, + "learning_rate": 1.768487221921278e-07, + "loss": 0.3021, + "step": 11888 + }, + { + "epoch": 0.94, + "learning_rate": 1.763685943440674e-07, + "loss": 0.3569, + "step": 11889 + }, + { + "epoch": 0.94, + "learning_rate": 1.7588911333486614e-07, + "loss": 0.3313, + "step": 11890 + }, + { + "epoch": 0.94, + "learning_rate": 1.7541027919609545e-07, + "loss": 0.2788, + "step": 11891 + }, + { + "epoch": 0.94, + "learning_rate": 1.7493209195928562e-07, + "loss": 0.3118, + "step": 11892 + }, + { + "epoch": 0.94, + "learning_rate": 1.7445455165592262e-07, + "loss": 0.3422, + "step": 11893 + }, + { + "epoch": 0.94, + "learning_rate": 1.7397765831744905e-07, + "loss": 0.3713, + "step": 11894 + }, + { + "epoch": 0.94, + "learning_rate": 1.7350141197526648e-07, + "loss": 0.3567, + "step": 11895 + }, + { + "epoch": 0.94, + "learning_rate": 1.7302581266073537e-07, + "loss": 0.1848, + "step": 11896 + }, + { + "epoch": 0.94, + "learning_rate": 1.7255086040516954e-07, + "loss": 0.2512, + "step": 11897 + }, + { + "epoch": 0.94, + "learning_rate": 1.7207655523984179e-07, + "loss": 0.3882, + "step": 11898 + }, + { + "epoch": 0.94, + "learning_rate": 1.71602897195986e-07, + "loss": 0.4586, + "step": 11899 + }, + { + "epoch": 0.94, + "learning_rate": 1.711298863047872e-07, + "loss": 0.3511, + "step": 11900 + }, + { + "epoch": 0.94, + "learning_rate": 1.7065752259739056e-07, + "loss": 0.4553, + "step": 11901 + }, + { + "epoch": 0.94, + "learning_rate": 1.701858061049022e-07, + "loss": 0.3984, + "step": 11902 + }, + { + "epoch": 0.94, + "learning_rate": 1.697147368583796e-07, + "loss": 0.4776, + "step": 11903 + }, + { + "epoch": 0.94, + "learning_rate": 1.692443148888412e-07, + "loss": 0.385, + "step": 11904 + }, + { + "epoch": 0.94, + "learning_rate": 1.6877454022726225e-07, + "loss": 0.3512, + "step": 11905 + }, + { + "epoch": 0.94, + "learning_rate": 1.6830541290457468e-07, + "loss": 0.3157, + "step": 11906 + }, + { + "epoch": 0.94, + "learning_rate": 1.6783693295166935e-07, + "loss": 0.3466, + "step": 11907 + }, + { + "epoch": 0.94, + "learning_rate": 1.6736910039939159e-07, + "loss": 0.3863, + "step": 11908 + }, + { + "epoch": 0.94, + "learning_rate": 1.6690191527854782e-07, + "loss": 0.304, + "step": 11909 + }, + { + "epoch": 0.94, + "learning_rate": 1.6643537761989904e-07, + "loss": 0.3777, + "step": 11910 + }, + { + "epoch": 0.94, + "learning_rate": 1.6596948745416397e-07, + "loss": 0.3264, + "step": 11911 + }, + { + "epoch": 0.94, + "learning_rate": 1.6550424481202032e-07, + "loss": 0.3771, + "step": 11912 + }, + { + "epoch": 0.94, + "learning_rate": 1.6503964972410136e-07, + "loss": 0.4353, + "step": 11913 + }, + { + "epoch": 0.94, + "learning_rate": 1.6457570222099816e-07, + "loss": 0.2802, + "step": 11914 + }, + { + "epoch": 0.94, + "learning_rate": 1.6411240233326076e-07, + "loss": 0.3132, + "step": 11915 + }, + { + "epoch": 0.94, + "learning_rate": 1.6364975009139473e-07, + "loss": 0.4515, + "step": 11916 + }, + { + "epoch": 0.94, + "learning_rate": 1.6318774552586237e-07, + "loss": 0.2927, + "step": 11917 + }, + { + "epoch": 0.94, + "learning_rate": 1.627263886670849e-07, + "loss": 0.35, + "step": 11918 + }, + { + "epoch": 0.94, + "learning_rate": 1.6226567954544248e-07, + "loss": 0.3943, + "step": 11919 + }, + { + "epoch": 0.94, + "learning_rate": 1.618056181912675e-07, + "loss": 0.3562, + "step": 11920 + }, + { + "epoch": 0.94, + "learning_rate": 1.6134620463485352e-07, + "loss": 0.2483, + "step": 11921 + }, + { + "epoch": 0.94, + "learning_rate": 1.6088743890645297e-07, + "loss": 0.3535, + "step": 11922 + }, + { + "epoch": 0.94, + "learning_rate": 1.6042932103627174e-07, + "loss": 0.3626, + "step": 11923 + }, + { + "epoch": 0.94, + "learning_rate": 1.5997185105447344e-07, + "loss": 0.321, + "step": 11924 + }, + { + "epoch": 0.94, + "learning_rate": 1.5951502899118176e-07, + "loss": 0.2716, + "step": 11925 + }, + { + "epoch": 0.94, + "learning_rate": 1.590588548764771e-07, + "loss": 0.319, + "step": 11926 + }, + { + "epoch": 0.94, + "learning_rate": 1.586033287403943e-07, + "loss": 0.3206, + "step": 11927 + }, + { + "epoch": 0.94, + "learning_rate": 1.5814845061292938e-07, + "loss": 0.2493, + "step": 11928 + }, + { + "epoch": 0.95, + "learning_rate": 1.5769422052403172e-07, + "loss": 0.2501, + "step": 11929 + }, + { + "epoch": 0.95, + "learning_rate": 1.572406385036118e-07, + "loss": 0.301, + "step": 11930 + }, + { + "epoch": 0.95, + "learning_rate": 1.5678770458153693e-07, + "loss": 0.3719, + "step": 11931 + }, + { + "epoch": 0.95, + "learning_rate": 1.563354187876287e-07, + "loss": 0.3067, + "step": 11932 + }, + { + "epoch": 0.95, + "learning_rate": 1.558837811516667e-07, + "loss": 0.4187, + "step": 11933 + }, + { + "epoch": 0.95, + "learning_rate": 1.5543279170339265e-07, + "loss": 0.2284, + "step": 11934 + }, + { + "epoch": 0.95, + "learning_rate": 1.5498245047249948e-07, + "loss": 0.4684, + "step": 11935 + }, + { + "epoch": 0.95, + "learning_rate": 1.5453275748864128e-07, + "loss": 0.2716, + "step": 11936 + }, + { + "epoch": 0.95, + "learning_rate": 1.5408371278142652e-07, + "loss": 0.4626, + "step": 11937 + }, + { + "epoch": 0.95, + "learning_rate": 1.5363531638042494e-07, + "loss": 0.3279, + "step": 11938 + }, + { + "epoch": 0.95, + "learning_rate": 1.5318756831516069e-07, + "loss": 0.2929, + "step": 11939 + }, + { + "epoch": 0.95, + "learning_rate": 1.5274046861511348e-07, + "loss": 0.2696, + "step": 11940 + }, + { + "epoch": 0.95, + "learning_rate": 1.5229401730972536e-07, + "loss": 0.409, + "step": 11941 + }, + { + "epoch": 0.95, + "learning_rate": 1.518482144283917e-07, + "loss": 0.4784, + "step": 11942 + }, + { + "epoch": 0.95, + "learning_rate": 1.514030600004668e-07, + "loss": 0.3188, + "step": 11943 + }, + { + "epoch": 0.95, + "learning_rate": 1.5095855405526272e-07, + "loss": 0.4168, + "step": 11944 + }, + { + "epoch": 0.95, + "learning_rate": 1.505146966220461e-07, + "loss": 0.3168, + "step": 11945 + }, + { + "epoch": 0.95, + "learning_rate": 1.5007148773004466e-07, + "loss": 0.2914, + "step": 11946 + }, + { + "epoch": 0.95, + "learning_rate": 1.496289274084417e-07, + "loss": 0.3869, + "step": 11947 + }, + { + "epoch": 0.95, + "learning_rate": 1.4918701568637618e-07, + "loss": 0.4282, + "step": 11948 + }, + { + "epoch": 0.95, + "learning_rate": 1.4874575259294588e-07, + "loss": 0.3895, + "step": 11949 + }, + { + "epoch": 0.95, + "learning_rate": 1.483051381572076e-07, + "loss": 0.3077, + "step": 11950 + }, + { + "epoch": 0.95, + "learning_rate": 1.4786517240817255e-07, + "loss": 0.3333, + "step": 11951 + }, + { + "epoch": 0.95, + "learning_rate": 1.474258553748098e-07, + "loss": 0.3773, + "step": 11952 + }, + { + "epoch": 0.95, + "learning_rate": 1.469871870860473e-07, + "loss": 0.3165, + "step": 11953 + }, + { + "epoch": 0.95, + "learning_rate": 1.4654916757076865e-07, + "loss": 0.3832, + "step": 11954 + }, + { + "epoch": 0.95, + "learning_rate": 1.461117968578163e-07, + "loss": 0.2916, + "step": 11955 + }, + { + "epoch": 0.95, + "learning_rate": 1.4567507497598722e-07, + "loss": 0.2404, + "step": 11956 + }, + { + "epoch": 0.95, + "learning_rate": 1.452390019540384e-07, + "loss": 0.4709, + "step": 11957 + }, + { + "epoch": 0.95, + "learning_rate": 1.4480357782068467e-07, + "loss": 0.3138, + "step": 11958 + }, + { + "epoch": 0.95, + "learning_rate": 1.4436880260459307e-07, + "loss": 0.3224, + "step": 11959 + }, + { + "epoch": 0.95, + "learning_rate": 1.4393467633439629e-07, + "loss": 0.3625, + "step": 11960 + }, + { + "epoch": 0.95, + "learning_rate": 1.4350119903867477e-07, + "loss": 0.3212, + "step": 11961 + }, + { + "epoch": 0.95, + "learning_rate": 1.4306837074597235e-07, + "loss": 0.2987, + "step": 11962 + }, + { + "epoch": 0.95, + "learning_rate": 1.426361914847907e-07, + "loss": 0.2815, + "step": 11963 + }, + { + "epoch": 0.95, + "learning_rate": 1.422046612835848e-07, + "loss": 0.3263, + "step": 11964 + }, + { + "epoch": 0.95, + "learning_rate": 1.417737801707686e-07, + "loss": 0.4626, + "step": 11965 + }, + { + "epoch": 0.95, + "learning_rate": 1.4134354817471497e-07, + "loss": 0.3521, + "step": 11966 + }, + { + "epoch": 0.95, + "learning_rate": 1.4091396532375123e-07, + "loss": 0.5522, + "step": 11967 + }, + { + "epoch": 0.95, + "learning_rate": 1.4048503164616367e-07, + "loss": 0.2998, + "step": 11968 + }, + { + "epoch": 0.95, + "learning_rate": 1.4005674717019746e-07, + "loss": 0.4665, + "step": 11969 + }, + { + "epoch": 0.95, + "learning_rate": 1.3962911192405004e-07, + "loss": 0.4066, + "step": 11970 + }, + { + "epoch": 0.95, + "learning_rate": 1.3920212593588113e-07, + "loss": 0.4556, + "step": 11971 + }, + { + "epoch": 0.95, + "learning_rate": 1.3877578923380486e-07, + "loss": 0.3271, + "step": 11972 + }, + { + "epoch": 0.95, + "learning_rate": 1.3835010184589325e-07, + "loss": 0.3563, + "step": 11973 + }, + { + "epoch": 0.95, + "learning_rate": 1.3792506380017612e-07, + "loss": 0.3767, + "step": 11974 + }, + { + "epoch": 0.95, + "learning_rate": 1.3750067512464105e-07, + "loss": 0.2213, + "step": 11975 + }, + { + "epoch": 0.95, + "learning_rate": 1.3707693584723124e-07, + "loss": 0.3284, + "step": 11976 + }, + { + "epoch": 0.95, + "learning_rate": 1.3665384599584774e-07, + "loss": 0.3188, + "step": 11977 + }, + { + "epoch": 0.95, + "learning_rate": 1.3623140559834824e-07, + "loss": 0.4382, + "step": 11978 + }, + { + "epoch": 0.95, + "learning_rate": 1.358096146825505e-07, + "loss": 0.3339, + "step": 11979 + }, + { + "epoch": 0.95, + "learning_rate": 1.353884732762256e-07, + "loss": 0.1687, + "step": 11980 + }, + { + "epoch": 0.95, + "learning_rate": 1.3496798140710365e-07, + "loss": 0.2783, + "step": 11981 + }, + { + "epoch": 0.95, + "learning_rate": 1.3454813910287358e-07, + "loss": 0.3878, + "step": 11982 + }, + { + "epoch": 0.95, + "learning_rate": 1.341289463911788e-07, + "loss": 0.4403, + "step": 11983 + }, + { + "epoch": 0.95, + "learning_rate": 1.337104032996206e-07, + "loss": 0.238, + "step": 11984 + }, + { + "epoch": 0.95, + "learning_rate": 1.3329250985575915e-07, + "loss": 0.314, + "step": 11985 + }, + { + "epoch": 0.95, + "learning_rate": 1.3287526608711132e-07, + "loss": 0.4486, + "step": 11986 + }, + { + "epoch": 0.95, + "learning_rate": 1.324586720211485e-07, + "loss": 0.3134, + "step": 11987 + }, + { + "epoch": 0.95, + "learning_rate": 1.3204272768530313e-07, + "loss": 0.3885, + "step": 11988 + }, + { + "epoch": 0.95, + "learning_rate": 1.3162743310696224e-07, + "loss": 0.3606, + "step": 11989 + }, + { + "epoch": 0.95, + "learning_rate": 1.3121278831347172e-07, + "loss": 0.3615, + "step": 11990 + }, + { + "epoch": 0.95, + "learning_rate": 1.3079879333213308e-07, + "loss": 0.3362, + "step": 11991 + }, + { + "epoch": 0.95, + "learning_rate": 1.303854481902067e-07, + "loss": 0.3612, + "step": 11992 + }, + { + "epoch": 0.95, + "learning_rate": 1.2997275291490863e-07, + "loss": 0.35, + "step": 11993 + }, + { + "epoch": 0.95, + "learning_rate": 1.2956070753341265e-07, + "loss": 0.4458, + "step": 11994 + }, + { + "epoch": 0.95, + "learning_rate": 1.2914931207285154e-07, + "loss": 0.287, + "step": 11995 + }, + { + "epoch": 0.95, + "learning_rate": 1.2873856656031358e-07, + "loss": 0.4596, + "step": 11996 + }, + { + "epoch": 0.95, + "learning_rate": 1.2832847102284162e-07, + "loss": 0.2645, + "step": 11997 + }, + { + "epoch": 0.95, + "learning_rate": 1.2791902548744185e-07, + "loss": 0.3687, + "step": 11998 + }, + { + "epoch": 0.95, + "learning_rate": 1.2751022998107154e-07, + "loss": 0.4703, + "step": 11999 + }, + { + "epoch": 0.95, + "learning_rate": 1.271020845306492e-07, + "loss": 0.2924, + "step": 12000 + }, + { + "epoch": 0.95, + "learning_rate": 1.2669458916305112e-07, + "loss": 0.3642, + "step": 12001 + }, + { + "epoch": 0.95, + "learning_rate": 1.2628774390510578e-07, + "loss": 0.2501, + "step": 12002 + }, + { + "epoch": 0.95, + "learning_rate": 1.2588154878360293e-07, + "loss": 0.2683, + "step": 12003 + }, + { + "epoch": 0.95, + "learning_rate": 1.254760038252889e-07, + "loss": 0.4046, + "step": 12004 + }, + { + "epoch": 0.95, + "learning_rate": 1.2507110905686793e-07, + "loss": 0.3664, + "step": 12005 + }, + { + "epoch": 0.95, + "learning_rate": 1.2466686450499866e-07, + "loss": 0.3086, + "step": 12006 + }, + { + "epoch": 0.95, + "learning_rate": 1.242632701962987e-07, + "loss": 0.2434, + "step": 12007 + }, + { + "epoch": 0.95, + "learning_rate": 1.2386032615734345e-07, + "loss": 0.4294, + "step": 12008 + }, + { + "epoch": 0.95, + "learning_rate": 1.2345803241466504e-07, + "loss": 0.3445, + "step": 12009 + }, + { + "epoch": 0.95, + "learning_rate": 1.2305638899475226e-07, + "loss": 0.3634, + "step": 12010 + }, + { + "epoch": 0.95, + "learning_rate": 1.2265539592405173e-07, + "loss": 0.356, + "step": 12011 + }, + { + "epoch": 0.95, + "learning_rate": 1.222550532289668e-07, + "loss": 0.3416, + "step": 12012 + }, + { + "epoch": 0.95, + "learning_rate": 1.218553609358575e-07, + "loss": 0.3225, + "step": 12013 + }, + { + "epoch": 0.95, + "learning_rate": 1.214563190710416e-07, + "loss": 0.3416, + "step": 12014 + }, + { + "epoch": 0.95, + "learning_rate": 1.2105792766079594e-07, + "loss": 0.3409, + "step": 12015 + }, + { + "epoch": 0.95, + "learning_rate": 1.2066018673134948e-07, + "loss": 0.3026, + "step": 12016 + }, + { + "epoch": 0.95, + "learning_rate": 1.2026309630889465e-07, + "loss": 0.2941, + "step": 12017 + }, + { + "epoch": 0.95, + "learning_rate": 1.1986665641957718e-07, + "loss": 0.3789, + "step": 12018 + }, + { + "epoch": 0.95, + "learning_rate": 1.194708670894984e-07, + "loss": 0.358, + "step": 12019 + }, + { + "epoch": 0.95, + "learning_rate": 1.1907572834472303e-07, + "loss": 0.3342, + "step": 12020 + }, + { + "epoch": 0.95, + "learning_rate": 1.1868124021126582e-07, + "loss": 0.4099, + "step": 12021 + }, + { + "epoch": 0.95, + "learning_rate": 1.1828740271510375e-07, + "loss": 0.4195, + "step": 12022 + }, + { + "epoch": 0.95, + "learning_rate": 1.1789421588216721e-07, + "loss": 0.3122, + "step": 12023 + }, + { + "epoch": 0.95, + "learning_rate": 1.1750167973834769e-07, + "loss": 0.3789, + "step": 12024 + }, + { + "epoch": 0.95, + "learning_rate": 1.171097943094912e-07, + "loss": 0.3315, + "step": 12025 + }, + { + "epoch": 0.95, + "learning_rate": 1.1671855962140045e-07, + "loss": 0.3936, + "step": 12026 + }, + { + "epoch": 0.95, + "learning_rate": 1.1632797569983811e-07, + "loss": 0.3384, + "step": 12027 + }, + { + "epoch": 0.95, + "learning_rate": 1.1593804257052143e-07, + "loss": 0.4356, + "step": 12028 + }, + { + "epoch": 0.95, + "learning_rate": 1.1554876025912432e-07, + "loss": 0.3751, + "step": 12029 + }, + { + "epoch": 0.95, + "learning_rate": 1.151601287912818e-07, + "loss": 0.3594, + "step": 12030 + }, + { + "epoch": 0.95, + "learning_rate": 1.147721481925812e-07, + "loss": 0.3367, + "step": 12031 + }, + { + "epoch": 0.95, + "learning_rate": 1.1438481848856986e-07, + "loss": 0.4457, + "step": 12032 + }, + { + "epoch": 0.95, + "learning_rate": 1.1399813970475293e-07, + "loss": 0.4346, + "step": 12033 + }, + { + "epoch": 0.95, + "learning_rate": 1.1361211186658893e-07, + "loss": 0.3576, + "step": 12034 + }, + { + "epoch": 0.95, + "learning_rate": 1.1322673499949754e-07, + "loss": 0.2664, + "step": 12035 + }, + { + "epoch": 0.95, + "learning_rate": 1.1284200912885291e-07, + "loss": 0.3586, + "step": 12036 + }, + { + "epoch": 0.95, + "learning_rate": 1.1245793427998919e-07, + "loss": 0.31, + "step": 12037 + }, + { + "epoch": 0.95, + "learning_rate": 1.1207451047819396e-07, + "loss": 0.3332, + "step": 12038 + }, + { + "epoch": 0.95, + "learning_rate": 1.1169173774871478e-07, + "loss": 0.3389, + "step": 12039 + }, + { + "epoch": 0.95, + "learning_rate": 1.1130961611675484e-07, + "loss": 0.3719, + "step": 12040 + }, + { + "epoch": 0.95, + "learning_rate": 1.1092814560747511e-07, + "loss": 0.3624, + "step": 12041 + }, + { + "epoch": 0.95, + "learning_rate": 1.105473262459944e-07, + "loss": 0.2753, + "step": 12042 + }, + { + "epoch": 0.95, + "learning_rate": 1.1016715805738709e-07, + "loss": 0.341, + "step": 12043 + }, + { + "epoch": 0.95, + "learning_rate": 1.0978764106668538e-07, + "loss": 0.4127, + "step": 12044 + }, + { + "epoch": 0.95, + "learning_rate": 1.0940877529887928e-07, + "loss": 0.4583, + "step": 12045 + }, + { + "epoch": 0.95, + "learning_rate": 1.0903056077891438e-07, + "loss": 0.3567, + "step": 12046 + }, + { + "epoch": 0.95, + "learning_rate": 1.0865299753169522e-07, + "loss": 0.5136, + "step": 12047 + }, + { + "epoch": 0.95, + "learning_rate": 1.0827608558208192e-07, + "loss": 0.2778, + "step": 12048 + }, + { + "epoch": 0.95, + "learning_rate": 1.0789982495489238e-07, + "loss": 0.4075, + "step": 12049 + }, + { + "epoch": 0.95, + "learning_rate": 1.0752421567490123e-07, + "loss": 0.3112, + "step": 12050 + }, + { + "epoch": 0.95, + "learning_rate": 1.0714925776684093e-07, + "loss": 0.3075, + "step": 12051 + }, + { + "epoch": 0.95, + "learning_rate": 1.067749512554006e-07, + "loss": 0.416, + "step": 12052 + }, + { + "epoch": 0.95, + "learning_rate": 1.0640129616522721e-07, + "loss": 0.3218, + "step": 12053 + }, + { + "epoch": 0.95, + "learning_rate": 1.0602829252092328e-07, + "loss": 0.2568, + "step": 12054 + }, + { + "epoch": 0.96, + "learning_rate": 1.0565594034704918e-07, + "loss": 0.4156, + "step": 12055 + }, + { + "epoch": 0.96, + "learning_rate": 1.0528423966812307e-07, + "loss": 0.3633, + "step": 12056 + }, + { + "epoch": 0.96, + "learning_rate": 1.0491319050861981e-07, + "loss": 0.4713, + "step": 12057 + }, + { + "epoch": 0.96, + "learning_rate": 1.0454279289296987e-07, + "loss": 0.3741, + "step": 12058 + }, + { + "epoch": 0.96, + "learning_rate": 1.0417304684556373e-07, + "loss": 0.407, + "step": 12059 + }, + { + "epoch": 0.96, + "learning_rate": 1.0380395239074747e-07, + "loss": 0.3741, + "step": 12060 + }, + { + "epoch": 0.96, + "learning_rate": 1.0343550955282278e-07, + "loss": 0.383, + "step": 12061 + }, + { + "epoch": 0.96, + "learning_rate": 1.0306771835605022e-07, + "loss": 0.4156, + "step": 12062 + }, + { + "epoch": 0.96, + "learning_rate": 1.0270057882464823e-07, + "loss": 0.3699, + "step": 12063 + }, + { + "epoch": 0.96, + "learning_rate": 1.0233409098278967e-07, + "loss": 0.3472, + "step": 12064 + }, + { + "epoch": 0.96, + "learning_rate": 1.0196825485460637e-07, + "loss": 0.3561, + "step": 12065 + }, + { + "epoch": 0.96, + "learning_rate": 1.0160307046418794e-07, + "loss": 0.248, + "step": 12066 + }, + { + "epoch": 0.96, + "learning_rate": 1.0123853783557847e-07, + "loss": 0.2995, + "step": 12067 + }, + { + "epoch": 0.96, + "learning_rate": 1.0087465699278321e-07, + "loss": 0.3037, + "step": 12068 + }, + { + "epoch": 0.96, + "learning_rate": 1.0051142795975855e-07, + "loss": 0.3391, + "step": 12069 + }, + { + "epoch": 0.96, + "learning_rate": 1.0014885076042313e-07, + "loss": 0.3256, + "step": 12070 + }, + { + "epoch": 0.96, + "learning_rate": 9.978692541865121e-08, + "loss": 0.4011, + "step": 12071 + }, + { + "epoch": 0.96, + "learning_rate": 9.94256519582748e-08, + "loss": 0.3237, + "step": 12072 + }, + { + "epoch": 0.96, + "learning_rate": 9.906503040307824e-08, + "loss": 0.4269, + "step": 12073 + }, + { + "epoch": 0.96, + "learning_rate": 9.87050607768103e-08, + "loss": 0.4215, + "step": 12074 + }, + { + "epoch": 0.96, + "learning_rate": 9.834574310317313e-08, + "loss": 0.2969, + "step": 12075 + }, + { + "epoch": 0.96, + "learning_rate": 9.798707740582447e-08, + "loss": 0.307, + "step": 12076 + }, + { + "epoch": 0.96, + "learning_rate": 9.762906370837988e-08, + "loss": 0.2986, + "step": 12077 + }, + { + "epoch": 0.96, + "learning_rate": 9.727170203441605e-08, + "loss": 0.2348, + "step": 12078 + }, + { + "epoch": 0.96, + "learning_rate": 9.691499240746083e-08, + "loss": 0.3299, + "step": 12079 + }, + { + "epoch": 0.96, + "learning_rate": 9.65589348510032e-08, + "loss": 0.4185, + "step": 12080 + }, + { + "epoch": 0.96, + "learning_rate": 9.620352938848665e-08, + "loss": 0.3759, + "step": 12081 + }, + { + "epoch": 0.96, + "learning_rate": 9.584877604331467e-08, + "loss": 0.2584, + "step": 12082 + }, + { + "epoch": 0.96, + "learning_rate": 9.549467483884412e-08, + "loss": 0.3448, + "step": 12083 + }, + { + "epoch": 0.96, + "learning_rate": 9.514122579839302e-08, + "loss": 0.3217, + "step": 12084 + }, + { + "epoch": 0.96, + "learning_rate": 9.478842894523165e-08, + "loss": 0.3512, + "step": 12085 + }, + { + "epoch": 0.96, + "learning_rate": 9.443628430259144e-08, + "loss": 0.4864, + "step": 12086 + }, + { + "epoch": 0.96, + "learning_rate": 9.408479189366049e-08, + "loss": 0.3499, + "step": 12087 + }, + { + "epoch": 0.96, + "learning_rate": 9.37339517415814e-08, + "loss": 0.3401, + "step": 12088 + }, + { + "epoch": 0.96, + "learning_rate": 9.33837638694557e-08, + "loss": 0.2571, + "step": 12089 + }, + { + "epoch": 0.96, + "learning_rate": 9.30342283003416e-08, + "loss": 0.3153, + "step": 12090 + }, + { + "epoch": 0.96, + "learning_rate": 9.268534505725402e-08, + "loss": 0.3131, + "step": 12091 + }, + { + "epoch": 0.96, + "learning_rate": 9.233711416316571e-08, + "loss": 0.2881, + "step": 12092 + }, + { + "epoch": 0.96, + "learning_rate": 9.1989535641005e-08, + "loss": 0.3645, + "step": 12093 + }, + { + "epoch": 0.96, + "learning_rate": 9.164260951366021e-08, + "loss": 0.3839, + "step": 12094 + }, + { + "epoch": 0.96, + "learning_rate": 9.129633580397312e-08, + "loss": 0.4747, + "step": 12095 + }, + { + "epoch": 0.96, + "learning_rate": 9.095071453474435e-08, + "loss": 0.3879, + "step": 12096 + }, + { + "epoch": 0.96, + "learning_rate": 9.060574572873238e-08, + "loss": 0.3404, + "step": 12097 + }, + { + "epoch": 0.96, + "learning_rate": 9.026142940865013e-08, + "loss": 0.2679, + "step": 12098 + }, + { + "epoch": 0.96, + "learning_rate": 8.991776559717058e-08, + "loss": 0.3971, + "step": 12099 + }, + { + "epoch": 0.96, + "learning_rate": 8.95747543169223e-08, + "loss": 0.4527, + "step": 12100 + }, + { + "epoch": 0.96, + "learning_rate": 8.923239559049057e-08, + "loss": 0.3804, + "step": 12101 + }, + { + "epoch": 0.96, + "learning_rate": 8.889068944041734e-08, + "loss": 0.3397, + "step": 12102 + }, + { + "epoch": 0.96, + "learning_rate": 8.854963588920351e-08, + "loss": 0.3671, + "step": 12103 + }, + { + "epoch": 0.96, + "learning_rate": 8.820923495930556e-08, + "loss": 0.3644, + "step": 12104 + }, + { + "epoch": 0.96, + "learning_rate": 8.786948667313667e-08, + "loss": 0.4327, + "step": 12105 + }, + { + "epoch": 0.96, + "learning_rate": 8.753039105306782e-08, + "loss": 0.3397, + "step": 12106 + }, + { + "epoch": 0.96, + "learning_rate": 8.719194812142673e-08, + "loss": 0.3636, + "step": 12107 + }, + { + "epoch": 0.96, + "learning_rate": 8.685415790049889e-08, + "loss": 0.3344, + "step": 12108 + }, + { + "epoch": 0.96, + "learning_rate": 8.651702041252541e-08, + "loss": 0.4102, + "step": 12109 + }, + { + "epoch": 0.96, + "learning_rate": 8.61805356797063e-08, + "loss": 0.3707, + "step": 12110 + }, + { + "epoch": 0.96, + "learning_rate": 8.584470372419606e-08, + "loss": 0.4136, + "step": 12111 + }, + { + "epoch": 0.96, + "learning_rate": 8.550952456810813e-08, + "loss": 0.3826, + "step": 12112 + }, + { + "epoch": 0.96, + "learning_rate": 8.517499823351261e-08, + "loss": 0.461, + "step": 12113 + }, + { + "epoch": 0.96, + "learning_rate": 8.484112474243633e-08, + "loss": 0.3296, + "step": 12114 + }, + { + "epoch": 0.96, + "learning_rate": 8.450790411686282e-08, + "loss": 0.2954, + "step": 12115 + }, + { + "epoch": 0.96, + "learning_rate": 8.417533637873454e-08, + "loss": 0.3309, + "step": 12116 + }, + { + "epoch": 0.96, + "learning_rate": 8.384342154994841e-08, + "loss": 0.3679, + "step": 12117 + }, + { + "epoch": 0.96, + "learning_rate": 8.351215965235915e-08, + "loss": 0.2849, + "step": 12118 + }, + { + "epoch": 0.96, + "learning_rate": 8.318155070777822e-08, + "loss": 0.4373, + "step": 12119 + }, + { + "epoch": 0.96, + "learning_rate": 8.28515947379771e-08, + "loss": 0.2149, + "step": 12120 + }, + { + "epoch": 0.96, + "learning_rate": 8.252229176467841e-08, + "loss": 0.2586, + "step": 12121 + }, + { + "epoch": 0.96, + "learning_rate": 8.219364180956812e-08, + "loss": 0.2872, + "step": 12122 + }, + { + "epoch": 0.96, + "learning_rate": 8.186564489428561e-08, + "loss": 0.3229, + "step": 12123 + }, + { + "epoch": 0.96, + "learning_rate": 8.153830104042582e-08, + "loss": 0.2766, + "step": 12124 + }, + { + "epoch": 0.96, + "learning_rate": 8.121161026954482e-08, + "loss": 0.4131, + "step": 12125 + }, + { + "epoch": 0.96, + "learning_rate": 8.088557260315322e-08, + "loss": 0.2755, + "step": 12126 + }, + { + "epoch": 0.96, + "learning_rate": 8.056018806271937e-08, + "loss": 0.4606, + "step": 12127 + }, + { + "epoch": 0.96, + "learning_rate": 8.023545666966726e-08, + "loss": 0.32, + "step": 12128 + }, + { + "epoch": 0.96, + "learning_rate": 7.991137844537977e-08, + "loss": 0.4596, + "step": 12129 + }, + { + "epoch": 0.96, + "learning_rate": 7.958795341119541e-08, + "loss": 0.2653, + "step": 12130 + }, + { + "epoch": 0.96, + "learning_rate": 7.926518158841045e-08, + "loss": 0.392, + "step": 12131 + }, + { + "epoch": 0.96, + "learning_rate": 7.894306299827791e-08, + "loss": 0.3833, + "step": 12132 + }, + { + "epoch": 0.96, + "learning_rate": 7.86215976620075e-08, + "loss": 0.2571, + "step": 12133 + }, + { + "epoch": 0.96, + "learning_rate": 7.83007856007667e-08, + "loss": 0.4766, + "step": 12134 + }, + { + "epoch": 0.96, + "learning_rate": 7.798062683567864e-08, + "loss": 0.3484, + "step": 12135 + }, + { + "epoch": 0.96, + "learning_rate": 7.766112138782422e-08, + "loss": 0.2787, + "step": 12136 + }, + { + "epoch": 0.96, + "learning_rate": 7.734226927824106e-08, + "loss": 0.3435, + "step": 12137 + }, + { + "epoch": 0.96, + "learning_rate": 7.70240705279257e-08, + "loss": 0.3462, + "step": 12138 + }, + { + "epoch": 0.96, + "learning_rate": 7.670652515782917e-08, + "loss": 0.2878, + "step": 12139 + }, + { + "epoch": 0.96, + "learning_rate": 7.638963318886028e-08, + "loss": 0.2658, + "step": 12140 + }, + { + "epoch": 0.96, + "learning_rate": 7.607339464188346e-08, + "loss": 0.3013, + "step": 12141 + }, + { + "epoch": 0.96, + "learning_rate": 7.575780953772427e-08, + "loss": 0.4405, + "step": 12142 + }, + { + "epoch": 0.96, + "learning_rate": 7.544287789715943e-08, + "loss": 0.3033, + "step": 12143 + }, + { + "epoch": 0.96, + "learning_rate": 7.51285997409279e-08, + "loss": 0.3666, + "step": 12144 + }, + { + "epoch": 0.96, + "learning_rate": 7.481497508972313e-08, + "loss": 0.437, + "step": 12145 + }, + { + "epoch": 0.96, + "learning_rate": 7.450200396419416e-08, + "loss": 0.4163, + "step": 12146 + }, + { + "epoch": 0.96, + "learning_rate": 7.418968638495006e-08, + "loss": 0.4216, + "step": 12147 + }, + { + "epoch": 0.96, + "learning_rate": 7.387802237255658e-08, + "loss": 0.2521, + "step": 12148 + }, + { + "epoch": 0.96, + "learning_rate": 7.35670119475329e-08, + "loss": 0.4141, + "step": 12149 + }, + { + "epoch": 0.96, + "learning_rate": 7.325665513035707e-08, + "loss": 0.314, + "step": 12150 + }, + { + "epoch": 0.96, + "learning_rate": 7.294695194146829e-08, + "loss": 0.324, + "step": 12151 + }, + { + "epoch": 0.96, + "learning_rate": 7.263790240125579e-08, + "loss": 0.4119, + "step": 12152 + }, + { + "epoch": 0.96, + "learning_rate": 7.232950653006998e-08, + "loss": 0.4388, + "step": 12153 + }, + { + "epoch": 0.96, + "learning_rate": 7.202176434821683e-08, + "loss": 0.3871, + "step": 12154 + }, + { + "epoch": 0.96, + "learning_rate": 7.171467587596126e-08, + "loss": 0.2624, + "step": 12155 + }, + { + "epoch": 0.96, + "learning_rate": 7.140824113352151e-08, + "loss": 0.3529, + "step": 12156 + }, + { + "epoch": 0.96, + "learning_rate": 7.110246014107592e-08, + "loss": 0.3505, + "step": 12157 + }, + { + "epoch": 0.96, + "learning_rate": 7.079733291875945e-08, + "loss": 0.3633, + "step": 12158 + }, + { + "epoch": 0.96, + "learning_rate": 7.049285948666052e-08, + "loss": 0.306, + "step": 12159 + }, + { + "epoch": 0.96, + "learning_rate": 7.018903986483083e-08, + "loss": 0.3614, + "step": 12160 + }, + { + "epoch": 0.96, + "learning_rate": 6.988587407327219e-08, + "loss": 0.3703, + "step": 12161 + }, + { + "epoch": 0.96, + "learning_rate": 6.958336213194972e-08, + "loss": 0.392, + "step": 12162 + }, + { + "epoch": 0.96, + "learning_rate": 6.928150406077861e-08, + "loss": 0.2839, + "step": 12163 + }, + { + "epoch": 0.96, + "learning_rate": 6.89802998796385e-08, + "loss": 0.4131, + "step": 12164 + }, + { + "epoch": 0.96, + "learning_rate": 6.867974960836022e-08, + "loss": 0.3616, + "step": 12165 + }, + { + "epoch": 0.96, + "learning_rate": 6.837985326673457e-08, + "loss": 0.3696, + "step": 12166 + }, + { + "epoch": 0.96, + "learning_rate": 6.80806108745069e-08, + "loss": 0.3873, + "step": 12167 + }, + { + "epoch": 0.96, + "learning_rate": 6.778202245138144e-08, + "loss": 0.4288, + "step": 12168 + }, + { + "epoch": 0.96, + "learning_rate": 6.748408801701911e-08, + "loss": 0.2594, + "step": 12169 + }, + { + "epoch": 0.96, + "learning_rate": 6.718680759103757e-08, + "loss": 0.3184, + "step": 12170 + }, + { + "epoch": 0.96, + "learning_rate": 6.689018119301227e-08, + "loss": 0.3662, + "step": 12171 + }, + { + "epoch": 0.96, + "learning_rate": 6.659420884247203e-08, + "loss": 0.3546, + "step": 12172 + }, + { + "epoch": 0.96, + "learning_rate": 6.629889055890682e-08, + "loss": 0.3719, + "step": 12173 + }, + { + "epoch": 0.96, + "learning_rate": 6.600422636176219e-08, + "loss": 0.3835, + "step": 12174 + }, + { + "epoch": 0.96, + "learning_rate": 6.571021627043928e-08, + "loss": 0.3098, + "step": 12175 + }, + { + "epoch": 0.96, + "learning_rate": 6.541686030429817e-08, + "loss": 0.3724, + "step": 12176 + }, + { + "epoch": 0.96, + "learning_rate": 6.512415848265453e-08, + "loss": 0.3477, + "step": 12177 + }, + { + "epoch": 0.96, + "learning_rate": 6.48321108247818e-08, + "loss": 0.3171, + "step": 12178 + }, + { + "epoch": 0.96, + "learning_rate": 6.454071734990907e-08, + "loss": 0.4526, + "step": 12179 + }, + { + "epoch": 0.96, + "learning_rate": 6.424997807722433e-08, + "loss": 0.3519, + "step": 12180 + }, + { + "epoch": 0.97, + "learning_rate": 6.395989302587113e-08, + "loss": 0.348, + "step": 12181 + }, + { + "epoch": 0.97, + "learning_rate": 6.367046221494866e-08, + "loss": 0.4227, + "step": 12182 + }, + { + "epoch": 0.97, + "learning_rate": 6.33816856635161e-08, + "loss": 0.2685, + "step": 12183 + }, + { + "epoch": 0.97, + "learning_rate": 6.309356339058825e-08, + "loss": 0.3617, + "step": 12184 + }, + { + "epoch": 0.97, + "learning_rate": 6.28060954151355e-08, + "loss": 0.2706, + "step": 12185 + }, + { + "epoch": 0.97, + "learning_rate": 6.251928175608602e-08, + "loss": 0.3387, + "step": 12186 + }, + { + "epoch": 0.97, + "learning_rate": 6.223312243232693e-08, + "loss": 0.5133, + "step": 12187 + }, + { + "epoch": 0.97, + "learning_rate": 6.194761746269762e-08, + "loss": 0.3192, + "step": 12188 + }, + { + "epoch": 0.97, + "learning_rate": 6.16627668659997e-08, + "loss": 0.3286, + "step": 12189 + }, + { + "epoch": 0.97, + "learning_rate": 6.137857066098929e-08, + "loss": 0.4659, + "step": 12190 + }, + { + "epoch": 0.97, + "learning_rate": 6.109502886637697e-08, + "loss": 0.2805, + "step": 12191 + }, + { + "epoch": 0.97, + "learning_rate": 6.081214150083447e-08, + "loss": 0.2075, + "step": 12192 + }, + { + "epoch": 0.97, + "learning_rate": 6.052990858298801e-08, + "loss": 0.3727, + "step": 12193 + }, + { + "epoch": 0.97, + "learning_rate": 6.024833013142272e-08, + "loss": 0.37, + "step": 12194 + }, + { + "epoch": 0.97, + "learning_rate": 5.9967406164676e-08, + "loss": 0.3872, + "step": 12195 + }, + { + "epoch": 0.97, + "learning_rate": 5.96871367012486e-08, + "loss": 0.2285, + "step": 12196 + }, + { + "epoch": 0.97, + "learning_rate": 5.9407521759592414e-08, + "loss": 0.4702, + "step": 12197 + }, + { + "epoch": 0.97, + "learning_rate": 5.912856135812051e-08, + "loss": 0.3225, + "step": 12198 + }, + { + "epoch": 0.97, + "learning_rate": 5.8850255515200405e-08, + "loss": 0.2935, + "step": 12199 + }, + { + "epoch": 0.97, + "learning_rate": 5.857260424915634e-08, + "loss": 0.3875, + "step": 12200 + }, + { + "epoch": 0.97, + "learning_rate": 5.8295607578272575e-08, + "loss": 0.4305, + "step": 12201 + }, + { + "epoch": 0.97, + "learning_rate": 5.801926552078563e-08, + "loss": 0.4076, + "step": 12202 + }, + { + "epoch": 0.97, + "learning_rate": 5.774357809489317e-08, + "loss": 0.3179, + "step": 12203 + }, + { + "epoch": 0.97, + "learning_rate": 5.746854531874624e-08, + "loss": 0.4271, + "step": 12204 + }, + { + "epoch": 0.97, + "learning_rate": 5.7194167210454785e-08, + "loss": 0.3155, + "step": 12205 + }, + { + "epoch": 0.97, + "learning_rate": 5.692044378808659e-08, + "loss": 0.3239, + "step": 12206 + }, + { + "epoch": 0.97, + "learning_rate": 5.664737506966389e-08, + "loss": 0.3566, + "step": 12207 + }, + { + "epoch": 0.97, + "learning_rate": 5.6374961073166757e-08, + "loss": 0.3701, + "step": 12208 + }, + { + "epoch": 0.97, + "learning_rate": 5.610320181653306e-08, + "loss": 0.4315, + "step": 12209 + }, + { + "epoch": 0.97, + "learning_rate": 5.583209731765626e-08, + "loss": 0.3273, + "step": 12210 + }, + { + "epoch": 0.97, + "learning_rate": 5.5561647594388756e-08, + "loss": 0.3646, + "step": 12211 + }, + { + "epoch": 0.97, + "learning_rate": 5.529185266453629e-08, + "loss": 0.4587, + "step": 12212 + }, + { + "epoch": 0.97, + "learning_rate": 5.502271254586356e-08, + "loss": 0.292, + "step": 12213 + }, + { + "epoch": 0.97, + "learning_rate": 5.4754227256094136e-08, + "loss": 0.3092, + "step": 12214 + }, + { + "epoch": 0.97, + "learning_rate": 5.4486396812906125e-08, + "loss": 0.3388, + "step": 12215 + }, + { + "epoch": 0.97, + "learning_rate": 5.421922123393208e-08, + "loss": 0.4311, + "step": 12216 + }, + { + "epoch": 0.97, + "learning_rate": 5.395270053676793e-08, + "loss": 0.2737, + "step": 12217 + }, + { + "epoch": 0.97, + "learning_rate": 5.3686834738960744e-08, + "loss": 0.3873, + "step": 12218 + }, + { + "epoch": 0.97, + "learning_rate": 5.3421623858016525e-08, + "loss": 0.343, + "step": 12219 + }, + { + "epoch": 0.97, + "learning_rate": 5.3157067911399076e-08, + "loss": 0.3047, + "step": 12220 + }, + { + "epoch": 0.97, + "learning_rate": 5.289316691652668e-08, + "loss": 0.3618, + "step": 12221 + }, + { + "epoch": 0.97, + "learning_rate": 5.2629920890777676e-08, + "loss": 0.3897, + "step": 12222 + }, + { + "epoch": 0.97, + "learning_rate": 5.236732985148374e-08, + "loss": 0.3697, + "step": 12223 + }, + { + "epoch": 0.97, + "learning_rate": 5.21053938159366e-08, + "loss": 0.3475, + "step": 12224 + }, + { + "epoch": 0.97, + "learning_rate": 5.1844112801383576e-08, + "loss": 0.3527, + "step": 12225 + }, + { + "epoch": 0.97, + "learning_rate": 5.158348682502756e-08, + "loss": 0.2972, + "step": 12226 + }, + { + "epoch": 0.97, + "learning_rate": 5.1323515904031506e-08, + "loss": 0.3668, + "step": 12227 + }, + { + "epoch": 0.97, + "learning_rate": 5.1064200055510606e-08, + "loss": 0.34, + "step": 12228 + }, + { + "epoch": 0.97, + "learning_rate": 5.080553929654119e-08, + "loss": 0.3656, + "step": 12229 + }, + { + "epoch": 0.97, + "learning_rate": 5.05475336441541e-08, + "loss": 0.3391, + "step": 12230 + }, + { + "epoch": 0.97, + "learning_rate": 5.0290183115339065e-08, + "loss": 0.4544, + "step": 12231 + }, + { + "epoch": 0.97, + "learning_rate": 5.003348772704031e-08, + "loss": 0.3577, + "step": 12232 + }, + { + "epoch": 0.97, + "learning_rate": 4.977744749615987e-08, + "loss": 0.3168, + "step": 12233 + }, + { + "epoch": 0.97, + "learning_rate": 4.9522062439557595e-08, + "loss": 0.3094, + "step": 12234 + }, + { + "epoch": 0.97, + "learning_rate": 4.926733257404892e-08, + "loss": 0.2749, + "step": 12235 + }, + { + "epoch": 0.97, + "learning_rate": 4.901325791640599e-08, + "loss": 0.3631, + "step": 12236 + }, + { + "epoch": 0.97, + "learning_rate": 4.8759838483358745e-08, + "loss": 0.2556, + "step": 12237 + }, + { + "epoch": 0.97, + "learning_rate": 4.850707429159496e-08, + "loss": 0.3143, + "step": 12238 + }, + { + "epoch": 0.97, + "learning_rate": 4.825496535775576e-08, + "loss": 0.3547, + "step": 12239 + }, + { + "epoch": 0.97, + "learning_rate": 4.800351169844231e-08, + "loss": 0.4514, + "step": 12240 + }, + { + "epoch": 0.97, + "learning_rate": 4.7752713330212475e-08, + "loss": 0.3069, + "step": 12241 + }, + { + "epoch": 0.97, + "learning_rate": 4.7502570269578605e-08, + "loss": 0.3333, + "step": 12242 + }, + { + "epoch": 0.97, + "learning_rate": 4.725308253301197e-08, + "loss": 0.3464, + "step": 12243 + }, + { + "epoch": 0.97, + "learning_rate": 4.7004250136940547e-08, + "loss": 0.3236, + "step": 12244 + }, + { + "epoch": 0.97, + "learning_rate": 4.675607309774899e-08, + "loss": 0.4539, + "step": 12245 + }, + { + "epoch": 0.97, + "learning_rate": 4.650855143177757e-08, + "loss": 0.4041, + "step": 12246 + }, + { + "epoch": 0.97, + "learning_rate": 4.626168515532548e-08, + "loss": 0.3215, + "step": 12247 + }, + { + "epoch": 0.97, + "learning_rate": 4.6015474284646366e-08, + "loss": 0.3223, + "step": 12248 + }, + { + "epoch": 0.97, + "learning_rate": 4.576991883595283e-08, + "loss": 0.3437, + "step": 12249 + }, + { + "epoch": 0.97, + "learning_rate": 4.5525018825414157e-08, + "loss": 0.3455, + "step": 12250 + }, + { + "epoch": 0.97, + "learning_rate": 4.528077426915412e-08, + "loss": 0.4493, + "step": 12251 + }, + { + "epoch": 0.97, + "learning_rate": 4.50371851832565e-08, + "loss": 0.443, + "step": 12252 + }, + { + "epoch": 0.97, + "learning_rate": 4.4794251583759604e-08, + "loss": 0.337, + "step": 12253 + }, + { + "epoch": 0.97, + "learning_rate": 4.4551973486660625e-08, + "loss": 0.3312, + "step": 12254 + }, + { + "epoch": 0.97, + "learning_rate": 4.431035090791125e-08, + "loss": 0.3591, + "step": 12255 + }, + { + "epoch": 0.97, + "learning_rate": 4.4069383863420966e-08, + "loss": 0.3252, + "step": 12256 + }, + { + "epoch": 0.97, + "learning_rate": 4.38290723690582e-08, + "loss": 0.3375, + "step": 12257 + }, + { + "epoch": 0.97, + "learning_rate": 4.3589416440643626e-08, + "loss": 0.2726, + "step": 12258 + }, + { + "epoch": 0.97, + "learning_rate": 4.335041609396018e-08, + "loss": 0.2164, + "step": 12259 + }, + { + "epoch": 0.97, + "learning_rate": 4.3112071344741935e-08, + "loss": 0.3031, + "step": 12260 + }, + { + "epoch": 0.97, + "learning_rate": 4.287438220868523e-08, + "loss": 0.3503, + "step": 12261 + }, + { + "epoch": 0.97, + "learning_rate": 4.263734870143976e-08, + "loss": 0.3621, + "step": 12262 + }, + { + "epoch": 0.97, + "learning_rate": 4.2400970838613057e-08, + "loss": 0.4393, + "step": 12263 + }, + { + "epoch": 0.97, + "learning_rate": 4.216524863576932e-08, + "loss": 0.333, + "step": 12264 + }, + { + "epoch": 0.97, + "learning_rate": 4.1930182108430584e-08, + "loss": 0.2678, + "step": 12265 + }, + { + "epoch": 0.97, + "learning_rate": 4.1695771272073357e-08, + "loss": 0.2386, + "step": 12266 + }, + { + "epoch": 0.97, + "learning_rate": 4.146201614213419e-08, + "loss": 0.3534, + "step": 12267 + }, + { + "epoch": 0.97, + "learning_rate": 4.1228916734002976e-08, + "loss": 0.3282, + "step": 12268 + }, + { + "epoch": 0.97, + "learning_rate": 4.099647306302856e-08, + "loss": 0.3841, + "step": 12269 + }, + { + "epoch": 0.97, + "learning_rate": 4.076468514451759e-08, + "loss": 0.3879, + "step": 12270 + }, + { + "epoch": 0.97, + "learning_rate": 4.0533552993731186e-08, + "loss": 0.2948, + "step": 12271 + }, + { + "epoch": 0.97, + "learning_rate": 4.030307662588939e-08, + "loss": 0.3277, + "step": 12272 + }, + { + "epoch": 0.97, + "learning_rate": 4.007325605616563e-08, + "loss": 0.2959, + "step": 12273 + }, + { + "epoch": 0.97, + "learning_rate": 3.9844091299694466e-08, + "loss": 0.3895, + "step": 12274 + }, + { + "epoch": 0.97, + "learning_rate": 3.961558237156493e-08, + "loss": 0.3588, + "step": 12275 + }, + { + "epoch": 0.97, + "learning_rate": 3.9387729286821666e-08, + "loss": 0.2916, + "step": 12276 + }, + { + "epoch": 0.97, + "learning_rate": 3.9160532060470435e-08, + "loss": 0.3493, + "step": 12277 + }, + { + "epoch": 0.97, + "learning_rate": 3.893399070746928e-08, + "loss": 0.2952, + "step": 12278 + }, + { + "epoch": 0.97, + "learning_rate": 3.870810524273516e-08, + "loss": 0.2734, + "step": 12279 + }, + { + "epoch": 0.97, + "learning_rate": 3.8482875681140616e-08, + "loss": 0.3387, + "step": 12280 + }, + { + "epoch": 0.97, + "learning_rate": 3.8258302037518234e-08, + "loss": 0.4282, + "step": 12281 + }, + { + "epoch": 0.97, + "learning_rate": 3.803438432665396e-08, + "loss": 0.4403, + "step": 12282 + }, + { + "epoch": 0.97, + "learning_rate": 3.781112256329045e-08, + "loss": 0.3155, + "step": 12283 + }, + { + "epoch": 0.97, + "learning_rate": 3.758851676213038e-08, + "loss": 0.3653, + "step": 12284 + }, + { + "epoch": 0.97, + "learning_rate": 3.7366566937829804e-08, + "loss": 0.3528, + "step": 12285 + }, + { + "epoch": 0.97, + "learning_rate": 3.714527310500371e-08, + "loss": 0.3451, + "step": 12286 + }, + { + "epoch": 0.97, + "learning_rate": 3.692463527822376e-08, + "loss": 0.4024, + "step": 12287 + }, + { + "epoch": 0.97, + "learning_rate": 3.670465347201724e-08, + "loss": 0.4269, + "step": 12288 + }, + { + "epoch": 0.97, + "learning_rate": 3.6485327700869214e-08, + "loss": 0.3188, + "step": 12289 + }, + { + "epoch": 0.97, + "learning_rate": 3.6266657979220356e-08, + "loss": 0.3658, + "step": 12290 + }, + { + "epoch": 0.97, + "learning_rate": 3.604864432147026e-08, + "loss": 0.3063, + "step": 12291 + }, + { + "epoch": 0.97, + "learning_rate": 3.5831286741973006e-08, + "loss": 0.3376, + "step": 12292 + }, + { + "epoch": 0.97, + "learning_rate": 3.561458525504047e-08, + "loss": 0.3113, + "step": 12293 + }, + { + "epoch": 0.97, + "learning_rate": 3.539853987494235e-08, + "loss": 0.3219, + "step": 12294 + }, + { + "epoch": 0.97, + "learning_rate": 3.518315061590394e-08, + "loss": 0.2272, + "step": 12295 + }, + { + "epoch": 0.97, + "learning_rate": 3.496841749210722e-08, + "loss": 0.2917, + "step": 12296 + }, + { + "epoch": 0.97, + "learning_rate": 3.4754340517691996e-08, + "loss": 0.2599, + "step": 12297 + }, + { + "epoch": 0.97, + "learning_rate": 3.454091970675366e-08, + "loss": 0.4119, + "step": 12298 + }, + { + "epoch": 0.97, + "learning_rate": 3.4328155073344306e-08, + "loss": 0.3751, + "step": 12299 + }, + { + "epoch": 0.97, + "learning_rate": 3.411604663147494e-08, + "loss": 0.3124, + "step": 12300 + }, + { + "epoch": 0.97, + "learning_rate": 3.3904594395111066e-08, + "loss": 0.3034, + "step": 12301 + }, + { + "epoch": 0.97, + "learning_rate": 3.369379837817599e-08, + "loss": 0.3334, + "step": 12302 + }, + { + "epoch": 0.97, + "learning_rate": 3.3483658594548606e-08, + "loss": 0.3482, + "step": 12303 + }, + { + "epoch": 0.97, + "learning_rate": 3.327417505806785e-08, + "loss": 0.2933, + "step": 12304 + }, + { + "epoch": 0.97, + "learning_rate": 3.30653477825249e-08, + "loss": 0.3221, + "step": 12305 + }, + { + "epoch": 0.97, + "learning_rate": 3.2857176781671e-08, + "loss": 0.4464, + "step": 12306 + }, + { + "epoch": 0.98, + "learning_rate": 3.264966206921294e-08, + "loss": 0.2984, + "step": 12307 + }, + { + "epoch": 0.98, + "learning_rate": 3.244280365881536e-08, + "loss": 0.2738, + "step": 12308 + }, + { + "epoch": 0.98, + "learning_rate": 3.223660156409847e-08, + "loss": 0.3831, + "step": 12309 + }, + { + "epoch": 0.98, + "learning_rate": 3.203105579863919e-08, + "loss": 0.3796, + "step": 12310 + }, + { + "epoch": 0.98, + "learning_rate": 3.1826166375972246e-08, + "loss": 0.365, + "step": 12311 + }, + { + "epoch": 0.98, + "learning_rate": 3.162193330958796e-08, + "loss": 0.285, + "step": 12312 + }, + { + "epoch": 0.98, + "learning_rate": 3.141835661293557e-08, + "loss": 0.303, + "step": 12313 + }, + { + "epoch": 0.98, + "learning_rate": 3.12154362994177e-08, + "loss": 0.4375, + "step": 12314 + }, + { + "epoch": 0.98, + "learning_rate": 3.1013172382396984e-08, + "loss": 0.3302, + "step": 12315 + }, + { + "epoch": 0.98, + "learning_rate": 3.0811564875190544e-08, + "loss": 0.3792, + "step": 12316 + }, + { + "epoch": 0.98, + "learning_rate": 3.061061379107555e-08, + "loss": 0.2985, + "step": 12317 + }, + { + "epoch": 0.98, + "learning_rate": 3.04103191432803e-08, + "loss": 0.2888, + "step": 12318 + }, + { + "epoch": 0.98, + "learning_rate": 3.0210680944995354e-08, + "loss": 0.4233, + "step": 12319 + }, + { + "epoch": 0.98, + "learning_rate": 3.001169920936575e-08, + "loss": 0.2801, + "step": 12320 + }, + { + "epoch": 0.98, + "learning_rate": 2.981337394949324e-08, + "loss": 0.3678, + "step": 12321 + }, + { + "epoch": 0.98, + "learning_rate": 2.961570517843626e-08, + "loss": 0.3405, + "step": 12322 + }, + { + "epoch": 0.98, + "learning_rate": 2.9418692909211066e-08, + "loss": 0.3177, + "step": 12323 + }, + { + "epoch": 0.98, + "learning_rate": 2.9222337154789504e-08, + "loss": 0.3458, + "step": 12324 + }, + { + "epoch": 0.98, + "learning_rate": 2.902663792810012e-08, + "loss": 0.3641, + "step": 12325 + }, + { + "epoch": 0.98, + "learning_rate": 2.8831595242030387e-08, + "loss": 0.2877, + "step": 12326 + }, + { + "epoch": 0.98, + "learning_rate": 2.863720910942114e-08, + "loss": 0.3668, + "step": 12327 + }, + { + "epoch": 0.98, + "learning_rate": 2.8443479543073248e-08, + "loss": 0.3146, + "step": 12328 + }, + { + "epoch": 0.98, + "learning_rate": 2.825040655574207e-08, + "loss": 0.3382, + "step": 12329 + }, + { + "epoch": 0.98, + "learning_rate": 2.8057990160139658e-08, + "loss": 0.5162, + "step": 12330 + }, + { + "epoch": 0.98, + "learning_rate": 2.7866230368936986e-08, + "loss": 0.3044, + "step": 12331 + }, + { + "epoch": 0.98, + "learning_rate": 2.767512719476062e-08, + "loss": 0.405, + "step": 12332 + }, + { + "epoch": 0.98, + "learning_rate": 2.7484680650193827e-08, + "loss": 0.3077, + "step": 12333 + }, + { + "epoch": 0.98, + "learning_rate": 2.729489074777547e-08, + "loss": 0.2895, + "step": 12334 + }, + { + "epoch": 0.98, + "learning_rate": 2.7105757500002215e-08, + "loss": 0.3598, + "step": 12335 + }, + { + "epoch": 0.98, + "learning_rate": 2.6917280919329656e-08, + "loss": 0.3908, + "step": 12336 + }, + { + "epoch": 0.98, + "learning_rate": 2.6729461018166758e-08, + "loss": 0.2664, + "step": 12337 + }, + { + "epoch": 0.98, + "learning_rate": 2.654229780887918e-08, + "loss": 0.2869, + "step": 12338 + }, + { + "epoch": 0.98, + "learning_rate": 2.6355791303792622e-08, + "loss": 0.2547, + "step": 12339 + }, + { + "epoch": 0.98, + "learning_rate": 2.6169941515188368e-08, + "loss": 0.4525, + "step": 12340 + }, + { + "epoch": 0.98, + "learning_rate": 2.5984748455301077e-08, + "loss": 0.3583, + "step": 12341 + }, + { + "epoch": 0.98, + "learning_rate": 2.5800212136326552e-08, + "loss": 0.3449, + "step": 12342 + }, + { + "epoch": 0.98, + "learning_rate": 2.561633257041507e-08, + "loss": 0.4563, + "step": 12343 + }, + { + "epoch": 0.98, + "learning_rate": 2.5433109769674724e-08, + "loss": 0.4856, + "step": 12344 + }, + { + "epoch": 0.98, + "learning_rate": 2.52505437461692e-08, + "loss": 0.3805, + "step": 12345 + }, + { + "epoch": 0.98, + "learning_rate": 2.5068634511919986e-08, + "loss": 0.4865, + "step": 12346 + }, + { + "epoch": 0.98, + "learning_rate": 2.4887382078905287e-08, + "loss": 0.3398, + "step": 12347 + }, + { + "epoch": 0.98, + "learning_rate": 2.4706786459058885e-08, + "loss": 0.3696, + "step": 12348 + }, + { + "epoch": 0.98, + "learning_rate": 2.4526847664273488e-08, + "loss": 0.3389, + "step": 12349 + }, + { + "epoch": 0.98, + "learning_rate": 2.434756570639518e-08, + "loss": 0.293, + "step": 12350 + }, + { + "epoch": 0.98, + "learning_rate": 2.4168940597230074e-08, + "loss": 0.4668, + "step": 12351 + }, + { + "epoch": 0.98, + "learning_rate": 2.3990972348539864e-08, + "loss": 0.255, + "step": 12352 + }, + { + "epoch": 0.98, + "learning_rate": 2.381366097204296e-08, + "loss": 0.3882, + "step": 12353 + }, + { + "epoch": 0.98, + "learning_rate": 2.363700647941336e-08, + "loss": 0.3793, + "step": 12354 + }, + { + "epoch": 0.98, + "learning_rate": 2.3461008882283977e-08, + "loss": 0.3071, + "step": 12355 + }, + { + "epoch": 0.98, + "learning_rate": 2.3285668192243317e-08, + "loss": 0.4089, + "step": 12356 + }, + { + "epoch": 0.98, + "learning_rate": 2.311098442083659e-08, + "loss": 0.3857, + "step": 12357 + }, + { + "epoch": 0.98, + "learning_rate": 2.293695757956571e-08, + "loss": 0.25, + "step": 12358 + }, + { + "epoch": 0.98, + "learning_rate": 2.2763587679889288e-08, + "loss": 0.3484, + "step": 12359 + }, + { + "epoch": 0.98, + "learning_rate": 2.2590874733223744e-08, + "loss": 0.3381, + "step": 12360 + }, + { + "epoch": 0.98, + "learning_rate": 2.2418818750939986e-08, + "loss": 0.3079, + "step": 12361 + }, + { + "epoch": 0.98, + "learning_rate": 2.2247419744368946e-08, + "loss": 0.3943, + "step": 12362 + }, + { + "epoch": 0.98, + "learning_rate": 2.207667772479494e-08, + "loss": 0.3572, + "step": 12363 + }, + { + "epoch": 0.98, + "learning_rate": 2.190659270346118e-08, + "loss": 0.3074, + "step": 12364 + }, + { + "epoch": 0.98, + "learning_rate": 2.1737164691566502e-08, + "loss": 0.3893, + "step": 12365 + }, + { + "epoch": 0.98, + "learning_rate": 2.156839370026753e-08, + "loss": 0.2938, + "step": 12366 + }, + { + "epoch": 0.98, + "learning_rate": 2.140027974067649e-08, + "loss": 0.3326, + "step": 12367 + }, + { + "epoch": 0.98, + "learning_rate": 2.1232822823862297e-08, + "loss": 0.3438, + "step": 12368 + }, + { + "epoch": 0.98, + "learning_rate": 2.1066022960852806e-08, + "loss": 0.3707, + "step": 12369 + }, + { + "epoch": 0.98, + "learning_rate": 2.0899880162630336e-08, + "loss": 0.3165, + "step": 12370 + }, + { + "epoch": 0.98, + "learning_rate": 2.073439444013392e-08, + "loss": 0.316, + "step": 12371 + }, + { + "epoch": 0.98, + "learning_rate": 2.0569565804260393e-08, + "loss": 0.2551, + "step": 12372 + }, + { + "epoch": 0.98, + "learning_rate": 2.04053942658633e-08, + "loss": 0.3113, + "step": 12373 + }, + { + "epoch": 0.98, + "learning_rate": 2.0241879835752875e-08, + "loss": 0.3002, + "step": 12374 + }, + { + "epoch": 0.98, + "learning_rate": 2.0079022524694957e-08, + "loss": 0.199, + "step": 12375 + }, + { + "epoch": 0.98, + "learning_rate": 1.991682234341208e-08, + "loss": 0.3103, + "step": 12376 + }, + { + "epoch": 0.98, + "learning_rate": 1.9755279302585696e-08, + "loss": 0.3701, + "step": 12377 + }, + { + "epoch": 0.98, + "learning_rate": 1.959439341285285e-08, + "loss": 0.3296, + "step": 12378 + }, + { + "epoch": 0.98, + "learning_rate": 1.943416468480619e-08, + "loss": 0.3173, + "step": 12379 + }, + { + "epoch": 0.98, + "learning_rate": 1.9274593128996155e-08, + "loss": 0.3488, + "step": 12380 + }, + { + "epoch": 0.98, + "learning_rate": 1.9115678755929902e-08, + "loss": 0.2423, + "step": 12381 + }, + { + "epoch": 0.98, + "learning_rate": 1.8957421576071277e-08, + "loss": 0.3379, + "step": 12382 + }, + { + "epoch": 0.98, + "learning_rate": 1.879982159984084e-08, + "loss": 0.339, + "step": 12383 + }, + { + "epoch": 0.98, + "learning_rate": 1.864287883761695e-08, + "loss": 0.4081, + "step": 12384 + }, + { + "epoch": 0.98, + "learning_rate": 1.8486593299730236e-08, + "loss": 0.3091, + "step": 12385 + }, + { + "epoch": 0.98, + "learning_rate": 1.8330964996474688e-08, + "loss": 0.3271, + "step": 12386 + }, + { + "epoch": 0.98, + "learning_rate": 1.817599393809544e-08, + "loss": 0.3311, + "step": 12387 + }, + { + "epoch": 0.98, + "learning_rate": 1.802168013479877e-08, + "loss": 0.4229, + "step": 12388 + }, + { + "epoch": 0.98, + "learning_rate": 1.7868023596743224e-08, + "loss": 0.353, + "step": 12389 + }, + { + "epoch": 0.98, + "learning_rate": 1.771502433404737e-08, + "loss": 0.3955, + "step": 12390 + }, + { + "epoch": 0.98, + "learning_rate": 1.7562682356786488e-08, + "loss": 0.2438, + "step": 12391 + }, + { + "epoch": 0.98, + "learning_rate": 1.7410997674989215e-08, + "loss": 0.2723, + "step": 12392 + }, + { + "epoch": 0.98, + "learning_rate": 1.7259970298645345e-08, + "loss": 0.2759, + "step": 12393 + }, + { + "epoch": 0.98, + "learning_rate": 1.7109600237698032e-08, + "loss": 0.3287, + "step": 12394 + }, + { + "epoch": 0.98, + "learning_rate": 1.6959887502049356e-08, + "loss": 0.3311, + "step": 12395 + }, + { + "epoch": 0.98, + "learning_rate": 1.6810832101556984e-08, + "loss": 0.3271, + "step": 12396 + }, + { + "epoch": 0.98, + "learning_rate": 1.666243404603529e-08, + "loss": 0.2997, + "step": 12397 + }, + { + "epoch": 0.98, + "learning_rate": 1.651469334525424e-08, + "loss": 0.3459, + "step": 12398 + }, + { + "epoch": 0.98, + "learning_rate": 1.6367610008944935e-08, + "loss": 0.3003, + "step": 12399 + }, + { + "epoch": 0.98, + "learning_rate": 1.622118404678963e-08, + "loss": 0.3169, + "step": 12400 + }, + { + "epoch": 0.98, + "learning_rate": 1.607541546843061e-08, + "loss": 0.3777, + "step": 12401 + }, + { + "epoch": 0.98, + "learning_rate": 1.593030428346576e-08, + "loss": 0.2519, + "step": 12402 + }, + { + "epoch": 0.98, + "learning_rate": 1.578585050144965e-08, + "loss": 0.3807, + "step": 12403 + }, + { + "epoch": 0.98, + "learning_rate": 1.564205413189468e-08, + "loss": 0.3554, + "step": 12404 + }, + { + "epoch": 0.98, + "learning_rate": 1.5498915184268826e-08, + "loss": 0.3699, + "step": 12405 + }, + { + "epoch": 0.98, + "learning_rate": 1.5356433667996772e-08, + "loss": 0.3391, + "step": 12406 + }, + { + "epoch": 0.98, + "learning_rate": 1.5214609592461015e-08, + "loss": 0.4468, + "step": 12407 + }, + { + "epoch": 0.98, + "learning_rate": 1.507344296699964e-08, + "loss": 0.3558, + "step": 12408 + }, + { + "epoch": 0.98, + "learning_rate": 1.4932933800907435e-08, + "loss": 0.3824, + "step": 12409 + }, + { + "epoch": 0.98, + "learning_rate": 1.4793082103435885e-08, + "loss": 0.3835, + "step": 12410 + }, + { + "epoch": 0.98, + "learning_rate": 1.4653887883794293e-08, + "loss": 0.3674, + "step": 12411 + }, + { + "epoch": 0.98, + "learning_rate": 1.451535115114866e-08, + "loss": 0.3383, + "step": 12412 + }, + { + "epoch": 0.98, + "learning_rate": 1.4377471914619468e-08, + "loss": 0.3781, + "step": 12413 + }, + { + "epoch": 0.98, + "learning_rate": 1.424025018328612e-08, + "loss": 0.3055, + "step": 12414 + }, + { + "epoch": 0.98, + "learning_rate": 1.4103685966183612e-08, + "loss": 0.3523, + "step": 12415 + }, + { + "epoch": 0.98, + "learning_rate": 1.396777927230475e-08, + "loss": 0.2649, + "step": 12416 + }, + { + "epoch": 0.98, + "learning_rate": 1.383253011059682e-08, + "loss": 0.3205, + "step": 12417 + }, + { + "epoch": 0.98, + "learning_rate": 1.3697938489967144e-08, + "loss": 0.3111, + "step": 12418 + }, + { + "epoch": 0.98, + "learning_rate": 1.3564004419277522e-08, + "loss": 0.3626, + "step": 12419 + }, + { + "epoch": 0.98, + "learning_rate": 1.3430727907346453e-08, + "loss": 0.4115, + "step": 12420 + }, + { + "epoch": 0.98, + "learning_rate": 1.329810896294914e-08, + "loss": 0.3974, + "step": 12421 + }, + { + "epoch": 0.98, + "learning_rate": 1.3166147594818601e-08, + "loss": 0.391, + "step": 12422 + }, + { + "epoch": 0.98, + "learning_rate": 1.3034843811644548e-08, + "loss": 0.3474, + "step": 12423 + }, + { + "epoch": 0.98, + "learning_rate": 1.290419762207007e-08, + "loss": 0.4286, + "step": 12424 + }, + { + "epoch": 0.98, + "learning_rate": 1.2774209034700503e-08, + "loss": 0.2913, + "step": 12425 + }, + { + "epoch": 0.98, + "learning_rate": 1.2644878058093446e-08, + "loss": 0.2679, + "step": 12426 + }, + { + "epoch": 0.98, + "learning_rate": 1.2516204700765422e-08, + "loss": 0.2983, + "step": 12427 + }, + { + "epoch": 0.98, + "learning_rate": 1.2388188971188542e-08, + "loss": 0.3908, + "step": 12428 + }, + { + "epoch": 0.98, + "learning_rate": 1.2260830877792729e-08, + "loss": 0.4374, + "step": 12429 + }, + { + "epoch": 0.98, + "learning_rate": 1.2134130428962387e-08, + "loss": 0.3571, + "step": 12430 + }, + { + "epoch": 0.98, + "learning_rate": 1.2008087633040843e-08, + "loss": 0.3237, + "step": 12431 + }, + { + "epoch": 0.98, + "learning_rate": 1.1882702498328125e-08, + "loss": 0.4175, + "step": 12432 + }, + { + "epoch": 0.98, + "learning_rate": 1.175797503307874e-08, + "loss": 0.2618, + "step": 12433 + }, + { + "epoch": 0.99, + "learning_rate": 1.1633905245507227e-08, + "loss": 0.437, + "step": 12434 + }, + { + "epoch": 0.99, + "learning_rate": 1.1510493143782609e-08, + "loss": 0.3234, + "step": 12435 + }, + { + "epoch": 0.99, + "learning_rate": 1.1387738736029496e-08, + "loss": 0.3155, + "step": 12436 + }, + { + "epoch": 0.99, + "learning_rate": 1.1265642030331426e-08, + "loss": 0.3013, + "step": 12437 + }, + { + "epoch": 0.99, + "learning_rate": 1.114420303472974e-08, + "loss": 0.3903, + "step": 12438 + }, + { + "epoch": 0.99, + "learning_rate": 1.1023421757216934e-08, + "loss": 0.2791, + "step": 12439 + }, + { + "epoch": 0.99, + "learning_rate": 1.090329820574887e-08, + "loss": 0.3305, + "step": 12440 + }, + { + "epoch": 0.99, + "learning_rate": 1.0783832388234772e-08, + "loss": 0.3902, + "step": 12441 + }, + { + "epoch": 0.99, + "learning_rate": 1.0665024312539462e-08, + "loss": 0.4853, + "step": 12442 + }, + { + "epoch": 0.99, + "learning_rate": 1.0546873986486682e-08, + "loss": 0.237, + "step": 12443 + }, + { + "epoch": 0.99, + "learning_rate": 1.0429381417856877e-08, + "loss": 0.3397, + "step": 12444 + }, + { + "epoch": 0.99, + "learning_rate": 1.0312546614384966e-08, + "loss": 0.3208, + "step": 12445 + }, + { + "epoch": 0.99, + "learning_rate": 1.0196369583763688e-08, + "loss": 0.399, + "step": 12446 + }, + { + "epoch": 0.99, + "learning_rate": 1.0080850333644698e-08, + "loss": 0.3021, + "step": 12447 + }, + { + "epoch": 0.99, + "learning_rate": 9.965988871633025e-09, + "loss": 0.3117, + "step": 12448 + }, + { + "epoch": 0.99, + "learning_rate": 9.851785205291508e-09, + "loss": 0.4609, + "step": 12449 + }, + { + "epoch": 0.99, + "learning_rate": 9.738239342141909e-09, + "loss": 0.446, + "step": 12450 + }, + { + "epoch": 0.99, + "learning_rate": 9.625351289658247e-09, + "loss": 0.3323, + "step": 12451 + }, + { + "epoch": 0.99, + "learning_rate": 9.513121055273467e-09, + "loss": 0.2897, + "step": 12452 + }, + { + "epoch": 0.99, + "learning_rate": 9.401548646380543e-09, + "loss": 0.3091, + "step": 12453 + }, + { + "epoch": 0.99, + "learning_rate": 9.290634070322491e-09, + "loss": 0.4003, + "step": 12454 + }, + { + "epoch": 0.99, + "learning_rate": 9.180377334404577e-09, + "loss": 0.1987, + "step": 12455 + }, + { + "epoch": 0.99, + "learning_rate": 9.070778445885442e-09, + "loss": 0.4143, + "step": 12456 + }, + { + "epoch": 0.99, + "learning_rate": 8.961837411982643e-09, + "loss": 0.3138, + "step": 12457 + }, + { + "epoch": 0.99, + "learning_rate": 8.853554239869333e-09, + "loss": 0.4325, + "step": 12458 + }, + { + "epoch": 0.99, + "learning_rate": 8.745928936675363e-09, + "loss": 0.4349, + "step": 12459 + }, + { + "epoch": 0.99, + "learning_rate": 8.638961509486177e-09, + "loss": 0.2921, + "step": 12460 + }, + { + "epoch": 0.99, + "learning_rate": 8.53265196534725e-09, + "loss": 0.2778, + "step": 12461 + }, + { + "epoch": 0.99, + "learning_rate": 8.427000311256317e-09, + "loss": 0.4513, + "step": 12462 + }, + { + "epoch": 0.99, + "learning_rate": 8.322006554171147e-09, + "loss": 0.2507, + "step": 12463 + }, + { + "epoch": 0.99, + "learning_rate": 8.217670701005098e-09, + "loss": 0.3415, + "step": 12464 + }, + { + "epoch": 0.99, + "learning_rate": 8.113992758628231e-09, + "loss": 0.3276, + "step": 12465 + }, + { + "epoch": 0.99, + "learning_rate": 8.010972733867306e-09, + "loss": 0.3055, + "step": 12466 + }, + { + "epoch": 0.99, + "learning_rate": 7.908610633504676e-09, + "loss": 0.372, + "step": 12467 + }, + { + "epoch": 0.99, + "learning_rate": 7.806906464281617e-09, + "loss": 0.3064, + "step": 12468 + }, + { + "epoch": 0.99, + "learning_rate": 7.70586023289388e-09, + "loss": 0.3051, + "step": 12469 + }, + { + "epoch": 0.99, + "learning_rate": 7.605471945996146e-09, + "loss": 0.3066, + "step": 12470 + }, + { + "epoch": 0.99, + "learning_rate": 7.50574161019757e-09, + "loss": 0.3397, + "step": 12471 + }, + { + "epoch": 0.99, + "learning_rate": 7.406669232065122e-09, + "loss": 0.376, + "step": 12472 + }, + { + "epoch": 0.99, + "learning_rate": 7.3082548181213635e-09, + "loss": 0.3996, + "step": 12473 + }, + { + "epoch": 0.99, + "learning_rate": 7.210498374848884e-09, + "loss": 0.381, + "step": 12474 + }, + { + "epoch": 0.99, + "learning_rate": 7.113399908681429e-09, + "loss": 0.3214, + "step": 12475 + }, + { + "epoch": 0.99, + "learning_rate": 7.016959426013881e-09, + "loss": 0.2364, + "step": 12476 + }, + { + "epoch": 0.99, + "learning_rate": 6.9211769331978265e-09, + "loss": 0.3409, + "step": 12477 + }, + { + "epoch": 0.99, + "learning_rate": 6.8260524365371115e-09, + "loss": 0.3773, + "step": 12478 + }, + { + "epoch": 0.99, + "learning_rate": 6.731585942297836e-09, + "loss": 0.4537, + "step": 12479 + }, + { + "epoch": 0.99, + "learning_rate": 6.637777456698358e-09, + "loss": 0.3293, + "step": 12480 + }, + { + "epoch": 0.99, + "learning_rate": 6.544626985915958e-09, + "loss": 0.3378, + "step": 12481 + }, + { + "epoch": 0.99, + "learning_rate": 6.45213453608573e-09, + "loss": 0.3524, + "step": 12482 + }, + { + "epoch": 0.99, + "learning_rate": 6.360300113295026e-09, + "loss": 0.3845, + "step": 12483 + }, + { + "epoch": 0.99, + "learning_rate": 6.269123723593451e-09, + "loss": 0.3039, + "step": 12484 + }, + { + "epoch": 0.99, + "learning_rate": 6.178605372982871e-09, + "loss": 0.2838, + "step": 12485 + }, + { + "epoch": 0.99, + "learning_rate": 6.088745067424073e-09, + "loss": 0.423, + "step": 12486 + }, + { + "epoch": 0.99, + "learning_rate": 5.9995428128334365e-09, + "loss": 0.34, + "step": 12487 + }, + { + "epoch": 0.99, + "learning_rate": 5.910998615085151e-09, + "loss": 0.3649, + "step": 12488 + }, + { + "epoch": 0.99, + "learning_rate": 5.8231124800089965e-09, + "loss": 0.3113, + "step": 12489 + }, + { + "epoch": 0.99, + "learning_rate": 5.735884413391457e-09, + "loss": 0.3674, + "step": 12490 + }, + { + "epoch": 0.99, + "learning_rate": 5.6493144209768255e-09, + "loss": 0.4484, + "step": 12491 + }, + { + "epoch": 0.99, + "learning_rate": 5.5634025084660985e-09, + "loss": 0.3713, + "step": 12492 + }, + { + "epoch": 0.99, + "learning_rate": 5.47814868151364e-09, + "loss": 0.2951, + "step": 12493 + }, + { + "epoch": 0.99, + "learning_rate": 5.393552945736069e-09, + "loss": 0.343, + "step": 12494 + }, + { + "epoch": 0.99, + "learning_rate": 5.309615306701155e-09, + "loss": 0.427, + "step": 12495 + }, + { + "epoch": 0.99, + "learning_rate": 5.226335769936697e-09, + "loss": 0.3856, + "step": 12496 + }, + { + "epoch": 0.99, + "learning_rate": 5.143714340926087e-09, + "loss": 0.3654, + "step": 12497 + }, + { + "epoch": 0.99, + "learning_rate": 5.0617510251105284e-09, + "loss": 0.4147, + "step": 12498 + }, + { + "epoch": 0.99, + "learning_rate": 4.980445827885705e-09, + "loss": 0.3495, + "step": 12499 + }, + { + "epoch": 0.99, + "learning_rate": 4.899798754605112e-09, + "loss": 0.3858, + "step": 12500 + }, + { + "epoch": 0.99, + "learning_rate": 4.819809810578946e-09, + "loss": 0.4444, + "step": 12501 + }, + { + "epoch": 0.99, + "learning_rate": 4.740479001076326e-09, + "loss": 0.333, + "step": 12502 + }, + { + "epoch": 0.99, + "learning_rate": 4.66180633131752e-09, + "loss": 0.3694, + "step": 12503 + }, + { + "epoch": 0.99, + "learning_rate": 4.583791806485049e-09, + "loss": 0.4066, + "step": 12504 + }, + { + "epoch": 0.99, + "learning_rate": 4.506435431714806e-09, + "loss": 0.4212, + "step": 12505 + }, + { + "epoch": 0.99, + "learning_rate": 4.429737212100493e-09, + "loss": 0.3487, + "step": 12506 + }, + { + "epoch": 0.99, + "learning_rate": 4.353697152692515e-09, + "loss": 0.3849, + "step": 12507 + }, + { + "epoch": 0.99, + "learning_rate": 4.278315258496868e-09, + "loss": 0.3703, + "step": 12508 + }, + { + "epoch": 0.99, + "learning_rate": 4.203591534478468e-09, + "loss": 0.4146, + "step": 12509 + }, + { + "epoch": 0.99, + "learning_rate": 4.129525985556715e-09, + "loss": 0.2678, + "step": 12510 + }, + { + "epoch": 0.99, + "learning_rate": 4.056118616608817e-09, + "loss": 0.3386, + "step": 12511 + }, + { + "epoch": 0.99, + "learning_rate": 3.9833694324686864e-09, + "loss": 0.3546, + "step": 12512 + }, + { + "epoch": 0.99, + "learning_rate": 3.9112784379247145e-09, + "loss": 0.5038, + "step": 12513 + }, + { + "epoch": 0.99, + "learning_rate": 3.839845637725326e-09, + "loss": 0.2828, + "step": 12514 + }, + { + "epoch": 0.99, + "learning_rate": 3.769071036573424e-09, + "loss": 0.3067, + "step": 12515 + }, + { + "epoch": 0.99, + "learning_rate": 3.698954639129726e-09, + "loss": 0.3475, + "step": 12516 + }, + { + "epoch": 0.99, + "learning_rate": 3.6294964500116492e-09, + "loss": 0.3959, + "step": 12517 + }, + { + "epoch": 0.99, + "learning_rate": 3.560696473789982e-09, + "loss": 0.3961, + "step": 12518 + }, + { + "epoch": 0.99, + "learning_rate": 3.4925547149977645e-09, + "loss": 0.4157, + "step": 12519 + }, + { + "epoch": 0.99, + "learning_rate": 3.425071178120298e-09, + "loss": 0.3912, + "step": 12520 + }, + { + "epoch": 0.99, + "learning_rate": 3.3582458676018058e-09, + "loss": 0.2732, + "step": 12521 + }, + { + "epoch": 0.99, + "learning_rate": 3.292078787842101e-09, + "loss": 0.3382, + "step": 12522 + }, + { + "epoch": 0.99, + "learning_rate": 3.226569943197699e-09, + "loss": 0.2733, + "step": 12523 + }, + { + "epoch": 0.99, + "learning_rate": 3.1617193379818167e-09, + "loss": 0.4054, + "step": 12524 + }, + { + "epoch": 0.99, + "learning_rate": 3.0975269764654816e-09, + "loss": 0.2913, + "step": 12525 + }, + { + "epoch": 0.99, + "learning_rate": 3.033992862875312e-09, + "loss": 0.428, + "step": 12526 + }, + { + "epoch": 0.99, + "learning_rate": 2.9711170013935196e-09, + "loss": 0.387, + "step": 12527 + }, + { + "epoch": 0.99, + "learning_rate": 2.9088993961612355e-09, + "loss": 0.3736, + "step": 12528 + }, + { + "epoch": 0.99, + "learning_rate": 2.8473400512762928e-09, + "loss": 0.3005, + "step": 12529 + }, + { + "epoch": 0.99, + "learning_rate": 2.7864389707887853e-09, + "loss": 0.3369, + "step": 12530 + }, + { + "epoch": 0.99, + "learning_rate": 2.726196158712169e-09, + "loss": 0.3069, + "step": 12531 + }, + { + "epoch": 0.99, + "learning_rate": 2.66661161901105e-09, + "loss": 0.3614, + "step": 12532 + }, + { + "epoch": 0.99, + "learning_rate": 2.607685355610068e-09, + "loss": 0.3253, + "step": 12533 + }, + { + "epoch": 0.99, + "learning_rate": 2.549417372388341e-09, + "loss": 0.4844, + "step": 12534 + }, + { + "epoch": 0.99, + "learning_rate": 2.4918076731828e-09, + "loss": 0.3283, + "step": 12535 + }, + { + "epoch": 0.99, + "learning_rate": 2.434856261785967e-09, + "loss": 0.2898, + "step": 12536 + }, + { + "epoch": 0.99, + "learning_rate": 2.378563141949286e-09, + "loss": 0.2564, + "step": 12537 + }, + { + "epoch": 0.99, + "learning_rate": 2.322928317378681e-09, + "loss": 0.2901, + "step": 12538 + }, + { + "epoch": 0.99, + "learning_rate": 2.267951791737888e-09, + "loss": 0.3123, + "step": 12539 + }, + { + "epoch": 0.99, + "learning_rate": 2.213633568646234e-09, + "loss": 0.4275, + "step": 12540 + }, + { + "epoch": 0.99, + "learning_rate": 2.1599736516808577e-09, + "loss": 0.2546, + "step": 12541 + }, + { + "epoch": 0.99, + "learning_rate": 2.106972044373379e-09, + "loss": 0.3233, + "step": 12542 + }, + { + "epoch": 0.99, + "learning_rate": 2.0546287502165583e-09, + "loss": 0.4461, + "step": 12543 + }, + { + "epoch": 0.99, + "learning_rate": 2.002943772654309e-09, + "loss": 0.3252, + "step": 12544 + }, + { + "epoch": 0.99, + "learning_rate": 1.951917115091684e-09, + "loss": 0.4288, + "step": 12545 + }, + { + "epoch": 0.99, + "learning_rate": 1.901548780887108e-09, + "loss": 0.3061, + "step": 12546 + }, + { + "epoch": 0.99, + "learning_rate": 1.851838773357928e-09, + "loss": 0.3566, + "step": 12547 + }, + { + "epoch": 0.99, + "learning_rate": 1.8027870957781912e-09, + "loss": 0.3798, + "step": 12548 + }, + { + "epoch": 0.99, + "learning_rate": 1.7543937513753161e-09, + "loss": 0.3491, + "step": 12549 + }, + { + "epoch": 0.99, + "learning_rate": 1.7066587433378634e-09, + "loss": 0.4012, + "step": 12550 + }, + { + "epoch": 0.99, + "learning_rate": 1.659582074807764e-09, + "loss": 0.3714, + "step": 12551 + }, + { + "epoch": 0.99, + "learning_rate": 1.6131637488858708e-09, + "loss": 0.327, + "step": 12552 + }, + { + "epoch": 0.99, + "learning_rate": 1.5674037686275178e-09, + "loss": 0.3279, + "step": 12553 + }, + { + "epoch": 0.99, + "learning_rate": 1.5223021370458502e-09, + "loss": 0.3626, + "step": 12554 + }, + { + "epoch": 0.99, + "learning_rate": 1.4778588571107144e-09, + "loss": 0.3642, + "step": 12555 + }, + { + "epoch": 0.99, + "learning_rate": 1.4340739317497688e-09, + "loss": 0.4269, + "step": 12556 + }, + { + "epoch": 0.99, + "learning_rate": 1.390947363845152e-09, + "loss": 0.5046, + "step": 12557 + }, + { + "epoch": 0.99, + "learning_rate": 1.3484791562357048e-09, + "loss": 0.3263, + "step": 12558 + }, + { + "epoch": 0.99, + "learning_rate": 1.3066693117191886e-09, + "loss": 0.4385, + "step": 12559 + }, + { + "epoch": 1.0, + "learning_rate": 1.2655178330467366e-09, + "loss": 0.3122, + "step": 12560 + }, + { + "epoch": 1.0, + "learning_rate": 1.2250247229295132e-09, + "loss": 0.3618, + "step": 12561 + }, + { + "epoch": 1.0, + "learning_rate": 1.185189984034274e-09, + "loss": 0.3676, + "step": 12562 + }, + { + "epoch": 1.0, + "learning_rate": 1.1460136189822556e-09, + "loss": 0.2376, + "step": 12563 + }, + { + "epoch": 1.0, + "learning_rate": 1.1074956303536165e-09, + "loss": 0.4167, + "step": 12564 + }, + { + "epoch": 1.0, + "learning_rate": 1.0696360206852162e-09, + "loss": 0.3419, + "step": 12565 + }, + { + "epoch": 1.0, + "learning_rate": 1.0324347924695055e-09, + "loss": 0.4047, + "step": 12566 + }, + { + "epoch": 1.0, + "learning_rate": 9.958919481556362e-10, + "loss": 0.2741, + "step": 12567 + }, + { + "epoch": 1.0, + "learning_rate": 9.600074901505718e-10, + "loss": 0.353, + "step": 12568 + }, + { + "epoch": 1.0, + "learning_rate": 9.24781420816867e-10, + "loss": 0.3367, + "step": 12569 + }, + { + "epoch": 1.0, + "learning_rate": 8.902137424726675e-10, + "loss": 0.3097, + "step": 12570 + }, + { + "epoch": 1.0, + "learning_rate": 8.56304457396151e-10, + "loss": 0.3515, + "step": 12571 + }, + { + "epoch": 1.0, + "learning_rate": 8.230535678188656e-10, + "loss": 0.317, + "step": 12572 + }, + { + "epoch": 1.0, + "learning_rate": 7.904610759312814e-10, + "loss": 0.3451, + "step": 12573 + }, + { + "epoch": 1.0, + "learning_rate": 7.585269838783494e-10, + "loss": 0.4171, + "step": 12574 + }, + { + "epoch": 1.0, + "learning_rate": 7.272512937628318e-10, + "loss": 0.3135, + "step": 12575 + }, + { + "epoch": 1.0, + "learning_rate": 6.966340076441924e-10, + "loss": 0.3872, + "step": 12576 + }, + { + "epoch": 1.0, + "learning_rate": 6.666751275385963e-10, + "loss": 0.2341, + "step": 12577 + }, + { + "epoch": 1.0, + "learning_rate": 6.3737465542002e-10, + "loss": 0.325, + "step": 12578 + }, + { + "epoch": 1.0, + "learning_rate": 6.087325932147003e-10, + "loss": 0.3125, + "step": 12579 + }, + { + "epoch": 1.0, + "learning_rate": 5.807489428111268e-10, + "loss": 0.3959, + "step": 12580 + }, + { + "epoch": 1.0, + "learning_rate": 5.534237060511594e-10, + "loss": 0.3242, + "step": 12581 + }, + { + "epoch": 1.0, + "learning_rate": 5.267568847344695e-10, + "loss": 0.294, + "step": 12582 + }, + { + "epoch": 1.0, + "learning_rate": 5.007484806152097e-10, + "loss": 0.4567, + "step": 12583 + }, + { + "epoch": 1.0, + "learning_rate": 4.753984954086743e-10, + "loss": 0.3379, + "step": 12584 + }, + { + "epoch": 1.0, + "learning_rate": 4.5070693078130834e-10, + "loss": 0.2175, + "step": 12585 + }, + { + "epoch": 1.0, + "learning_rate": 4.266737883606986e-10, + "loss": 0.3164, + "step": 12586 + }, + { + "epoch": 1.0, + "learning_rate": 4.0329906972780276e-10, + "loss": 0.3333, + "step": 12587 + }, + { + "epoch": 1.0, + "learning_rate": 3.805827764236103e-10, + "loss": 0.4057, + "step": 12588 + }, + { + "epoch": 1.0, + "learning_rate": 3.585249099435917e-10, + "loss": 0.4247, + "step": 12589 + }, + { + "epoch": 1.0, + "learning_rate": 3.3712547173769816e-10, + "loss": 0.4979, + "step": 12590 + }, + { + "epoch": 1.0, + "learning_rate": 3.163844632181334e-10, + "loss": 0.4358, + "step": 12591 + }, + { + "epoch": 1.0, + "learning_rate": 2.963018857493616e-10, + "loss": 0.3786, + "step": 12592 + }, + { + "epoch": 1.0, + "learning_rate": 2.7687774065254804e-10, + "loss": 0.3109, + "step": 12593 + }, + { + "epoch": 1.0, + "learning_rate": 2.581120292077799e-10, + "loss": 0.3399, + "step": 12594 + }, + { + "epoch": 1.0, + "learning_rate": 2.400047526518456e-10, + "loss": 0.4601, + "step": 12595 + }, + { + "epoch": 1.0, + "learning_rate": 2.2255591217490437e-10, + "loss": 0.4284, + "step": 12596 + }, + { + "epoch": 1.0, + "learning_rate": 2.057655089271471e-10, + "loss": 0.362, + "step": 12597 + }, + { + "epoch": 1.0, + "learning_rate": 1.8963354401324575e-10, + "loss": 0.4245, + "step": 12598 + }, + { + "epoch": 1.0, + "learning_rate": 1.74160018496794e-10, + "loss": 0.3849, + "step": 12599 + }, + { + "epoch": 1.0, + "learning_rate": 1.593449333947561e-10, + "loss": 0.3316, + "step": 12600 + }, + { + "epoch": 1.0, + "learning_rate": 1.4518828968523857e-10, + "loss": 0.3028, + "step": 12601 + }, + { + "epoch": 1.0, + "learning_rate": 1.3169008829749808e-10, + "loss": 0.3564, + "step": 12602 + }, + { + "epoch": 1.0, + "learning_rate": 1.1885033012193348e-10, + "loss": 0.262, + "step": 12603 + }, + { + "epoch": 1.0, + "learning_rate": 1.0666901600453473e-10, + "loss": 0.3091, + "step": 12604 + }, + { + "epoch": 1.0, + "learning_rate": 9.51461467457726e-11, + "loss": 0.4002, + "step": 12605 + }, + { + "epoch": 1.0, + "learning_rate": 8.428172310503968e-11, + "loss": 0.3488, + "step": 12606 + }, + { + "epoch": 1.0, + "learning_rate": 7.40757457984298e-11, + "loss": 0.3398, + "step": 12607 + }, + { + "epoch": 1.0, + "learning_rate": 6.452821549651766e-11, + "loss": 0.5005, + "step": 12608 + }, + { + "epoch": 1.0, + "learning_rate": 5.563913282990996e-11, + "loss": 0.4372, + "step": 12609 + }, + { + "epoch": 1.0, + "learning_rate": 4.7408498381473765e-11, + "loss": 0.4303, + "step": 12610 + }, + { + "epoch": 1.0, + "learning_rate": 3.983631269521837e-11, + "loss": 0.3557, + "step": 12611 + }, + { + "epoch": 1.0, + "learning_rate": 3.292257626963391e-11, + "loss": 0.35, + "step": 12612 + }, + { + "epoch": 1.0, + "learning_rate": 2.6667289557691378e-11, + "loss": 0.4285, + "step": 12613 + }, + { + "epoch": 1.0, + "learning_rate": 2.1070452974614187e-11, + "loss": 0.4084, + "step": 12614 + }, + { + "epoch": 1.0, + "learning_rate": 1.6132066886775932e-11, + "loss": 0.4266, + "step": 12615 + }, + { + "epoch": 1.0, + "learning_rate": 1.1852131619471963e-11, + "loss": 0.2784, + "step": 12616 + }, + { + "epoch": 1.0, + "learning_rate": 8.230647454698926e-12, + "loss": 0.416, + "step": 12617 + }, + { + "epoch": 1.0, + "learning_rate": 5.267614631154772e-12, + "loss": 0.4712, + "step": 12618 + }, + { + "epoch": 1.0, + "learning_rate": 2.9630333442387525e-12, + "loss": 0.3506, + "step": 12619 + }, + { + "epoch": 1.0, + "learning_rate": 1.3169037449412004e-12, + "loss": 0.476, + "step": 12620 + }, + { + "epoch": 1.0, + "learning_rate": 3.29225942063971e-13, + "loss": 0.4015, + "step": 12621 + }, + { + "epoch": 1.0, + "learning_rate": 0.0, + "loss": 0.3396, + "step": 12622 + }, + { + "epoch": 1.0, + "step": 12622, + "total_flos": 1.0198728881668096e+16, + "train_loss": 0.3764946734946799, + "train_runtime": 93134.7898, + "train_samples_per_second": 17.348, + "train_steps_per_second": 0.136 + } + ], + "logging_steps": 1.0, + "max_steps": 12622, + "num_input_tokens_seen": 0, + "num_train_epochs": 1, + "save_steps": 50000, + "total_flos": 1.0198728881668096e+16, + "train_batch_size": 2, + "trial_name": null, + "trial_params": null +} diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/README.md b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/README.md new file mode 100644 index 0000000000000000000000000000000000000000..bd59d328a8903f11f9d765cf25417b1f803fa4e9 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/README.md @@ -0,0 +1,202 @@ +--- +base_model: local_pretrained_llm/Meta-Llama-3.1-8B-Instruct +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.9.0 \ No newline at end of file diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/adapter_config.json b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..5d7680cb39c3b92dab96fd82e6af076361cbcc4b --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/adapter_config.json @@ -0,0 +1,46 @@ +{ + "alpha_pattern": {}, + "auto_mapping": null, + "base_model_name_or_path": "local_pretrained_llm/Meta-Llama-3.1-8B-Instruct", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 16, + "lora_dropout": 0.05, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 64, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "wh", + "output_projection", + "down_proj", + "up_proj", + "node_embedding", + "embed_gvp_input_features", + "wg", + "fc1", + "fc2", + "ws", + "out_proj", + "gate_proj", + "wv", + "mm_struc_projector", + "v_proj", + "k_proj", + "q_proj", + "o_proj", + "embed_confidence", + "embed_gvp_output" + ], + "task_type": "CAUSAL_LM", + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/adapter_model.safetensors b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..44b760164c9c2f7f1c6e60fec3abef10237a6643 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7aa00dedc205ff8207fbbbb6465ba0e8084bcdda7ea91fff447d4bd936f775a0 +size 377762600 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/README.md b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/README.md new file mode 100644 index 0000000000000000000000000000000000000000..bd59d328a8903f11f9d765cf25417b1f803fa4e9 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/README.md @@ -0,0 +1,202 @@ +--- +base_model: local_pretrained_llm/Meta-Llama-3.1-8B-Instruct +library_name: peft +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.9.0 \ No newline at end of file diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/adapter_config.json b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..1b66ec6d32884ed4398e48c02cce717f72294412 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/adapter_config.json @@ -0,0 +1,46 @@ +{ + "alpha_pattern": {}, + "auto_mapping": null, + "base_model_name_or_path": "local_pretrained_llm/Meta-Llama-3.1-8B-Instruct", + "bias": "none", + "fan_in_fan_out": false, + "inference_mode": true, + "init_lora_weights": true, + "layers_pattern": null, + "layers_to_transform": null, + "loftq_config": {}, + "lora_alpha": 16, + "lora_dropout": 0.05, + "megatron_config": null, + "megatron_core": "megatron.core", + "modules_to_save": null, + "peft_type": "LORA", + "r": 64, + "rank_pattern": {}, + "revision": null, + "target_modules": [ + "wv", + "fc1", + "v_proj", + "gate_proj", + "ws", + "embed_confidence", + "output_projection", + "node_embedding", + "down_proj", + "mm_struc_projector", + "wg", + "embed_gvp_output", + "out_proj", + "q_proj", + "embed_gvp_input_features", + "up_proj", + "o_proj", + "k_proj", + "fc2", + "wh" + ], + "task_type": "CAUSAL_LM", + "use_dora": false, + "use_rslora": false +} \ No newline at end of file diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/adapter_model.safetensors b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..44b760164c9c2f7f1c6e60fec3abef10237a6643 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7aa00dedc205ff8207fbbbb6465ba0e8084bcdda7ea91fff447d4bd936f775a0 +size 377762600 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ae187af0acd6244e379aa2a9ab226e16944d10f --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd016b3a6b4aedab3b3f59ffd9ceb18394fbf653a08bd6c89f6cb3406bbb1779 +size 70808560 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0820252df637a1cd5b2d53953c9e53c00b1f0b8 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff31bf7bf6b945019daadbacde99ac803b5a4d49d18e16d38e1115ba23da1fb9 +size 70808568 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9642abd47ab8a136b6a1b9f6c7ba648d7ade466 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f1b30ee4f699e075bfc7ec995d6d0dd54b220b99735f26097e29bcda9da7035 +size 70808568 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..595842c5f8c8180e48274c45b28b7c82bc99ed6a --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7197783a899f74b6c3806adc441d19385cf7210b29cd6616a1f95d04653a88ce +size 70808568 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0cd333677e675117d711d3b118c5d667bcf8ff5 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5572866a0d2ea915f6f73e608a4752672c98a34af1804becabd9e0500f495c2b +size 70808568 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..295319d9a2db0177fc5fa2d075ef69efa8093dc6 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86493d85aee50bcccf5295669edb6ad0bea990f3dc7b43808b4765b6b6cc0f10 +size 70808568 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77e0b8a300aa9ae5c9bc861128fd41e636040358 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad7fe647dab126df5b0c91bf109b0c299e80c02b4d040c6e8480dae2673c58ca +size 70808568 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..75bd30558cf0d80f458dcefaf9ceca36e9ba22b9 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab5aa64ed65ee004d40e1de2de3474d1c866afda2f56a103c1682327aa9b8d1d +size 70808568 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d4386fb42b0c8b90e28a83a2aca1be92995b8af --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2c167edbb231fd6f91ff8078f9f7fe042ef8ca187298adefb6cefae06c66fee +size 70808568 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a417dd803ef44aa1851b490d6b79eeaf1b4f1661 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6907aec8b135edaee144dfd2a0fc798fe209340a5fd498fb4c2719b1bb1d291 +size 70808568 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d16eebbdbe3e136df864a7e6a465ec764600fb54 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a41d13691174e9e501cbef896d7d77b3a9bd528d117859d74a7cc34eb223ebd4 +size 70808568 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa9122f160b70b54a001d3f63ac7d22298d079e8 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21ad3601a7190135a02ebc1fa69cf06c0710f9dad6923c360d7129d3abdbfcb2 +size 70808560 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eed6d0498f3c8747fa21dd58e1b4c32cdaaf0962 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aac32a1b705912af0cef462ab16e19c6606335d4f0b9ea19dc4359963774ced +size 70808568 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..03b60780baae40070bf5c1d57b39726dc793973f --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b48e76c73d5174a21787a304fc3a54d937196e96241f805f39d585a1ecfb9f9f +size 70808568 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..80219cbcc794feca3dbf33e7ff778e12a4e5897b --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae329426755521e0c49e03b06ccd080519117f14eb51f92345c908468caa67a4 +size 70808568 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..97e87cadd11523c5b0727bbddc586c54802122a6 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ddf6b1f04b520614556f94302500e4bea13c68e3aeee4eceee218c4cf837014 +size 70808568 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..01f1e67d98d4ef8ef8a2db4596d7e8c26e5bcf2d --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:808b1332e5d4adcbe4a7d228d2070503888b5955241d2d0f306fe73cc75f6ef6 +size 70808568 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d31288a7fcc25fcb0eb6524ef000feb71328bcc --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc7fe6019ecd16a47e4c811003bac328e79adcca925515a6d849330b191ae45a +size 70808568 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..93bbd3bb15bd48e4c653718c524052cedcbebdab --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cb53851308f22822d0b64e0de6bb313e22db4a50af4c1966ef4990e4330997a +size 70808568 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..166a3b39e6c6d304d163fc43bd5e92e2a7e2aec6 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33775ef22021bed50b588e8513b532da91c29d952a7be653e3b5e99897552d94 +size 70808568 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1730fa1e32f68bfeccb9e553c2388bf93444b96 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3676054eddaf4e174c4b7c031eb94fdaa1176c4d0478befe53f5d2c75ed252a +size 70808568 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..badef57727d7ce49ef40cb1d46e77718829111e1 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24d5df982d6c702aeb077efea5717d92aeb46ef4b952b79101af751c771a2ff6 +size 70808568 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e797f9b74f5facb5c99b5c7418c2214e17b1c4c --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee3a07fdd76de61b2c77d2c7c352c40f7795bc90de331913029043dd6f65f165 +size 70808560 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..829577154d106877a327cbbd92493afd2462c808 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:558b7939e9df54715ee7ca512ebdbc1175753b0454afab684bdb2beb1ae58715 +size 70808568 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cffe7f3979bd2e37cb6503b7870f2799dae4bf53 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e956faaeafd7e2435a62e84c977f0a24f54aaf0e23c18d5e1df4921309a61a8d +size 70808568 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6abdce057f631e45feceb0f764c6cba308b4fe25 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fd191f4e0ab249146132d093959da36955f237d92521ab78cceceec7010510a +size 70808560 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..810f576971c19ffb448bce3e4e0b5e19c74d39e2 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4648cebd15c553a0f47f1fc380642aa0125a3a648c6d0ff9c6fd7af75974f8a1 +size 70808560 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..82492b60dbe6370bf86fb2c7fd7a8cf7ed991980 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43921b75196bf449e1be93300eac8cc8785769833b4458ccf1d64a2ea79bf7b1 +size 70808560 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fd141c94179d1340f8b357ee837213548fcdda2 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:463b8706ae2c0e24383242c62a01e9ec7395ea5e5d7a65984d122d7e61b09201 +size 70808560 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29d6e4bc55365dae6a759484d6cf20027f897a7a --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:daf910e1014415ede3da803d1080fa630a662114dd0b26a20bae0757868ae166 +size 70808560 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c237e464ada7da9a7123835e93bc7a3184b0dbdc --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:977f467df4c42b3625f310901f3c7beabdc55a15e6da5625f3ed9a9bfcb31549 +size 70808560 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be81f76d35915d95645d7e94bbde5de90fd3d18d --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f628e9124b21ecc3dafb6da3ed41a3d452334be35b5996ae364fdfc801eabe95 +size 70808560 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_0_mp_rank_00_model_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_0_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..59dedd5644cce167dc754653826c8cf765226868 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_0_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1aea9402564469c22d6190d6105d4813b4f52808cc747cdc25cfcde99ed53897 +size 1045095 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_10_mp_rank_00_model_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_10_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1de7e6e14a88047a583352f0a373fa014a4136d0 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_10_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8e867af97010b9cd10d360a1dedeb9b40c58ea9fd0e55bf55915e337b7a4a68 +size 1046008 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_11_mp_rank_00_model_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_11_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4274c0ada414dba6b67f6ddf87bc8ea2149601b --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_11_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e29ed3b08206b74bcc07bdefdd3ce8c27630faa35407189afe3be1a4d5b9afc1 +size 1046008 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_12_mp_rank_00_model_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_12_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b60918030717b2dbe4b87058077269f6a1c98a35 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_12_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aad20c7f45073befe83fee8bba9263fde1fb2a5986ae192eb0e7843d7150aaf8 +size 1046008 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_13_mp_rank_00_model_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_13_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6aec3ff827c68b84d252c3e13c0a5ced4302736 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_13_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2ca20f348c7482dc9cde9cfe878df11a80e6f86cff404a0e0610a8b1afe4766 +size 1046008 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_14_mp_rank_00_model_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_14_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6eafc05541cd0744c1112d8dc8a9f2dfc976eb1 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_14_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da649e02c9b3b7d7c1c4e419ba55a11c242f47dad18c0a191d98313157fb7934 +size 1046008 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_15_mp_rank_00_model_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_15_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f16e2378fef2ce51b69e711e64409f5fa785631f --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_15_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da6290296df1af6b2a03dba02d6f482d671f18a304a144888b49dc65a6bc3a22 +size 1046008 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_16_mp_rank_00_model_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_16_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..974af522fa160f6718853f1fc79fd19d567c61a9 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_16_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a58581cc1fd9e8402f315cf02ffb7459603b4e657a64ca241be885efacf68f48 +size 1046008 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_17_mp_rank_00_model_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_17_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..52e87b3b4c7f38db0d2be561740f788fc770871c --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_17_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dd8482387abc342730bb9a4f03b32eef424a4a9f92166b045828f512fbc75d0 +size 1046008 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_18_mp_rank_00_model_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_18_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12d6cacd460fce233a8d9a89e88f6d8004695f79 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_18_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d81a4ab2c9f47a5ed81921664463c9b26a98d3616412ed699b479b0247de9ec8 +size 1046008 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_19_mp_rank_00_model_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_19_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..974dc5dc3978add2d0125b21d93c09f1f6f314f8 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_19_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9efc91cc7e72d98ead36ae1d97e704765939829e84f743606cebfeb1ee2d26b +size 1046008 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_1_mp_rank_00_model_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_1_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f23f474ef1959c600534ce8a41063e926e909e66 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_1_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8e9679e71b6c2aa6a8071106f16433b6790ca27c360c3913b168bcfdc1f860d +size 1045095 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_20_mp_rank_00_model_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_20_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..66bb2ee7928ee76b754d697e67c24d575353d155 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_20_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7df94c6da3f2b7c276275fbfb6cdd8d28e2de42a061451047e86c8e3685ca8d +size 1046008 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_21_mp_rank_00_model_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_21_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..174dff9b6bc7a2509879d18a31fadd0eeb79ff5e --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_21_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e4404052573d57a74878656d767614503aaa56de824b46e351c6e7f09af292b +size 1046008 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_22_mp_rank_00_model_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_22_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8aefb003a44a029be6974ec6d882b5bcddcf764 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_22_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fde5ffdd60b3fac18771a5545383922ec784360519220be5edeb1cb79b75e3e0 +size 1046008 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_23_mp_rank_00_model_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_23_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e49cd31039e520e2ebcaf752e4b148f17fed5dfb --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_23_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f99326afd4b32bac05b7cc39627f18a4dee36ccd0cb7b2e48bd527e26e7825ad +size 1046008 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_24_mp_rank_00_model_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_24_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..540c565ef8183a9f769b981f431af60a19f21ab2 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_24_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c1ff7138d79b59640e08d20c2c9b905963f6d8bfbfb1e81b5976bcf116929a7 +size 1046008 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_25_mp_rank_00_model_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_25_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4923323340fdd04b9630b3d3212d1044b13b15a --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_25_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a35f371007097defcb585a371997458917f75f907b97e9de363588f3552657c1 +size 1046008 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_26_mp_rank_00_model_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_26_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc8363f5c20f063ab88b3b672f22bf103dd276df --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_26_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4679f5888535eddc91ede85a985d6fe76884649789ff5947903154da2c5e827f +size 1046008 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_27_mp_rank_00_model_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_27_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..807fd3fc0d3a786740f89cd0c0da88febefea904 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_27_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ca284d698323501714e82fbf099fbbe407770e6a322d9ea4e17ff41b9d78de9 +size 1046008 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_28_mp_rank_00_model_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_28_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3cba443eb0a27bb8ff16ce7ef0ed39062d2fb099 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_28_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f90f987274c348e61c06fabf32520661fac4ddc6d7b5db4549539ec64e0feb7 +size 1046008 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_29_mp_rank_00_model_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_29_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dedae10518a348172ded877f4fe40951b7e060ed --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_29_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af88c336cd6cd5d298aedd43237910de2779babc1cd152d98b9c34d68069825c +size 1046008 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_2_mp_rank_00_model_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_2_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bd98d80802818aadf3faee18801196b897d6da3 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_2_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4ded8608cc6754761740f26494895c2d0e89fc8e78698847795eade9b163caf +size 1045095 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_30_mp_rank_00_model_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_30_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8325697fa5e31ae6abe0c1a0a20c198645df132 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_30_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c25be5ec8fe8c0e346f067a2fd8af73ee7721414e4cfc87fd71f1e1546f5e0d +size 1046008 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_31_mp_rank_00_model_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_31_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd7fb18137371f0f8db1c5d78d4b288d724a1411 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_31_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a55d7484d6348825c5d2dd8bef2d7f8da0a8f208c7595dd171b191f9a8735a16 +size 1046008 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_3_mp_rank_00_model_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_3_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4eaf4f39209e5ee126218d8f373aa43918a054c5 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_3_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da997fccf95c2f302d08528f21e6a96e26388da1fee7fd011b867839d442330f +size 1045095 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_4_mp_rank_00_model_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_4_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..854c9ec0018bc0ff82d436b2e0fe9b8dbe2def40 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_4_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e51a5e2ac327dd67ac3deabd2f341c4c49231fed120f12a52420a45b159d8724 +size 1045095 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_5_mp_rank_00_model_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_5_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b4d8eabc04fa17eb2113184062df80ae1a90be9 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_5_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d53753fc443d6cd1fa747ec516197307e61eadc263d06a1366c2e03c6ad75a22 +size 1045095 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_6_mp_rank_00_model_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_6_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f57c77d7f8a90b17d280b4ff752ff79c18ad6ea --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_6_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16765ed61e9a74fb15574a6ac1a74e075ac7ecbf6eec19cd4ac179ddf229709b +size 1045095 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_7_mp_rank_00_model_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_7_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9648b9df6d4b0809927a44f58f7ed5583a473555 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_7_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6be1d58ff0270e7b5950c1bb9ba40786c7c325d28e38673336ba7aba8e734d1 +size 1045095 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_8_mp_rank_00_model_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_8_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8246e4f9abbd97dd0fbbea006d0b080216c6c158 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_8_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42f2843692d893221a3c1c12d44d978a9d7f63ef6dbed63353b87f0dd9bf406f +size 1045095 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_9_mp_rank_00_model_states.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_9_mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..03c89dddfabf241e9b5b74cef12838f413cd8a70 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/global_step12527/zero_pp_rank_9_mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4feae29a5ee3b0cf04f4c23978cff20640dd1038018125458d052863b84ead2a +size 1045095 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/latest b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/latest new file mode 100644 index 0000000000000000000000000000000000000000..0db5e4b47ba74ec6debb8a87853841eba0b6b6e6 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/latest @@ -0,0 +1 @@ +global_step12527 \ No newline at end of file diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_0.pth b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_0.pth new file mode 100644 index 0000000000000000000000000000000000000000..bb7ccc282b13ed451f3e9a050418306e5b539aa2 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_0.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f9393950a0822ecc99dedcc6e65daf93cdc278c2bc2488f271f132354279914 +size 14512 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_1.pth b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_1.pth new file mode 100644 index 0000000000000000000000000000000000000000..29134b6b6efec746904e038d3aae52f25e9ea0b6 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_1.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9fee5d669b8e2dc6cff4d9dd1a9f7211bd3980bb40141024c40c35cce4cbf56 +size 14512 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_10.pth b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_10.pth new file mode 100644 index 0000000000000000000000000000000000000000..47e541bdfc268c93aa8f9b61e59f8893d67449ed --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_10.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be8429e3b8860adff6b20811914d2116e91681a3e7aa7b44bce7c270d7edd4d9 +size 14519 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_11.pth b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_11.pth new file mode 100644 index 0000000000000000000000000000000000000000..d64831964c3a04a75d7b88625ee0412c5d842eb5 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_11.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c2fec8cfd3c6e4c63c27d990bc9e26315391d61ffc8c251551459f8e8e5b4cc +size 14519 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_12.pth b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_12.pth new file mode 100644 index 0000000000000000000000000000000000000000..85f296261a3b03fa798a1ebc27c10afa27ccbf9c --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_12.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19f6941025f78bd69ac010ec42fbab6a14145a4e8a6de258904a1e56f92530f6 +size 14519 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_13.pth b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_13.pth new file mode 100644 index 0000000000000000000000000000000000000000..5a992b0325f1b126c3fe02aa2a66f2cce51a32d2 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_13.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fae1bbc85497a05eefc3e6fb2d4be77c357d21d5b892f17f39863401de2f6576 +size 14519 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_14.pth b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_14.pth new file mode 100644 index 0000000000000000000000000000000000000000..85e20f7d550d54c78b6fb73e44e475b8c68a1755 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_14.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ba464d4155f26b60c036aca0d4c1a65b69592dda06db143400eed5be811a6b5 +size 14519 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_15.pth b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_15.pth new file mode 100644 index 0000000000000000000000000000000000000000..0c6e841eeb3e1ae2fb9b367d1814758c62408091 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_15.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d55b78e28bea3185e2937b30091edb98cb1caec381efefc91b2196709ec25336 +size 14519 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_16.pth b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_16.pth new file mode 100644 index 0000000000000000000000000000000000000000..a3fda621e11888265ced4316a14e1a95e3f52caa --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_16.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3856c56dfa8f5b76bcf1f5c7db9ff1deb7c319969fb9fd40e5acd3f8b659cd9 +size 14519 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_17.pth b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_17.pth new file mode 100644 index 0000000000000000000000000000000000000000..c696c96f3746c3d344d9ccb126b5a674e7aab22b --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_17.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d46a096b348af95bb392ca83b6c8eaa94e25bc0eab4e012b5c9a9118fb8b0617 +size 14519 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_18.pth b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_18.pth new file mode 100644 index 0000000000000000000000000000000000000000..9017eb0ba44c4930b07c07c7b19f10b80fa4bcdf --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_18.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3548e6a3924d55c42670275f71065a6bae5b8b5e2f276928be0495843ebd9ef +size 14519 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_19.pth b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_19.pth new file mode 100644 index 0000000000000000000000000000000000000000..136d6e084bfafa58798d64e61ec11f07043dcb1f --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_19.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a561f33ee91b982f55e1b49767a2d57383e98375d25a3b192afac5d713303aa0 +size 14519 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_2.pth b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_2.pth new file mode 100644 index 0000000000000000000000000000000000000000..7f8d0b7772d0e23d61d3050068356f318341a457 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_2.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:143808c42405217219d510eaaf8fde9016f9a21b41a6a7b21b299d147944db5e +size 14512 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_20.pth b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_20.pth new file mode 100644 index 0000000000000000000000000000000000000000..054b71d010589da498cfcc5b84840af1b3deed11 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_20.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c1aeef4fe88d4fa46a2d93d4f926c9dc723c0bb444d778b5f04b7f510a8d221 +size 14519 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_21.pth b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_21.pth new file mode 100644 index 0000000000000000000000000000000000000000..df86290418435849c96b147e33cd62df0e699de0 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_21.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6942e01ea1514f343ad03aac5a8ba8d0f4412e98b99852f5afc5f239765cbbdc +size 14519 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_22.pth b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_22.pth new file mode 100644 index 0000000000000000000000000000000000000000..1fa6f59b5949ab66334569ac0ed56795a02e08bb --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_22.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb409154b9b2f999f3aae4ba32a769dcc797bdb4028dc5adbd31b3cf60503ae0 +size 14519 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_23.pth b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_23.pth new file mode 100644 index 0000000000000000000000000000000000000000..697fd20b3057d61ed786495533b055f0f565bb3c --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_23.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab8223af18e9ff50707d422b6686a6a87e932507e288eb35dc99b28673bb8599 +size 14519 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_24.pth b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_24.pth new file mode 100644 index 0000000000000000000000000000000000000000..8ed231e586a920bf4bd35e8dcfefb0bf680d5a47 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_24.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61e9013510a8165e9e1f0ad33c7d60e7f1e94ccb157214f103947e1ec3821f4d +size 14519 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_25.pth b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_25.pth new file mode 100644 index 0000000000000000000000000000000000000000..6561f4b425ea366abf77344d9cc9fb038ea029db --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_25.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33c13b4322e7c8de348c4d82985eed158cc0e1eb0f3ce758bf39ed86948e195f +size 14519 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_26.pth b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_26.pth new file mode 100644 index 0000000000000000000000000000000000000000..95abc3e3836f302ab05e79fd3575aace65ca8165 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_26.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a0e5dc8810e0991c3749a067fdad27a393c4c269060bcb120c5ddeb8b76965f +size 14519 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_27.pth b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_27.pth new file mode 100644 index 0000000000000000000000000000000000000000..afc1628ccb1f2165b61a27b1ded3efad15d3189e --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_27.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1303ac764228b0ea9c57ee1558302b3bcb299add12dd9f477a17fad6a2faef37 +size 14519 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_28.pth b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_28.pth new file mode 100644 index 0000000000000000000000000000000000000000..cd49407900cbb18eeeb687304d4f8f87e8bcee0a --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_28.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cb60ca009a3ef6f21820251120e6640429ff1f576b0afe1c036410c01fd7ed3 +size 14519 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_29.pth b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_29.pth new file mode 100644 index 0000000000000000000000000000000000000000..d351daf2cd1df7baba4af94c30d2f647c45d703b --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_29.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5824ffd8b3d661602b2779ef2f3aede289b0726001d64df5c10ad8a4c768e0ca +size 14519 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_3.pth b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_3.pth new file mode 100644 index 0000000000000000000000000000000000000000..eea85473b2e266f36807fcd679f40347d8f7d889 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_3.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84bfb8b6d3426f80f5405b3e4f10951da80728b3e577d83e8d57a5350699b590 +size 14512 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_30.pth b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_30.pth new file mode 100644 index 0000000000000000000000000000000000000000..dec4fce0df4df4263639221f85bd40401b926980 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_30.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c4f4405c89f0cde8a73c677eeba9f12a8bf359f48deec3bfd5540e69c149072 +size 14519 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_31.pth b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_31.pth new file mode 100644 index 0000000000000000000000000000000000000000..c0a3efd2db2ba05fd8b268ab9129386cac90d77b --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_31.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae12b492f42b2af21501fffa199275958e75965f0854f48cb320335222aa86bf +size 14519 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_4.pth b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_4.pth new file mode 100644 index 0000000000000000000000000000000000000000..98673710e4279b7f9b47234aa7cdda77f560f906 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40aca054c93eca713c9a4a4ede576d39727f04141c29e12b28b6332c34504255 +size 14512 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_5.pth b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_5.pth new file mode 100644 index 0000000000000000000000000000000000000000..207b7fc7f88fed3be7a5633b61bea20f776b58d2 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_5.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f259f9c75e45242b9c9f58de7ed7c3eeb46c32aa2817580e50d7788909f5c5d5 +size 14512 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_6.pth b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_6.pth new file mode 100644 index 0000000000000000000000000000000000000000..d7d627572907838d768322ab57c6bab43a5c1ea5 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_6.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28b9a394abb99bdde5c04cd18363d7b2ff3fa1051580e2aa1972131ce936fa7c +size 14512 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_7.pth b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_7.pth new file mode 100644 index 0000000000000000000000000000000000000000..b5047801db351402c9168c3d92f500e80ecfd8ab --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_7.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8910c06f8a514b6475702b9fddd5cd11af67a99dd45e8c140dbda3d497102ec9 +size 14512 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_8.pth b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_8.pth new file mode 100644 index 0000000000000000000000000000000000000000..fb68ba8d6468458166f1f72dd7f1936dcad253b5 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_8.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d758dad501842b397a01297f2a3cf878354d74b7addee65318e727b40ff83d19 +size 14512 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_9.pth b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_9.pth new file mode 100644 index 0000000000000000000000000000000000000000..42591970042a51ba7f009c586624c4eb8926def8 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/rng_state_9.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ea9cbaa5564948ed33a9566c891841c2329ee1c7a37d12d95c16958558849ce +size 14512 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/scheduler.pt b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..305f34d79a32cd3598e3350532f840c6c24a4b1f --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ee82098380db97f0414b19b55c3d4d4cdb2d5cf1e33e7c4a5bd8a57b034044f +size 1064 diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/special_tokens_map.json b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..b43be96621d147110fb8a18b5776ec6e38516127 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/special_tokens_map.json @@ -0,0 +1,17 @@ +{ + "bos_token": { + "content": "<|begin_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "eos_token": { + "content": "<|eot_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "pad_token": "<|eot_id|>" +} diff --git a/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/tokenizer.json b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..5cc5f00a5b203e90a27a3bd60d1ec393b07971e8 --- /dev/null +++ b/pannot-Meta-Llama-3.1-8B-Instruct-finetune-lora-v02/checkpoint-12527/tokenizer.json @@ -0,0 +1,410563 @@ +{ + "version": "1.0", + "truncation": null, + "padding": null, + "added_tokens": [ + { + "id": 128000, + "content": "<|begin_of_text|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128001, + "content": "<|end_of_text|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128002, + "content": "<|reserved_special_token_0|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128003, + "content": "<|reserved_special_token_1|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128004, + "content": "<|finetune_right_pad_id|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128005, + "content": "<|reserved_special_token_2|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128006, + "content": "<|start_header_id|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128007, + "content": "<|end_header_id|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128008, + "content": "<|eom_id|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128009, + "content": "<|eot_id|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128010, + "content": "<|python_tag|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128011, + "content": "<|reserved_special_token_3|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128012, + "content": "<|reserved_special_token_4|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128013, + "content": "<|reserved_special_token_5|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128014, + "content": "<|reserved_special_token_6|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128015, + "content": "<|reserved_special_token_7|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128016, + "content": "<|reserved_special_token_8|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128017, + "content": "<|reserved_special_token_9|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128018, + "content": "<|reserved_special_token_10|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128019, + "content": "<|reserved_special_token_11|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128020, + "content": "<|reserved_special_token_12|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128021, + "content": "<|reserved_special_token_13|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128022, + "content": "<|reserved_special_token_14|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128023, + "content": "<|reserved_special_token_15|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128024, + "content": "<|reserved_special_token_16|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128025, + "content": "<|reserved_special_token_17|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128026, + "content": "<|reserved_special_token_18|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128027, + "content": "<|reserved_special_token_19|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128028, + "content": "<|reserved_special_token_20|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128029, + "content": "<|reserved_special_token_21|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128030, + "content": "<|reserved_special_token_22|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128031, + "content": "<|reserved_special_token_23|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128032, + "content": "<|reserved_special_token_24|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128033, + "content": "<|reserved_special_token_25|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128034, + "content": "<|reserved_special_token_26|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128035, + "content": "<|reserved_special_token_27|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128036, + "content": "<|reserved_special_token_28|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128037, + "content": "<|reserved_special_token_29|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128038, + "content": "<|reserved_special_token_30|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128039, + "content": "<|reserved_special_token_31|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128040, + "content": "<|reserved_special_token_32|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128041, + "content": "<|reserved_special_token_33|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128042, + "content": "<|reserved_special_token_34|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128043, + "content": "<|reserved_special_token_35|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128044, + "content": "<|reserved_special_token_36|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128045, + "content": "<|reserved_special_token_37|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128046, + "content": "<|reserved_special_token_38|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128047, + "content": "<|reserved_special_token_39|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128048, + "content": "<|reserved_special_token_40|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128049, + "content": "<|reserved_special_token_41|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128050, + "content": "<|reserved_special_token_42|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128051, + "content": "<|reserved_special_token_43|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128052, + "content": "<|reserved_special_token_44|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128053, + "content": "<|reserved_special_token_45|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128054, + "content": "<|reserved_special_token_46|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128055, + "content": "<|reserved_special_token_47|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128056, + "content": "<|reserved_special_token_48|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128057, + "content": "<|reserved_special_token_49|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128058, + "content": "<|reserved_special_token_50|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128059, + "content": "<|reserved_special_token_51|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128060, + "content": "<|reserved_special_token_52|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128061, + "content": "<|reserved_special_token_53|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128062, + "content": "<|reserved_special_token_54|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128063, + "content": "<|reserved_special_token_55|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128064, + "content": "<|reserved_special_token_56|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128065, + "content": "<|reserved_special_token_57|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128066, + "content": "<|reserved_special_token_58|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128067, + "content": "<|reserved_special_token_59|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128068, + "content": "<|reserved_special_token_60|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128069, + "content": "<|reserved_special_token_61|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128070, + "content": "<|reserved_special_token_62|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128071, + "content": "<|reserved_special_token_63|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128072, + "content": "<|reserved_special_token_64|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128073, + "content": "<|reserved_special_token_65|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128074, + "content": "<|reserved_special_token_66|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128075, + "content": "<|reserved_special_token_67|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128076, + "content": "<|reserved_special_token_68|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128077, + "content": "<|reserved_special_token_69|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128078, + "content": "<|reserved_special_token_70|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128079, + "content": "<|reserved_special_token_71|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128080, + "content": "<|reserved_special_token_72|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128081, + "content": "<|reserved_special_token_73|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128082, + "content": "<|reserved_special_token_74|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128083, + "content": "<|reserved_special_token_75|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128084, + "content": "<|reserved_special_token_76|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128085, + "content": "<|reserved_special_token_77|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128086, + "content": "<|reserved_special_token_78|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128087, + "content": "<|reserved_special_token_79|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128088, + "content": "<|reserved_special_token_80|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128089, + "content": "<|reserved_special_token_81|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128090, + "content": "<|reserved_special_token_82|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128091, + "content": "<|reserved_special_token_83|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128092, + "content": "<|reserved_special_token_84|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128093, + "content": "<|reserved_special_token_85|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128094, + "content": "<|reserved_special_token_86|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128095, + "content": "<|reserved_special_token_87|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128096, + "content": "<|reserved_special_token_88|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128097, + "content": "<|reserved_special_token_89|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128098, + "content": "<|reserved_special_token_90|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128099, + "content": "<|reserved_special_token_91|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128100, + "content": "<|reserved_special_token_92|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128101, + "content": "<|reserved_special_token_93|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128102, + "content": "<|reserved_special_token_94|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128103, + "content": "<|reserved_special_token_95|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128104, + "content": "<|reserved_special_token_96|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128105, + "content": "<|reserved_special_token_97|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128106, + "content": "<|reserved_special_token_98|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128107, + "content": "<|reserved_special_token_99|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128108, + "content": "<|reserved_special_token_100|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128109, + "content": "<|reserved_special_token_101|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128110, + "content": "<|reserved_special_token_102|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128111, + "content": "<|reserved_special_token_103|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128112, + "content": "<|reserved_special_token_104|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128113, + "content": "<|reserved_special_token_105|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128114, + "content": "<|reserved_special_token_106|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128115, + "content": "<|reserved_special_token_107|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128116, + "content": "<|reserved_special_token_108|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128117, + "content": "<|reserved_special_token_109|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128118, + "content": "<|reserved_special_token_110|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128119, + "content": "<|reserved_special_token_111|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128120, + "content": "<|reserved_special_token_112|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128121, + "content": "<|reserved_special_token_113|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128122, + "content": "<|reserved_special_token_114|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128123, + "content": "<|reserved_special_token_115|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128124, + "content": "<|reserved_special_token_116|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128125, + "content": "<|reserved_special_token_117|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128126, + "content": "<|reserved_special_token_118|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128127, + "content": "<|reserved_special_token_119|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128128, + "content": "<|reserved_special_token_120|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128129, + "content": "<|reserved_special_token_121|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128130, + "content": "<|reserved_special_token_122|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128131, + "content": "<|reserved_special_token_123|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128132, + "content": "<|reserved_special_token_124|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128133, + "content": "<|reserved_special_token_125|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128134, + "content": "<|reserved_special_token_126|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128135, + "content": "<|reserved_special_token_127|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128136, + "content": "<|reserved_special_token_128|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128137, + "content": "<|reserved_special_token_129|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128138, + "content": "<|reserved_special_token_130|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128139, + "content": "<|reserved_special_token_131|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128140, + "content": "<|reserved_special_token_132|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128141, + "content": "<|reserved_special_token_133|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128142, + "content": "<|reserved_special_token_134|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128143, + "content": "<|reserved_special_token_135|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128144, + "content": "<|reserved_special_token_136|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128145, + "content": "<|reserved_special_token_137|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128146, + "content": "<|reserved_special_token_138|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128147, + "content": "<|reserved_special_token_139|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128148, + "content": "<|reserved_special_token_140|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128149, + "content": "<|reserved_special_token_141|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128150, + "content": "<|reserved_special_token_142|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128151, + "content": "<|reserved_special_token_143|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128152, + "content": "<|reserved_special_token_144|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128153, + "content": "<|reserved_special_token_145|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128154, + "content": "<|reserved_special_token_146|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128155, + "content": "<|reserved_special_token_147|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128156, + "content": "<|reserved_special_token_148|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128157, + "content": "<|reserved_special_token_149|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128158, + "content": "<|reserved_special_token_150|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128159, + "content": "<|reserved_special_token_151|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128160, + "content": "<|reserved_special_token_152|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128161, + "content": "<|reserved_special_token_153|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128162, + "content": "<|reserved_special_token_154|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128163, + "content": "<|reserved_special_token_155|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128164, + "content": "<|reserved_special_token_156|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128165, + "content": "<|reserved_special_token_157|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128166, + "content": "<|reserved_special_token_158|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128167, + "content": "<|reserved_special_token_159|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128168, + "content": "<|reserved_special_token_160|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128169, + "content": "<|reserved_special_token_161|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128170, + "content": "<|reserved_special_token_162|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128171, + "content": "<|reserved_special_token_163|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128172, + "content": "<|reserved_special_token_164|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128173, + "content": "<|reserved_special_token_165|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128174, + "content": "<|reserved_special_token_166|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128175, + "content": "<|reserved_special_token_167|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128176, + "content": "<|reserved_special_token_168|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128177, + "content": "<|reserved_special_token_169|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128178, + "content": "<|reserved_special_token_170|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128179, + "content": "<|reserved_special_token_171|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128180, + "content": "<|reserved_special_token_172|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128181, + "content": "<|reserved_special_token_173|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128182, + "content": "<|reserved_special_token_174|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128183, + "content": "<|reserved_special_token_175|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128184, + "content": "<|reserved_special_token_176|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128185, + "content": "<|reserved_special_token_177|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128186, + "content": "<|reserved_special_token_178|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128187, + "content": "<|reserved_special_token_179|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128188, + "content": "<|reserved_special_token_180|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128189, + "content": "<|reserved_special_token_181|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128190, + "content": "<|reserved_special_token_182|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128191, + "content": "<|reserved_special_token_183|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128192, + "content": "<|reserved_special_token_184|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128193, + "content": "<|reserved_special_token_185|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128194, + "content": "<|reserved_special_token_186|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128195, + "content": "<|reserved_special_token_187|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128196, + "content": "<|reserved_special_token_188|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128197, + "content": "<|reserved_special_token_189|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128198, + "content": "<|reserved_special_token_190|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128199, + "content": "<|reserved_special_token_191|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128200, + "content": "<|reserved_special_token_192|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128201, + "content": "<|reserved_special_token_193|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128202, + "content": "<|reserved_special_token_194|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128203, + "content": "<|reserved_special_token_195|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128204, + "content": "<|reserved_special_token_196|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128205, + "content": "<|reserved_special_token_197|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128206, + "content": "<|reserved_special_token_198|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128207, + "content": "<|reserved_special_token_199|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128208, + "content": "<|reserved_special_token_200|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128209, + "content": "<|reserved_special_token_201|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128210, + "content": "<|reserved_special_token_202|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128211, + "content": "<|reserved_special_token_203|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128212, + "content": "<|reserved_special_token_204|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128213, + "content": "<|reserved_special_token_205|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128214, + "content": "<|reserved_special_token_206|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128215, + "content": "<|reserved_special_token_207|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128216, + "content": "<|reserved_special_token_208|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128217, + "content": "<|reserved_special_token_209|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128218, + "content": "<|reserved_special_token_210|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128219, + "content": "<|reserved_special_token_211|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128220, + "content": "<|reserved_special_token_212|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128221, + "content": "<|reserved_special_token_213|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128222, + "content": "<|reserved_special_token_214|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128223, + "content": "<|reserved_special_token_215|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128224, + "content": "<|reserved_special_token_216|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128225, + "content": "<|reserved_special_token_217|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128226, + "content": "<|reserved_special_token_218|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128227, + "content": "<|reserved_special_token_219|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128228, + "content": "<|reserved_special_token_220|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128229, + "content": "<|reserved_special_token_221|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128230, + "content": "<|reserved_special_token_222|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128231, + "content": "<|reserved_special_token_223|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128232, + "content": "<|reserved_special_token_224|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128233, + "content": "<|reserved_special_token_225|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128234, + "content": "<|reserved_special_token_226|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128235, + "content": "<|reserved_special_token_227|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128236, + "content": "<|reserved_special_token_228|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128237, + "content": "<|reserved_special_token_229|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128238, + "content": "<|reserved_special_token_230|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128239, + "content": "<|reserved_special_token_231|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128240, + "content": "<|reserved_special_token_232|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128241, + "content": "<|reserved_special_token_233|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128242, + "content": "<|reserved_special_token_234|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128243, + "content": "<|reserved_special_token_235|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128244, + "content": "<|reserved_special_token_236|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128245, + "content": "<|reserved_special_token_237|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128246, + "content": "<|reserved_special_token_238|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128247, + "content": "<|reserved_special_token_239|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128248, + "content": "<|reserved_special_token_240|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128249, + "content": "<|reserved_special_token_241|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128250, + "content": "<|reserved_special_token_242|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128251, + "content": "<|reserved_special_token_243|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128252, + "content": "<|reserved_special_token_244|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128253, + "content": "<|reserved_special_token_245|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128254, + "content": "<|reserved_special_token_246|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + }, + { + "id": 128255, + "content": "<|reserved_special_token_247|>", + "single_word": false, + "lstrip": false, + "rstrip": false, + "normalized": false, + "special": true + } + ], + "normalizer": null, + "pre_tokenizer": { + "type": "Sequence", + "pretokenizers": [ + { + "type": "Split", + "pattern": { + "Regex": "(?i:'s|'t|'re|'ve|'m|'ll|'d)|[^\\r\\n\\p{L}\\p{N}]?\\p{L}+|\\p{N}{1,3}| ?[^\\s\\p{L}\\p{N}]+[\\r\\n]*|\\s*[\\r\\n]+|\\s+(?!\\S)|\\s+" + }, + "behavior": "Isolated", + "invert": false + }, + { + "type": "ByteLevel", + "add_prefix_space": false, + "trim_offsets": true, + "use_regex": false + } + ] + }, + "post_processor": { + "type": "Sequence", + "processors": [ + { + "type": "ByteLevel", + "add_prefix_space": true, + "trim_offsets": false, + "use_regex": true + }, + { + "type": "TemplateProcessing", + "single": [ + { + "SpecialToken": { + "id": "<|begin_of_text|>", + "type_id": 0 + } + }, + { + "Sequence": { + "id": "A", + "type_id": 0 + } + } + ], + "pair": [ + { + "SpecialToken": { + "id": "<|begin_of_text|>", + "type_id": 0 + } + }, + { + "Sequence": { + "id": "A", + "type_id": 0 + } + }, + { + "SpecialToken": { + "id": "<|begin_of_text|>", + "type_id": 1 + } + }, + { + "Sequence": { + "id": "B", + "type_id": 1 + } + } + ], + "special_tokens": { + "<|begin_of_text|>": { + "id": "<|begin_of_text|>", + "ids": [ + 128000 + ], + "tokens": [ + "<|begin_of_text|>" + ] + } + } + } + ] + }, + "decoder": { + "type": "ByteLevel", + "add_prefix_space": true, + "trim_offsets": true, + "use_regex": true + }, + "model": { + "type": "BPE", + "dropout": null, + "unk_token": null, + "continuing_subword_prefix": null, + "end_of_word_suffix": null, + "fuse_unk": false, + "byte_fallback": false, + "ignore_merges": true, + "vocab": { + "!": 0, + "\"": 1, + "#": 2, + "$": 3, + "%": 4, + "&": 5, + "'": 6, + "(": 7, + ")": 8, + "*": 9, + "+": 10, + ",": 11, + "-": 12, + ".": 13, + "/": 14, + "0": 15, + "1": 16, + "2": 17, + "3": 18, + "4": 19, + "5": 20, + "6": 21, + "7": 22, + "8": 23, + "9": 24, + ":": 25, + ";": 26, + "<": 27, + "=": 28, + ">": 29, + "?": 30, + "@": 31, + "A": 32, + "B": 33, + "C": 34, + "D": 35, + "E": 36, + "F": 37, + "G": 38, + "H": 39, + "I": 40, + "J": 41, + "K": 42, + "L": 43, + "M": 44, + "N": 45, + "O": 46, + "P": 47, + "Q": 48, + "R": 49, + "S": 50, + "T": 51, + "U": 52, + "V": 53, + "W": 54, + "X": 55, + "Y": 56, + "Z": 57, + "[": 58, + "\\": 59, + "]": 60, + "^": 61, + "_": 62, + "`": 63, + "a": 64, + "b": 65, + "c": 66, + "d": 67, + "e": 68, + "f": 69, + "g": 70, + "h": 71, + "i": 72, + "j": 73, + "k": 74, + "l": 75, + "m": 76, + "n": 77, + "o": 78, + "p": 79, + "q": 80, + "r": 81, + "s": 82, + "t": 83, + "u": 84, + "v": 85, + "w": 86, + "x": 87, + "y": 88, + "z": 89, + "{": 90, + "|": 91, + "}": 92, + "~": 93, + "¡": 94, + "¢": 95, + "£": 96, + "¤": 97, + "¥": 98, + "¦": 99, + "§": 100, + "¨": 101, + "©": 102, + "ª": 103, + "«": 104, + "¬": 105, + "®": 106, + "¯": 107, + "°": 108, + "±": 109, + "²": 110, + "³": 111, + "´": 112, + "µ": 113, + "¶": 114, + "·": 115, + "¸": 116, + "¹": 117, + "º": 118, + "»": 119, + "¼": 120, + "½": 121, + "¾": 122, + "¿": 123, + "À": 124, + "Á": 125, + "Â": 126, + "Ã": 127, + "Ä": 128, + "Å": 129, + "Æ": 130, + "Ç": 131, + "È": 132, + "É": 133, + "Ê": 134, + "Ë": 135, + "Ì": 136, + "Í": 137, + "Î": 138, + "Ï": 139, + "Ð": 140, + "Ñ": 141, + "Ò": 142, + "Ó": 143, + "Ô": 144, + "Õ": 145, + "Ö": 146, + "×": 147, + "Ø": 148, + "Ù": 149, + "Ú": 150, + "Û": 151, + "Ü": 152, + "Ý": 153, + "Þ": 154, + "ß": 155, + "à": 156, + "á": 157, + "â": 158, + "ã": 159, + "ä": 160, + "å": 161, + "æ": 162, + "ç": 163, + "è": 164, + "é": 165, + "ê": 166, + "ë": 167, + "ì": 168, + "í": 169, + "î": 170, + "ï": 171, + "ð": 172, + "ñ": 173, + "ò": 174, + "ó": 175, + "ô": 176, + "õ": 177, + "ö": 178, + "÷": 179, + "ø": 180, + "ù": 181, + "ú": 182, + "û": 183, + "ü": 184, + "ý": 185, + "þ": 186, + "ÿ": 187, + "Ā": 188, + "ā": 189, + "Ă": 190, + "ă": 191, + "Ą": 192, + "ą": 193, + "Ć": 194, + "ć": 195, + "Ĉ": 196, + "ĉ": 197, + "Ċ": 198, + "ċ": 199, + "Č": 200, + "č": 201, + "Ď": 202, + "ď": 203, + "Đ": 204, + "đ": 205, + "Ē": 206, + "ē": 207, + "Ĕ": 208, + "ĕ": 209, + "Ė": 210, + "ė": 211, + "Ę": 212, + "ę": 213, + "Ě": 214, + "ě": 215, + "Ĝ": 216, + "ĝ": 217, + "Ğ": 218, + "ğ": 219, + "Ġ": 220, + "ġ": 221, + "Ģ": 222, + "ģ": 223, + "Ĥ": 224, + "ĥ": 225, + "Ħ": 226, + "ħ": 227, + "Ĩ": 228, + "ĩ": 229, + "Ī": 230, + "ī": 231, + "Ĭ": 232, + "ĭ": 233, + "Į": 234, + "į": 235, + "İ": 236, + "ı": 237, + "IJ": 238, + "ij": 239, + "Ĵ": 240, + "ĵ": 241, + "Ķ": 242, + "ķ": 243, + "ĸ": 244, + "Ĺ": 245, + "ĺ": 246, + "Ļ": 247, + "ļ": 248, + "Ľ": 249, + "ľ": 250, + "Ŀ": 251, + "ŀ": 252, + "Ł": 253, + "ł": 254, + "Ń": 255, + "ĠĠ": 256, + "ĠĠĠĠ": 257, + "in": 258, + "Ġt": 259, + "ĠĠĠĠĠĠĠĠ": 260, + "er": 261, + "ĠĠĠ": 262, + "on": 263, + "Ġa": 264, + "re": 265, + "at": 266, + "st": 267, + "en": 268, + "or": 269, + "Ġth": 270, + "ĊĊ": 271, + "Ġc": 272, + "le": 273, + "Ġs": 274, + "it": 275, + "an": 276, + "ar": 277, + "al": 278, + "Ġthe": 279, + ";Ċ": 280, + "Ġp": 281, + "Ġf": 282, + "ou": 283, + "Ġ=": 284, + "is": 285, + "ĠĠĠĠĠĠĠ": 286, + "ing": 287, + "es": 288, + "Ġw": 289, + "ion": 290, + "ed": 291, + "ic": 292, + "Ġb": 293, + "Ġd": 294, + "et": 295, + "Ġm": 296, + "Ġo": 297, + "ĉĉ": 298, + "ro": 299, + "as": 300, + "el": 301, + "ct": 302, + "nd": 303, + "Ġin": 304, + "Ġh": 305, + "ent": 306, + "id": 307, + "Ġn": 308, + "am": 309, + "ĠĠĠĠĠĠĠĠĠĠĠ": 310, + "Ġto": 311, + "Ġre": 312, + "--": 313, + "Ġ{": 314, + "Ġof": 315, + "om": 316, + ");Ċ": 317, + "im": 318, + "čĊ": 319, + "Ġ(": 320, + "il": 321, + "//": 322, + "Ġand": 323, + "ur": 324, + "se": 325, + "Ġl": 326, + "ex": 327, + "ĠS": 328, + "ad": 329, + "Ġ\"": 330, + "ch": 331, + "ut": 332, + "if": 333, + "**": 334, + "Ġ}": 335, + "em": 336, + "ol": 337, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 338, + "th": 339, + ")Ċ": 340, + "Ġ{Ċ": 341, + "Ġg": 342, + "ig": 343, + "iv": 344, + ",Ċ": 345, + "ce": 346, + "od": 347, + "Ġv": 348, + "ate": 349, + "ĠT": 350, + "ag": 351, + "ay": 352, + "Ġ*": 353, + "ot": 354, + "us": 355, + "ĠC": 356, + "Ġst": 357, + "ĠI": 358, + "un": 359, + "ul": 360, + "ue": 361, + "ĠA": 362, + "ow": 363, + "Ġ'": 364, + "ew": 365, + "Ġ<": 366, + "ation": 367, + "()": 368, + "Ġfor": 369, + "ab": 370, + "ort": 371, + "um": 372, + "ame": 373, + "Ġis": 374, + "pe": 375, + "tr": 376, + "ck": 377, + "âĢ": 378, + "Ġy": 379, + "ist": 380, + "----": 381, + ".ĊĊ": 382, + "he": 383, + "Ġe": 384, + "lo": 385, + "ĠM": 386, + "Ġbe": 387, + "ers": 388, + "Ġon": 389, + "Ġcon": 390, + "ap": 391, + "ub": 392, + "ĠP": 393, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 394, + "ass": 395, + "int": 396, + ">Ċ": 397, + "ly": 398, + "urn": 399, + "Ġ$": 400, + ";ĊĊ": 401, + "av": 402, + "port": 403, + "ir": 404, + "->": 405, + "nt": 406, + "ction": 407, + "end": 408, + "Ġde": 409, + "00": 410, + "ith": 411, + "out": 412, + "turn": 413, + "our": 414, + "ĠĠĠĠĠ": 415, + "lic": 416, + "res": 417, + "pt": 418, + "==": 419, + "Ġthis": 420, + "Ġwh": 421, + "Ġif": 422, + "ĠD": 423, + "ver": 424, + "age": 425, + "ĠB": 426, + "ht": 427, + "ext": 428, + "=\"": 429, + "Ġthat": 430, + "****": 431, + "ĠR": 432, + "Ġit": 433, + "ess": 434, + "ĠF": 435, + "Ġr": 436, + "os": 437, + "and": 438, + "Ġas": 439, + "ect": 440, + "ke": 441, + "rom": 442, + "Ġ//": 443, + "con": 444, + "ĠL": 445, + "(\"": 446, + "qu": 447, + "lass": 448, + "Ġwith": 449, + "iz": 450, + "de": 451, + "ĠN": 452, + "Ġal": 453, + "op": 454, + "up": 455, + "get": 456, + "Ġ}Ċ": 457, + "ile": 458, + "Ġan": 459, + "ata": 460, + "ore": 461, + "ri": 462, + "Ġpro": 463, + ";čĊ": 464, + "ĉĉĉĉ": 465, + "ter": 466, + "ain": 467, + "ĠW": 468, + "ĠE": 469, + "Ġcom": 470, + "Ġreturn": 471, + "art": 472, + "ĠH": 473, + "ack": 474, + "import": 475, + "ublic": 476, + "Ġor": 477, + "est": 478, + "ment": 479, + "ĠG": 480, + "able": 481, + "Ġ-": 482, + "ine": 483, + "ill": 484, + "ind": 485, + "ere": 486, + "::": 487, + "ity": 488, + "Ġ+": 489, + "Ġtr": 490, + "elf": 491, + "ight": 492, + "('": 493, + "orm": 494, + "ult": 495, + "str": 496, + "..": 497, + "\",": 498, + "Ġyou": 499, + "ype": 500, + "pl": 501, + "Ġnew": 502, + "Ġj": 503, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 504, + "Ġfrom": 505, + "Ġex": 506, + "ĠO": 507, + "20": 508, + "ld": 509, + "Ġ[": 510, + "oc": 511, + ":Ċ": 512, + "Ġse": 513, + "Ġle": 514, + "--------": 515, + ".s": 516, + "{Ċ": 517, + "',": 518, + "ant": 519, + "Ġat": 520, + "ase": 521, + ".c": 522, + "Ġch": 523, + "": 524, + "ave": 525, + "ang": 526, + "Ġare": 527, + "Ġint": 528, + "âĢĻ": 529, + "_t": 530, + "ert": 531, + "ial": 532, + "act": 533, + "}Ċ": 534, + "ive": 535, + "ode": 536, + "ost": 537, + "Ġclass": 538, + "Ġnot": 539, + "og": 540, + "ord": 541, + "alue": 542, + "all": 543, + "ff": 544, + "();Ċ": 545, + "ont": 546, + "ime": 547, + "are": 548, + "ĠU": 549, + "Ġpr": 550, + "Ġ:": 551, + "ies": 552, + "ize": 553, + "ure": 554, + "Ġby": 555, + "ire": 556, + "Ġ}ĊĊ": 557, + ".p": 558, + "Ġsh": 559, + "ice": 560, + "ast": 561, + "ption": 562, + "tring": 563, + "ok": 564, + "__": 565, + "cl": 566, + "##": 567, + "Ġhe": 568, + "ard": 569, + ").": 570, + "Ġ@": 571, + "iew": 572, + "ĉĉĉ": 573, + "Ġwas": 574, + "ip": 575, + "this": 576, + "Ġu": 577, + "ĠThe": 578, + "ide": 579, + "ace": 580, + "ib": 581, + "ac": 582, + "rou": 583, + "Ġwe": 584, + "ject": 585, + "Ġpublic": 586, + "ak": 587, + "ve": 588, + "ath": 589, + "oid": 590, + "Ġ=>": 591, + "ust": 592, + "que": 593, + "Ġres": 594, + "))": 595, + "'s": 596, + "Ġk": 597, + "ans": 598, + "yst": 599, + "unction": 600, + "********": 601, + "Ġi": 602, + "Ġus": 603, + "pp": 604, + "10": 605, + "one": 606, + "ail": 607, + "====": 608, + "name": 609, + "Ġstr": 610, + "Ġ/": 611, + "Ġ&": 612, + "ach": 613, + "div": 614, + "ystem": 615, + "ell": 616, + "Ġhave": 617, + "err": 618, + "ould": 619, + "ull": 620, + "pon": 621, + "ĠJ": 622, + "_p": 623, + "Ġ==": 624, + "ign": 625, + "St": 626, + ".Ċ": 627, + "Ġpl": 628, + ");ĊĊ": 629, + "form": 630, + "put": 631, + "ount": 632, + "}ĊĊ": 633, + "dd": 634, + "ite": 635, + "Ġget": 636, + "rr": 637, + "ome": 638, + "ĠâĢ": 639, + "aram": 640, + "cc": 641, + "Ġ*/": 642, + "ER": 643, + "In": 644, + "les": 645, + "_s": 646, + "ong": 647, + "ie": 648, + "Ġcan": 649, + "ĠV": 650, + "erv": 651, + "pr": 652, + "Ġun": 653, + "row": 654, + "ber": 655, + "Ġdo": 656, + "ll": 657, + "Ġel": 658, + "Ġself": 659, + "ated": 660, + "ary": 661, + "Ġ.": 662, + "']": 663, + "ud": 664, + "Ġen": 665, + "ĠTh": 666, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 667, + "te": 668, + "_c": 669, + "uct": 670, + "Ġab": 671, + "ork": 672, + ".get": 673, + "Ġ#": 674, + "aw": 675, + "ress": 676, + "ob": 677, + "Name": 678, + "201": 679, + "app": 680, + "['": 681, + "Ġall": 682, + "ory": 683, + "ition": 684, + "ance": 685, + "ear": 686, + "Ġcont": 687, + "vent": 688, + "ia": 689, + "Ġwill": 690, + "IN": 691, + "ĠĠĠĠĠĠĠĠĠ": 692, + "return": 693, + "Ġ": 694, + "data": 695, + ")ĊĊ": 696, + "Re": 697, + "ple": 698, + "ild": 699, + "ther": 700, + "Ġyour": 701, + "\"Ċ": 702, + "($": 703, + "Ġout": 704, + "),": 705, + "Ġhas": 706, + "String": 707, + "so": 708, + "Ġup": 709, + "ax": 710, + "Ġdef": 711, + "Ġbo": 712, + "ge": 713, + "alse": 714, + "ON": 715, + "per": 716, + "12": 717, + "ich": 718, + "Ġbut": 719, + "ĠĊ": 720, + "Ġ_": 721, + "_m": 722, + "add": 723, + "quest": 724, + "odel": 725, + "self": 726, + "ery": 727, + "ft": 728, + "ens": 729, + "////": 730, + "ake": 731, + ".C": 732, + "Ġgo": 733, + "Ġfunction": 734, + "ĠK": 735, + "ivate": 736, + "Ġim": 737, + "Ġconst": 738, + ".t": 739, + "Ġ*/Ċ": 740, + ");čĊ": 741, + "Ġvoid": 742, + "Ġset": 743, + "ĠSystem": 744, + "cri": 745, + "()Ċ": 746, + "li": 747, + "ĉif": 748, + ".m": 749, + "ally": 750, + "set": 751, + "ep": 752, + "âĢĻs": 753, + "bo": 754, + "def": 755, + "',Ċ": 756, + "Ġme": 757, + "Ġ!": 758, + "atch": 759, + "\">": 760, + "\",Ċ": 761, + "ec": 762, + "ĠIn": 763, + "ph": 764, + "Ġ|": 765, + "_f": 766, + "Ġvar": 767, + "ence": 768, + "Id": 769, + "ree": 770, + "ink": 771, + "lect": 772, + "ug": 773, + "eth": 774, + "Ġelse": 775, + "----------------": 776, + "19": 777, + "cont": 778, + "Ġso": 779, + "atic": 780, + "Ġlo": 781, + "pro": 782, + "ton": 783, + "ss": 784, + "own": 785, + "abel": 786, + "oint": 787, + "ous": 788, + "eld": 789, + "ST": 790, + "The": 791, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 792, + "RE": 793, + "\":": 794, + "olor": 795, + "tp": 796, + "eg": 797, + "key": 798, + "ude": 799, + "ĠSt": 800, + "ound": 801, + "Ġar": 802, + "\");Ċ": 803, + "ener": 804, + "ser": 805, + "11": 806, + "bject": 807, + "essage": 808, + "fer": 809, + "Ġmore": 810, + "ations": 811, + "ents": 812, + "Ġhis": 813, + "Ġthey": 814, + ".S": 815, + "ĠY": 816, + "use": 817, + "ne": 818, + "ish": 819, + "old": 820, + "_d": 821, + "io": 822, + "ield": 823, + "Ġper": 824, + "Cont": 825, + "ings": 826, + "####": 827, + "Ġdata": 828, + "Ġsa": 829, + "ef": 830, + "fo": 831, + "Ġone": 832, + "eng": 833, + "Ġdis": 834, + "AT": 835, + "Ġname": 836, + "Ġtrue": 837, + "val": 838, + "led": 839, + ".f": 840, + "Ġne": 841, + "Ġend": 842, + "32": 843, + ".T": 844, + "16": 845, + "cre": 846, + "ark": 847, + "log": 848, + "Ex": 849, + "error": 850, + "_id": 851, + "urre": 852, + "ange": 853, + "Ġnull": 854, + "rray": 855, + "Ġmy": 856, + "pan": 857, + "ict": 858, + "ator": 859, + "View": 860, + "List": 861, + "ĉreturn": 862, + "âĢĿ": 863, + "Ġpre": 864, + "Ġx": 865, + "clude": 866, + "arg": 867, + "15": 868, + "ov": 869, + ".h": 870, + "Ġ>": 871, + "Ġtheir": 872, + "')": 873, + "irst": 874, + "ick": 875, + "gh": 876, + "LE": 877, + "OR": 878, + "Ġprivate": 879, + "tem": 880, + "čĊčĊ": 881, + "user": 882, + "Ġ)": 883, + "com": 884, + ".A": 885, + "\";Ċ": 886, + "Ġid": 887, + "read": 888, + "Ġwho": 889, + "_b": 890, + "\">Ċ": 891, + "Ġtime": 892, + "Ġman": 893, + "ry": 894, + "========": 895, + "roup": 896, + "rop": 897, + "public": 898, + "vel": 899, + "umber": 900, + "ble": 901, + "Ġwhich": 902, + "****************": 903, + "Ġany": 904, + "Ġfalse": 905, + "we": 906, + "Ġvalue": 907, + "Ġli": 908, + "\")": 909, + "nder": 910, + "gr": 911, + "Ġno": 912, + "param": 913, + "25": 914, + "fig": 915, + ".com": 916, + "Ġapp": 917, + "_l": 918, + "ions": 919, + ".D": 920, + "ĠCh": 921, + "Ġabout": 922, + "Ġadd": 923, + "Ġsu": 924, + "Ġstring": 925, + "ID": 926, + "Ġover": 927, + "string": 928, + ".l": 929, + "ource": 930, + "000": 931, + "_C": 932, + "]Ċ": 933, + "Ġqu": 934, + "ĠString": 935, + "ca": 936, + "SE": 937, + "Ġro": 938, + "sh": 939, + "ual": 940, + "Type": 941, + "son": 942, + "new": 943, + "ern": 944, + "Ġag": 945, + "AR": 946, + "];Ċ": 947, + "].": 948, + "Ġ?": 949, + "ical": 950, + "Ġdes": 951, + "uth": 952, + "ix": 953, + "ays": 954, + "Ġtype": 955, + "'t": 956, + "ault": 957, + "Ġinter": 958, + "var": 959, + ".b": 960, + "Ġpart": 961, + ".d": 962, + "urrent": 963, + "IT": 964, + "EN": 965, + "30": 966, + "enc": 967, + "(f": 968, + "ra": 969, + "value": 970, + "cho": 971, + "18": 972, + "utton": 973, + "ose": 974, + "14": 975, + "Ġ!=": 976, + "ater": 977, + "é": 978, + "reate": 979, + "oll": 980, + "pos": 981, + "yle": 982, + "ng": 983, + "AL": 984, + "using": 985, + "ames": 986, + "Ġ{čĊ": 987, + "ates": 988, + "ely": 989, + "Ġwork": 990, + "Ġem": 991, + "inal": 992, + "Ġsp": 993, + "Ġwhen": 994, + ".set": 995, + "ĠĠĠĠĠĠ": 996, + "):Ċ": 997, + "to": 998, + "quire": 999, + "indow": 1000, + "lement": 1001, + "pect": 1002, + "ash": 1003, + "[i": 1004, + "Ġuse": 1005, + ".F": 1006, + "pec": 1007, + "Ġad": 1008, + "ove": 1009, + "ception": 1010, + "ength": 1011, + "include": 1012, + "ader": 1013, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 1014, + "atus": 1015, + "Th": 1016, + "itle": 1017, + "rit": 1018, + "void": 1019, + "().": 1020, + "(Ċ": 1021, + "Ġoff": 1022, + "Ġother": 1023, + "Ġ&&": 1024, + "';Ċ": 1025, + "ms": 1026, + "Ġbeen": 1027, + "Ġte": 1028, + "ml": 1029, + "co": 1030, + "nc": 1031, + "13": 1032, + "ervice": 1033, + "Ġ%": 1034, + "**Ċ": 1035, + "ann": 1036, + "ade": 1037, + "ĊĊĊĊ": 1038, + "lock": 1039, + "const": 1040, + "100": 1041, + "ponse": 1042, + "Ġsup": 1043, + "++": 1044, + "date": 1045, + "Ġacc": 1046, + "Ġhad": 1047, + "Ġbu": 1048, + "200": 1049, + "ĠRe": 1050, + "Ġwere": 1051, + "Ġfile": 1052, + "Ġwould": 1053, + "ĠâĢľ": 1054, + "ven": 1055, + "iss": 1056, + "Ġour": 1057, + "class": 1058, + "raw": 1059, + "Ġyear": 1060, + "Data": 1061, + "Ġval": 1062, + "Ġsome": 1063, + "fter": 1064, + "ys": 1065, + "Ġ///": 1066, + "round": 1067, + "view": 1068, + "Ġpe": 1069, + "Ġthere": 1070, + "Ġsaid": 1071, + "du": 1072, + "of": 1073, + "line": 1074, + "/*": 1075, + "duct": 1076, + "Ġher": 1077, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠ": 1078, + "Res": 1079, + "Ġco": 1080, + "Ġcomm": 1081, + "ise": 1082, + "min": 1083, + "ĠĠĠĠĊ": 1084, + "#include": 1085, + "ethod": 1086, + ".P": 1087, + "ute": 1088, + "Ġass": 1089, + "Int": 1090, + "ask": 1091, + "loc": 1092, + "Ġlike": 1093, + "ody": 1094, + "Ġlet": 1095, + "load": 1096, + "Ġam": 1097, + "rol": 1098, + "Ġgr": 1099, + "yp": 1100, + "Ġalso": 1101, + "ĠIt": 1102, + "url": 1103, + "ific": 1104, + "ors": 1105, + "_P": 1106, + "_n": 1107, + "igh": 1108, + "Ġthan": 1109, + "Com": 1110, + "AN": 1111, + "UL": 1112, + "ating": 1113, + "17": 1114, + "ĠThis": 1115, + "ref": 1116, + "_S": 1117, + "Ġstatic": 1118, + "roll": 1119, + "Ġjust": 1120, + "Ġresult": 1121, + "ian": 1122, + "idth": 1123, + "Ġthem": 1124, + "));Ċ": 1125, + "der": 1126, + "reak": 1127, + "Con": 1128, + "://": 1129, + "ule": 1130, + "...": 1131, + "arch": 1132, + "ement": 1133, + "Ġ<<": 1134, + "50": 1135, + "ush": 1136, + "ense": 1137, + "arr": 1138, + "Ġinto": 1139, + "cess": 1140, + "amp": 1141, + "ied": 1142, + "ument": 1143, + "Ġ\\": 1144, + "],": 1145, + "wo": 1146, + "als": 1147, + "Ġwhat": 1148, + "anc": 1149, + "Value": 1150, + "='": 1151, + "olum": 1152, + "Ġpos": 1153, + "ages": 1154, + "ayer": 1155, + "Ġsc": 1156, + "ues": 1157, + "\")Ċ": 1158, + "_T": 1159, + "Ġlist": 1160, + "(s": 1161, + "Ġcase": 1162, + "Ch": 1163, + "ĉĉĉĉĉ": 1164, + "////////": 1165, + "ponent": 1166, + "Ġz": 1167, + "Ġkn": 1168, + "let": 1169, + "DE": 1170, + "red": 1171, + "Ġfe": 1172, + "Ġ},Ċ": 1173, + "Ġ,": 1174, + "(t": 1175, + "Ġfirst": 1176, + "');Ċ": 1177, + "word": 1178, + "Ġimport": 1179, + "Ġact": 1180, + "Ġchar": 1181, + "CT": 1182, + "ĠTr": 1183, + "ople": 1184, + "={": 1185, + "ĉf": 1186, + "24": 1187, + "ient": 1188, + "cent": 1189, + ".j": 1190, + "lection": 1191, + "))Ċ": 1192, + "Ġonly": 1193, + "Ġprint": 1194, + "mer": 1195, + ".W": 1196, + "ock": 1197, + "Ġ--": 1198, + "Text": 1199, + "Ġop": 1200, + "ank": 1201, + "Ġits": 1202, + "Ġback": 1203, + "[\"": 1204, + "Ġneed": 1205, + "Ġcl": 1206, + "Ġsub": 1207, + "Ġla": 1208, + "((": 1209, + ".\"": 1210, + "Object": 1211, + "Ġstart": 1212, + "file": 1213, + "(self": 1214, + "ner": 1215, + "ey": 1216, + "Ġuser": 1217, + "Ġent": 1218, + "ĠCom": 1219, + "its": 1220, + "ĠCon": 1221, + "ouble": 1222, + "ower": 1223, + "item": 1224, + "very": 1225, + "ĠWe": 1226, + "64": 1227, + "lick": 1228, + "ĠQ": 1229, + "php": 1230, + "ttp": 1231, + "':": 1232, + "ics": 1233, + "Ġunder": 1234, + "Ġ*Ċ": 1235, + ".L": 1236, + ");": 1237, + "ices": 1238, + "Ġreg": 1239, + ")čĊ": 1240, + "ĉpublic": 1241, + "SS": 1242, + "Ġthen": 1243, + "reat": 1244, + "ious": 1245, + ".G": 1246, + "ek": 1247, + "irect": 1248, + "heck": 1249, + "cript": 1250, + "ning": 1251, + "ĠUn": 1252, + "Ġmay": 1253, + "ĠWh": 1254, + "Bo": 1255, + "Item": 1256, + "struct": 1257, + ".st": 1258, + "ream": 1259, + "ible": 1260, + "loat": 1261, + "Ġorg": 1262, + "und": 1263, + "sum": 1264, + "_in": 1265, + "../": 1266, + "_M": 1267, + "Ġhow": 1268, + "rite": 1269, + "'Ċ": 1270, + "To": 1271, + "40": 1272, + "ww": 1273, + "Ġpeople": 1274, + "index": 1275, + ".n": 1276, + "http": 1277, + "(m": 1278, + "ector": 1279, + "Ġind": 1280, + "Ġjav": 1281, + "],Ċ": 1282, + "ĠHe": 1283, + "_st": 1284, + "ful": 1285, + "ole": 1286, + "){Ċ": 1287, + "Ġshould": 1288, + "opy": 1289, + "elp": 1290, + "ier": 1291, + "_name": 1292, + "erson": 1293, + "ION": 1294, + "ote": 1295, + "Ġtest": 1296, + "Ġbet": 1297, + "rror": 1298, + "ular": 1299, + "ãĢ": 1300, + "ĠÐ": 1301, + "bs": 1302, + "ting": 1303, + "Ġmake": 1304, + "Tr": 1305, + "Ġafter": 1306, + "arget": 1307, + "RO": 1308, + "olumn": 1309, + "rc": 1310, + "_re": 1311, + "define": 1312, + "22": 1313, + "Ġright": 1314, + "right": 1315, + "day": 1316, + "Ġlong": 1317, + "[]": 1318, + "(p": 1319, + "td": 1320, + "cond": 1321, + "ĠPro": 1322, + "Ġrem": 1323, + "ptions": 1324, + "vid": 1325, + ".g": 1326, + "Ġext": 1327, + "Ġ__": 1328, + "')Ċ": 1329, + "pace": 1330, + "mp": 1331, + "Ġmin": 1332, + "stance": 1333, + "air": 1334, + "action": 1335, + "wh": 1336, + "type": 1337, + "util": 1338, + "ait": 1339, + "": 1340, + "IC": 1341, + "text": 1342, + "Ġph": 1343, + "Ġfl": 1344, + ".M": 1345, + "ccess": 1346, + "br": 1347, + "fore": 1348, + "ersion": 1349, + "),Ċ": 1350, + ".re": 1351, + "ateg": 1352, + "Ġloc": 1353, + "ins": 1354, + "-s": 1355, + "trib": 1356, + "ĠInt": 1357, + "Ġarray": 1358, + ",\"": 1359, + "Pro": 1360, + "(c": 1361, + "ession": 1362, + ">ĊĊ": 1363, + "Ġshe": 1364, + "\"]": 1365, + "aph": 1366, + "Ġexp": 1367, + "erty": 1368, + "ĠSe": 1369, + "Ġpar": 1370, + "unc": 1371, + "ET": 1372, + "Ġread": 1373, + "print": 1374, + "Ġrel": 1375, + "Ġform": 1376, + "Ġdr": 1377, + "Exception": 1378, + "input": 1379, + "Ġtrans": 1380, + "########": 1381, + "order": 1382, + "By": 1383, + "Ġaw": 1384, + "ities": 1385, + "uff": 1386, + "play": 1387, + ".add": 1388, + "ĠâĢĵ": 1389, + "Ġwant": 1390, + "Ġcomp": 1391, + "ments": 1392, + "Ġ||": 1393, + "az": 1394, + "be": 1395, + "Ġnumber": 1396, + "Ġrequire": 1397, + "ĠEx": 1398, + "60": 1399, + "Ġcol": 1400, + "Ġkey": 1401, + "ember": 1402, + "Ġtwo": 1403, + "Ġsize": 1404, + "Ġwhere": 1405, + "UT": 1406, + "result": 1407, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 1408, + "ough": 1409, + "orld": 1410, + "ood": 1411, + "uch": 1412, + "ative": 1413, + "ger": 1414, + "arent": 1415, + "Ġ/*": 1416, + "Ġarg": 1417, + "Ġwhile": 1418, + "23": 1419, + "(this": 1420, + "Ġrec": 1421, + "Ġdif": 1422, + "State": 1423, + "Ġspec": 1424, + "ride": 1425, + "_F": 1426, + "Ġlook": 1427, + "AM": 1428, + "ility": 1429, + "eter": 1430, + "âĢĻt": 1431, + "ĊĊĊ": 1432, + "ayout": 1433, + "--------------------------------": 1434, + "ager": 1435, + "Ġcould": 1436, + "Ġbr": 1437, + "ends": 1438, + "ures": 1439, + "Ġknow": 1440, + "ets": 1441, + "ĠIf": 1442, + "ĠSh": 1443, + ".w": 1444, + "back": 1445, + "Ġser": 1446, + "Ġ+=": 1447, + "Ġfr": 1448, + "());Ċ": 1449, + "Ġhand": 1450, + "Ind": 1451, + "ULL": 1452, + "Im": 1453, + "();ĊĊ": 1454, + "Ġmost": 1455, + "Ġtry": 1456, + "Ġnow": 1457, + "rough": 1458, + ">čĊ": 1459, + "ackage": 1460, + "Ġhim": 1461, + "._": 1462, + "ify": 1463, + "Ġbreak": 1464, + "Ġ);Ċ": 1465, + "ren": 1466, + "#define": 1467, + "itt": 1468, + "Ġap": 1469, + "ĉc": 1470, + "(n": 1471, + "ĠYou": 1472, + ":ĊĊ": 1473, + "-m": 1474, + "Ġevery": 1475, + "ustom": 1476, + "lient": 1477, + "ocument": 1478, + "cription": 1479, + "Error": 1480, + "-b": 1481, + "о": 1482, + "][": 1483, + "99": 1484, + "trans": 1485, + "Ġpoint": 1486, + "Ġstd": 1487, + "Ġfil": 1488, + "Time": 1489, + "80": 1490, + "Ġmod": 1491, + "Ġ->": 1492, + "Ġerror": 1493, + "ah": 1494, + "Ġtext": 1495, + "roller": 1496, + "lose": 1497, + "ql": 1498, + "Ġpol": 1499, + ">": 1500, + "Ġshow": 1501, + "User": 1502, + "ased": 1503, + "Ġ{ĊĊ": 1504, + "Ġfind": 1505, + "а": 1506, + "ED": 1507, + "span": 1508, + "enu": 1509, + "Ġcurrent": 1510, + "Ġused": 1511, + "cept": 1512, + "clud": 1513, + "Ġplay": 1514, + "Ġlog": 1515, + "ution": 1516, + "fl": 1517, + "Ġsee": 1518, + "indows": 1519, + "Ġhelp": 1520, + "Ġthese": 1521, + "Ġpass": 1522, + "Ġdown": 1523, + "Ġeven": 1524, + "ason": 1525, + "uild": 1526, + "from": 1527, + "(d": 1528, + "Ġbl": 1529, + "label": 1530, + "else": 1531, + "е": 1532, + "Ġ(!": 1533, + "ized": 1534, + "(),": 1535, + "Ġob": 1536, + "Ġitem": 1537, + "ump": 1538, + "UR": 1539, + "orn": 1540, + "Ġdon": 1541, + "Se": 1542, + "man": 1543, + "27": 1544, + "ample": 1545, + "tn": 1546, + "================": 1547, + "He": 1548, + "gram": 1549, + "Ġdid": 1550, + "wn": 1551, + "_h": 1552, + "iver": 1553, + "Ġsm": 1554, + "Ġthrough": 1555, + "ĠAn": 1556, + "che": 1557, + "Ġinv": 1558, + "ouse": 1559, + "Ġes": 1560, + "ĠNew": 1561, + "export": 1562, + "mary": 1563, + "uto": 1564, + "ler": 1565, + "Ġlast": 1566, + "Ġevent": 1567, + "try": 1568, + "ï¼": 1569, + "ily": 1570, + "igned": 1571, + "ines": 1572, + "ollow": 1573, + "icense": 1574, + "sole": 1575, + "lear": 1576, + "(int": 1577, + "Ġagain": 1578, + "Ġhigh": 1579, + "html": 1580, + "Index": 1581, + "uthor": 1582, + "Ġ/**Ċ": 1583, + "Ġline": 1584, + "Event": 1585, + "_D": 1586, + "Ġdoes": 1587, + "itial": 1588, + "Ġcr": 1589, + "ars": 1590, + "28": 1591, + "Ġtem": 1592, + "cause": 1593, + "face": 1594, + "Ġ`": 1595, + "_A": 1596, + "Button": 1597, + "ature": 1598, + "ected": 1599, + "ES": 1600, + "ister": 1601, + "ĉĊ": 1602, + "Ġbefore": 1603, + "ale": 1604, + "other": 1605, + "Ġbecause": 1606, + "roid": 1607, + "Ġed": 1608, + "ik": 1609, + "reg": 1610, + "ĠDe": 1611, + "Ġdist": 1612, + "},Ċ": 1613, + "Ġstate": 1614, + "Ġcons": 1615, + "rint": 1616, + "att": 1617, + "Ġhere": 1618, + "ined": 1619, + "Ġfinal": 1620, + "Ġ\"\"": 1621, + "Key": 1622, + "LO": 1623, + "Ġdel": 1624, + "pty": 1625, + "thing": 1626, + "26": 1627, + "ĠAnd": 1628, + "Ġrun": 1629, + "ĠX": 1630, + "ym": 1631, + ".app": 1632, + "Ġvery": 1633, + "ces": 1634, + "_N": 1635, + "ared": 1636, + "ward": 1637, + "list": 1638, + "ited": 1639, + "olog": 1640, + "itch": 1641, + "Box": 1642, + "ife": 1643, + "33": 1644, + "Ġac": 1645, + "Ġmodel": 1646, + "Ġmon": 1647, + "Ġway": 1648, + "lete": 1649, + "Ġcall": 1650, + "Ġatt": 1651, + "Ġcal": 1652, + "vert": 1653, + "Ġdec": 1654, + "lease": 1655, + "oun": 1656, + "Ġ});Ċ": 1657, + "fr": 1658, + "formation": 1659, + "etail": 1660, + "Ġnum": 1661, + "aj": 1662, + "query": 1663, + "Ġwell": 1664, + "Ġobject": 1665, + "ĠAs": 1666, + "Ġyears": 1667, + "Color": 1668, + "IS": 1669, + "Ġdefault": 1670, + "Wh": 1671, + "Ġins": 1672, + "aint": 1673, + "Ġjava": 1674, + "Ġsim": 1675, + "ĠAr": 1676, + "mon": 1677, + "til": 1678, + "();čĊ": 1679, + "):": 1680, + "Set": 1681, + "29": 1682, + "atter": 1683, + "Ġview": 1684, + "Ġpres": 1685, + "array": 1686, + "We": 1687, + "At": 1688, + "Ġbel": 1689, + "Ġmany": 1690, + "21": 1691, + "Man": 1692, + "ender": 1693, + "Ġbeing": 1694, + "Ġgood": 1695, + "ĉĉĉĉĉĉ": 1696, + "ational": 1697, + "ware": 1698, + ".log": 1699, + "{čĊ": 1700, + "Ġusing": 1701, + "_B": 1702, + "Ġ:=": 1703, + "_w": 1704, + "ists": 1705, + "lish": 1706, + "Ġstud": 1707, + "ĠAl": 1708, + "Ġgu": 1709, + "config": 1710, + "uring": 1711, + "time": 1712, + "oken": 1713, + "amespace": 1714, + "Ġrequest": 1715, + "Ġchild": 1716, + "ĠÃ": 1717, + "lob": 1718, + "Ġparam": 1719, + "Ġ}čĊ": 1720, + "01": 1721, + "Ġecho": 1722, + "function": 1723, + "********************************": 1724, + "ps": 1725, + "Element": 1726, + "alk": 1727, + "lication": 1728, + "by": 1729, + "Size": 1730, + "rawing": 1731, + "Ġperson": 1732, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 1733, + "\\n": 1734, + "object": 1735, + "ince": 1736, + "En": 1737, + "File": 1738, + "uf": 1739, + "ffect": 1740, + "AC": 1741, + "Ġstyle": 1742, + "summary": 1743, + "Ġque": 1744, + "_r": 1745, + "Ġ($": 1746, + "Model": 1747, + "ident": 1748, + "Ġmethod": 1749, + "IL": 1750, + "ott": 1751, + "less": 1752, + "ING": 1753, + "Ġ()": 1754, + "Ġexpect": 1755, + "ync": 1756, + "package": 1757, + "35": 1758, + "urs": 1759, + "Ġprot": 1760, + "./": 1761, + "pre": 1762, + "Ġ)Ċ": 1763, + "ma": 1764, + "Ġsur": 1765, + "Ġfound": 1766, + "Info": 1767, + "par": 1768, + "imes": 1769, + ".e": 1770, + "ains": 1771, + "Ġpost": 1772, + "-d": 1773, + "45": 1774, + "olean": 1775, + "Ġsl": 1776, + "PE": 1777, + "Ġsuch": 1778, + "select": 1779, + "ainer": 1780, + "Ġthink": 1781, + "Ġdiffer": 1782, + ".r": 1783, + "/**Ċ": 1784, + "FF": 1785, + "ool": 1786, + "plate": 1787, + "qual": 1788, + "ĠFor": 1789, + "Ġmuch": 1790, + "uc": 1791, + "(new": 1792, + "odule": 1793, + "Ġsom": 1794, + "Ġhttp": 1795, + "ĠList": 1796, + "Ġcount": 1797, + "Ġinst": 1798, + "char": 1799, + "mit": 1800, + ".id": 1801, + "aking": 1802, + "Ġgener": 1803, + "px": 1804, + "vice": 1805, + "37": 1806, + "_data": 1807, + "ĠNULL": 1808, + "}čĊ": 1809, + "idd": 1810, + "ãĢĤ": 1811, + "Ġmed": 1812, + "org": 1813, + "ider": 1814, + "ache": 1815, + "work": 1816, + "Ġcheck": 1817, + "ween": 1818, + "Ġ((": 1819, + "the": 1820, + "ants": 1821, + "><": 1822, + ".B": 1823, + "-c": 1824, + "Ġopen": 1825, + "Ġest": 1826, + "ĠĠĠĠĠĠĠĠĊ": 1827, + "Ġnext": 1828, + "IM": 1829, + "ÑĤ": 1830, + "OT": 1831, + "ó": 1832, + "Ġfollow": 1833, + "content": 1834, + "ĠĠĠĠĠĠĠĠĠĠĠĠ": 1835, + "Ġinclud": 1836, + "HE": 1837, + "ĠRes": 1838, + "Ġhref": 1839, + "и": 1840, + "Ġcar": 1841, + "ypes": 1842, + "image": 1843, + "Un": 1844, + "Ġbool": 1845, + "AD": 1846, + "Ġgame": 1847, + ".Form": 1848, + "rows": 1849, + "*/": 1850, + "velop": 1851, + ".Drawing": 1852, + "Ġpath": 1853, + "ision": 1854, + "Ġeach": 1855, + "ĠPl": 1856, + "_type": 1857, + "Path": 1858, + "nection": 1859, + "Ġav": 1860, + "').": 1861, + "Ġsupport": 1862, + "ENT": 1863, + "rem": 1864, + "\").": 1865, + "Ġown": 1866, + "Ġcor": 1867, + "count": 1868, + "miss": 1869, + "ually": 1870, + "Ġmem": 1871, + "std": 1872, + "ience": 1873, + "search": 1874, + "\"ĊĊ": 1875, + "Form": 1876, + "Ġsex": 1877, + "ename": 1878, + "Ġsign": 1879, + "Ġet": 1880, + "ĠĠĠĠĠĠĠĠĠĠ": 1881, + "','": 1882, + "ĠApp": 1883, + "Ġthose": 1884, + "off": 1885, + "Ġerr": 1886, + "Ġsystem": 1887, + "Ġbest": 1888, + "code": 1889, + "Ġsame": 1890, + "Ġdi": 1891, + "uss": 1892, + "Ġcreate": 1893, + "ather": 1894, + "Array": 1895, + ".in": 1896, + "fe": 1897, + "Service": 1898, + "UN": 1899, + "ats": 1900, + "ĠZ": 1901, + "alth": 1902, + "Ġmade": 1903, + "true": 1904, + "AB": 1905, + "Ġmark": 1906, + "rid": 1907, + "ified": 1908, + ",čĊ": 1909, + "yn": 1910, + "press": 1911, + "Ġgroup": 1912, + "Ġfin": 1913, + "ĠLicense": 1914, + "Field": 1915, + "eger": 1916, + "Ġworld": 1917, + "iness": 1918, + "ty": 1919, + "Ġprocess": 1920, + "(b": 1921, + "Ġcre": 1922, + "arn": 1923, + "ives": 1924, + "Ġmain": 1925, + "ideo": 1926, + "36": 1927, + "_g": 1928, + "AG": 1929, + "valid": 1930, + "img": 1931, + "PI": 1932, + "Ġcolor": 1933, + "Ġreport": 1934, + "Ġtake": 1935, + "rib": 1936, + "OM": 1937, + "Ġday": 1938, + "Request": 1939, + "Ġsk": 1940, + "bers": 1941, + "ĉs": 1942, + ".Add": 1943, + "oot": 1944, + "Image": 1945, + "Ġcomple": 1946, + "ollection": 1947, + "Ġtop": 1948, + "Ġfree": 1949, + "AS": 1950, + "De": 1951, + "ĠOn": 1952, + "IG": 1953, + "90": 1954, + "eta": 1955, + "Date": 1956, + "Ġaction": 1957, + "34": 1958, + "Over": 1959, + "itor": 1960, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 1961, + "not": 1962, + "Ġindex": 1963, + "her": 1964, + "icon": 1965, + "On": 1966, + ";čĊčĊ": 1967, + "ivity": 1968, + "mand": 1969, + ".Windows": 1970, + "OL": 1971, + "Ġreal": 1972, + "Ġmax": 1973, + "land": 1974, + "....": 1975, + "raph": 1976, + "Ġbuild": 1977, + "leg": 1978, + "assword": 1979, + "?ĊĊ": 1980, + "â̦": 1981, + "ook": 1982, + "uck": 1983, + "Ġmessage": 1984, + "test": 1985, + "ivers": 1986, + "38": 1987, + "Ġinput": 1988, + "Ġart": 1989, + "Ġbetween": 1990, + "Get": 1991, + "enter": 1992, + "ground": 1993, + "ene": 1994, + "á": 1995, + ".length": 1996, + "Node": 1997, + "(i": 1998, + "Class": 1999, + "for": 2000, + "ĠâĢĶ": 2001, + "ten": 2002, + "oin": 2003, + "Ġke": 2004, + "ui": 2005, + "ĠIN": 2006, + "Ġtable": 2007, + "sub": 2008, + "ĠLe": 2009, + "Ġhead": 2010, + "Ġmust": 2011, + "////////////////": 2012, + ".util": 2013, + "Context": 2014, + "Ġorder": 2015, + "Ġmov": 2016, + "over": 2017, + "Ġcontin": 2018, + "Ġsay": 2019, + "static": 2020, + ".Text": 2021, + "ĠclassName": 2022, + "pany": 2023, + "Ġter": 2024, + "head": 2025, + "rg": 2026, + "Ġproduct": 2027, + "This": 2028, + ".âĢĿ": 2029, + "ĠBut": 2030, + "70": 2031, + "loy": 2032, + "Ġdouble": 2033, + "sg": 2034, + "Ġplace": 2035, + ".x": 2036, + "message": 2037, + "Ġinformation": 2038, + "private": 2039, + "Ġoper": 2040, + "ced": 2041, + "db": 2042, + "\">": 2043, + "Param": 2044, + "icle": 2045, + "Ġweek": 2046, + "Ġprop": 2047, + "table": 2048, + "idget": 2049, + "place": 2050, + "Prop": 2051, + "ĠAll": 2052, + "els": 2053, + "box": 2054, + ".ĊĊĊĊ": 2055, + ".R": 2056, + "ĠTo": 2057, + "iter": 2058, + "Sh": 2059, + "uration": 2060, + "older": 2061, + "_list": 2062, + "come": 2063, + "Ġsw": 2064, + "ization": 2065, + "ĉfor": 2066, + "bl": 2067, + "Ġprogram": 2068, + "(e": 2069, + "ape": 2070, + "check": 2071, + ".Forms": 2072, + "Ġund": 2073, + "ategory": 2074, + "75": 2075, + "ags": 2076, + "Ġresponse": 2077, + "US": 2078, + "request": 2079, + "Ġstruct": 2080, + "escription": 2081, + "Ġcode": 2082, + "_H": 2083, + "uffer": 2084, + "Ġwithout": 2085, + "lobal": 2086, + "Manager": 2087, + "ilter": 2088, + "PO": 2089, + "ĉthis": 2090, + "option": 2091, + "Ġsol": 2092, + "Ġ===": 2093, + "akes": 2094, + "Controller": 2095, + "44": 2096, + "Message": 2097, + "Ġref": 2098, + "ever": 2099, + "ĠSo": 2100, + "aining": 2101, + ".append": 2102, + "Ġstill": 2103, + "Ġprovid": 2104, + "Ġassert": 2105, + "med": 2106, + "Ġcap": 2107, + "usiness": 2108, + "Ġrep": 2109, + "tings": 2110, + "ved": 2111, + ".N": 2112, + "api": 2113, + "OD": 2114, + "Ġfield": 2115, + "iven": 2116, + "oto": 2117, + "âĢľ": 2118, + "col": 2119, + "(x": 2120, + "ght": 2121, + "Result": 2122, + "Code": 2123, + ".is": 2124, + "link": 2125, + "Ġcour": 2126, + "An": 2127, + "Ġteam": 2128, + "ĉint": 2129, + "ift": 2130, + "55": 2131, + "Ġsecond": 2132, + "Ġgoing": 2133, + "Ġrange": 2134, + "_E": 2135, + "ness": 2136, + "39": 2137, + "Ġfam": 2138, + "Ġnil": 2139, + "ĠCont": 2140, + "ailable": 2141, + "utes": 2142, + "atab": 2143, + "Ġfact": 2144, + "Ġvis": 2145, + "(&": 2146, + "ĠAN": 2147, + "31": 2148, + "Al": 2149, + "title": 2150, + "Ġandroid": 2151, + "CE": 2152, + "\\\"": 2153, + "irt": 2154, + "Ġwrit": 2155, + "н": 2156, + "ĉm": 2157, + "ftware": 2158, + "ond": 2159, + "Ġret": 2160, + "osition": 2161, + "Ġhome": 2162, + "Ġleft": 2163, + "args": 2164, + "meric": 2165, + "48": 2166, + "Ġdirect": 2167, + "oci": 2168, + "Pl": 2169, + "As": 2170, + "ret": 2171, + "ado": 2172, + "Of": 2173, + "chn": 2174, + "ĠGet": 2175, + "ee": 2176, + "ross": 2177, + "();": 2178, + "____": 2179, + ".ph": 2180, + "It": 2181, + "oute": 2182, + "Ġexper": 2183, + "chool": 2184, + "www": 2185, + "},": 2186, + "Ġallow": 2187, + "ĠÂ": 2188, + "())": 2189, + "size": 2190, + "ism": 2191, + "ai": 2192, + "tract": 2193, + "ane": 2194, + "...ĊĊ": 2195, + "context": 2196, + "Ġbeg": 2197, + "CH": 2198, + "Ġpage": 2199, + "hip": 2200, + "no": 2201, + "core": 2202, + "sp": 2203, + "Ġdifferent": 2204, + "iable": 2205, + "ĠMe": 2206, + "_IN": 2207, + "button": 2208, + "ĠIs": 2209, + "ervices": 2210, + "Ġca": 2211, + "Ġaround": 2212, + "App": 2213, + "ration": 2214, + "Ġrece": 2215, + "Ġreally": 2216, + "Ġimage": 2217, + "Ġtarget": 2218, + "Ġdep": 2219, + "opyright": 2220, + "tra": 2221, + "ingle": 2222, + "ital": 2223, + "Layout": 2224, + "Ġboth": 2225, + "Override": 2226, + "arm": 2227, + "=>": 2228, + "aterial": 2229, + "iled": 2230, + "Ġput": 2231, + "Qu": 2232, + "ÑĢ": 2233, + "ung": 2234, + "map": 2235, + "ĉĉĉĉĉĉĉĉ": 2236, + "Ġlevel": 2237, + "Component": 2238, + "book": 2239, + "creen": 2240, + "_RE": 2241, + "Ġconfig": 2242, + "ãģ": 2243, + "Or": 2244, + ".data": 2245, + "Ġdocument": 2246, + "\",\"": 2247, + "tribute": 2248, + "ux": 2249, + "Log": 2250, + "ference": 2251, + "post": 2252, + "_e": 2253, + "Ġlocal": 2254, + "andom": 2255, + "assert": 2256, + "Val": 2257, + "lected": 2258, + "ina": 2259, + "atabase": 2260, + "Add": 2261, + "Ġcontent": 2262, + ".print": 2263, + "signed": 2264, + "ric": 2265, + ".\"ĊĊ": 2266, + "Ġfa": 2267, + "!ĊĊ": 2268, + "-f": 2269, + "ived": 2270, + "Ġquest": 2271, + ".ex": 2272, + "Ġfloat": 2273, + "Ġdevelop": 2274, + "оÐ": 2275, + "Map": 2276, + "ading": 2277, + "Ġposs": 2278, + "UE": 2279, + "namespace": 2280, + "_O": 2281, + "ĉb": 2282, + ".Get": 2283, + ">(": 2284, + "json": 2285, + "etails": 2286, + "66": 2287, + "Ġtoo": 2288, + "Ġextends": 2289, + "ĠNone": 2290, + "Ġfore": 2291, + "(String": 2292, + "format": 2293, + "Ġgreat": 2294, + "inter": 2295, + "cale": 2296, + "Ñģ": 2297, + "ron": 2298, + "iving": 2299, + "Ent": 2300, + "ency": 2301, + "xt": 2302, + "oy": 2303, + "05": 2304, + "Ġmonth": 2305, + "Ġhapp": 2306, + "Ġsuper": 2307, + "bar": 2308, + "default": 2309, + "_de": 2310, + "ords": 2311, + "ln": 2312, + "({Ċ": 2313, + "ĠInd": 2314, + "ases": 2315, + "Ġtitle": 2316, + "Ġcontext": 2317, + "08": 2318, + "oh": 2319, + "-p": 2320, + "Em": 2321, + "Ġmet": 2322, + "Test": 2323, + "Ġlife": 2324, + "_v": 2325, + "ĠUS": 2326, + "UI": 2327, + "ocation": 2328, + "md": 2329, + "Ġ[Ċ": 2330, + "Ġ]": 2331, + "sw": 2332, + "Ġincre": 2333, + "script": 2334, + "ential": 2335, + "ways": 2336, + ".de": 2337, + "Ġsrc": 2338, + "Ġcatch": 2339, + "ĠAmeric": 2340, + "//Ċ": 2341, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 2342, + "Ġpay": 2343, + "plit": 2344, + "âĢĶ": 2345, + "Ġcoun": 2346, + "obj": 2347, + ".php": 2348, + "Ġchange": 2349, + "ething": 2350, + "'re": 2351, + "aster": 2352, + "los": 2353, + "lation": 2354, + "ĠĠĊ": 2355, + "Le": 2356, + "ä": 2357, + "({": 2358, + "ready": 2359, + "ĠNo": 2360, + "Ġposition": 2361, + "Ġold": 2362, + "Ġbook": 2363, + "abled": 2364, + "bug": 2365, + "202": 2366, + "Hand": 2367, + "};ĊĊ": 2368, + "isplay": 2369, + "aving": 2370, + "04": 2371, + "Ġgover": 2372, + "Ġversion": 2373, + "System": 2374, + "nect": 2375, + "response": 2376, + "Style": 2377, + "Up": 2378, + "angu": 2379, + "Ġthree": 2380, + "init": 2381, + "ero": 2382, + "Ġlaw": 2383, + "endif": 2384, + "Ġbase": 2385, + "email": 2386, + "(l": 2387, + "_V": 2388, + "Ġconf": 2389, + "ATE": 2390, + "Ġduring": 2391, + "tes": 2392, + "Ġconsole": 2393, + "ĠPr": 2394, + "Ġspe": 2395, + "ves": 2396, + "65": 2397, + "path": 2398, + "ialog": 2399, + "dition": 2400, + "_to": 2401, + "ards": 2402, + "Ġagainst": 2403, + "etwork": 2404, + "ĠPh": 2405, + "_L": 2406, + "cur": 2407, + "imit": 2408, + "With": 2409, + "Ġpower": 2410, + "ium": 2411, + "';ĊĊ": 2412, + "Ġwom": 2413, + "left": 2414, + "ources": 2415, + "atri": 2416, + "ĠIm": 2417, + "ĠMan": 2418, + "orth": 2419, + "${": 2420, + "88": 2421, + "quals": 2422, + "ese": 2423, + "_size": 2424, + "Ġiss": 2425, + "otal": 2426, + "-g": 2427, + "ique": 2428, + "rame": 2429, + "Ġwidth": 2430, + "erg": 2431, + ")(": 2432, + "ittle": 2433, + "TR": 2434, + "ĠThey": 2435, + "ences": 2436, + "02": 2437, + "rl": 2438, + "ons": 2439, + "Ġlabel": 2440, + ".y": 2441, + "-t": 2442, + "update": 2443, + "anel": 2444, + "sc": 2445, + ".to": 2446, + "Ġproject": 2447, + "ü": 2448, + "Ġelement": 2449, + "Ġsuccess": 2450, + "ĉĉĊ": 2451, + ".sh": 2452, + "ram": 2453, + "ched": 2454, + "())Ċ": 2455, + "Ġ(Ċ": 2456, + "Ġdate": 2457, + "Ġtot": 2458, + "_ST": 2459, + "All": 2460, + "ification": 2461, + "ĉvar": 2462, + "Ġtri": 2463, + "chem": 2464, + "my": 2465, + "Ġbig": 2466, + "ĠAd": 2467, + "ĠAt": 2468, + "ots": 2469, + "num": 2470, + "Act": 2471, + "Ġmap": 2472, + "era": 2473, + "cope": 2474, + ".$": 2475, + ",âĢĿ": 2476, + "Ġpop": 2477, + "Ġfew": 2478, + "Ġlen": 2479, + "uid": 2480, + "eters": 2481, + "ules": 2482, + "ÃŃ": 2483, + "source": 2484, + "https": 2485, + "Ġdem": 2486, + "Ġear": 2487, + "################": 2488, + "Ġmatch": 2489, + "ories": 2490, + "49": 2491, + "aces": 2492, + "ĠCl": 2493, + "Ġnode": 2494, + "78": 2495, + "irc": 2496, + "local": 2497, + "unity": 2498, + "};Ċ": 2499, + "Ġanother": 2500, + "<<": 2501, + "ogle": 2502, + "Ġsit": 2503, + "ework": 2504, + "TE": 2505, + ".I": 2506, + "NS": 2507, + "ology": 2508, + "ought": 2509, + ".Cont": 2510, + ">>": 2511, + "Ġcare": 2512, + "state": 2513, + "ĉprivate": 2514, + "Ġeffect": 2515, + "++)": 2516, + "_file": 2517, + "ending": 2518, + "Line": 2519, + "For": 2520, + "ior": 2521, + "ĠSc": 2522, + "Ġfun": 2523, + ".Size": 2524, + "ĉelse": 2525, + "])": 2526, + "start": 2527, + "vious": 2528, + "Ġ},": 2529, + "ours": 2530, + "Ġleg": 2531, + "Ġservice": 2532, + "Ġsince": 2533, + "iron": 2534, + "Label": 2535, + "Ġnon": 2536, + "Ġlos": 2537, + "iction": 2538, + "Ġfull": 2539, + "acter": 2540, + "board": 2541, + "gress": 2542, + "Ġturn": 2543, + "ither": 2544, + "09": 2545, + ".size": 2546, + "Ġbody": 2547, + "resh": 2548, + "eturn": 2549, + "199": 2550, + "(_": 2551, + "yles": 2552, + "ormal": 2553, + "pi": 2554, + "Ġsomething": 2555, + "!--": 2556, + "uint": 2557, + "Ġprodu": 2558, + "Ġstand": 2559, + "Ġproble": 2560, + "Ġavailable": 2561, + "mt": 2562, + "ĠBl": 2563, + "Ġ...": 2564, + "Ġblock": 2565, + "Input": 2566, + "Ġkeep": 2567, + "Count": 2568, + "open": 2569, + "Ġ['": 2570, + "Ġthrow": 2571, + "uilder": 2572, + "Action": 2573, + "Ġthings": 2574, + "True": 2575, + "Ġurl": 2576, + "ĠBo": 2577, + "printf": 2578, + "Ġred": 2579, + "js": 2580, + ".create": 2581, + "ĠOr": 2582, + "Status": 2583, + "Instance": 2584, + "Ġcontrol": 2585, + "Ġcome": 2586, + "Ġcustom": 2587, + "location": 2588, + "07": 2589, + "model": 2590, + "ĠčĊ": 2591, + "Ġsource": 2592, + "Ġeas": 2593, + ".out": 2594, + "]ĊĊ": 2595, + "oney": 2596, + "Ġawait": 2597, + "Ġpartic": 2598, + "AP": 2599, + "ublish": 2600, + "odes": 2601, + "_pro": 2602, + "ply": 2603, + "riter": 2604, + "Ġprov": 2605, + "Ġmill": 2606, + "HT": 2607, + "])Ċ": 2608, + "Ġchang": 2609, + "Ġask": 2610, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 2611, + "Ġoutput": 2612, + "Ġemail": 2613, + "68": 2614, + ".push": 2615, + "Ġ}čĊčĊ": 2616, + "ination": 2617, + "47": 2618, + "atrix": 2619, + "Table": 2620, + "uccess": 2621, + "]);Ċ": 2622, + "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 2623, + "Ġdisc": 2624, + "([": 2625, + "Ġbusiness": 2626, + "height": 2627, + ".html": 2628, + "ta": 2629, + "field": 2630, + "Ġrequired": 2631, + "_R": 2632, + "Ġgovern": 2633, + "}čĊčĊ": 2634, + "lex": 2635, + "500": 2636, + ".,": 2637, + "ĠSet": 2638, + "urch": 2639, + "///": 2640, + "ts": 2641, + "af": 2642, + "Ġmight": 2643, + "istory": 2644, + "Str": 2645, + "Ġnever": 2646, + "Response": 2647, + "arse": 2648, + "ada": 2649, + "ĠHow": 2650, + "Ġ*)": 2651, + "Ġ;": 2652, + "Ġhard": 2653, + "Ad": 2654, + "Ġintern": 2655, + "used": 2656, + "(data": 2657, + "mod": 2658, + "annel": 2659, + "Ġnp": 2660, + "ugg": 2661, + "Ġ/>Ċ": 2662, + "Ġcalled": 2663, + "body": 2664, + "Ġcho": 2665, + "(r": 2666, + "_set": 2667, + "ird": 2668, + "Ġ>=": 2669, + "Ġ};Ċ": 2670, + "Ġoptions": 2671, + "ĠGener": 2672, + "Ġheight": 2673, + "Point": 2674, + "You": 2675, + "ety": 2676, + "Click": 2677, + "Ġsmall": 2678, + "Ġide": 2679, + "Ġaccess": 2680, + "anguage": 2681, + "Ġprotected": 2682, + "Ġjob": 2683, + "ĠThere": 2684, + "Def": 2685, + "Ġaddress": 2686, + "Ġuint": 2687, + "Not": 2688, + "oo": 2689, + "aps": 2690, + "
&": 5909,
+ "CON": 5910,
+ "Ġrepl": 5911,
+ "Ġregular": 5912,
+ "Storage": 5913,
+ "ramework": 5914,
+ "Ġgoal": 5915,
+ "Ġtouch": 5916,
+ ".widget": 5917,
+ "Ġbuilt": 5918,
+ "des": 5919,
+ "Part": 5920,
+ "(re": 5921,
+ "Ġworth": 5922,
+ "hib": 5923,
+ "game": 5924,
+ "91": 5925,
+ "192": 5926,
+ "Ġв": 5927,
+ "acion": 5928,
+ "ĠWhite": 5929,
+ "(type": 5930,
+ "(`": 5931,
+ "81": 5932,
+ "Ġnatural": 5933,
+ "Ġinj": 5934,
+ "Ġcalcul": 5935,
+ "ĠApril": 5936,
+ ".List": 5937,
+ "Ġassociated": 5938,
+ "ĉSystem": 5939,
+ "~~": 5940,
+ "=[": 5941,
+ "Ġstorage": 5942,
+ "Ġbytes": 5943,
+ "Ġtravel": 5944,
+ "Ġsou": 5945,
+ "Ġpassed": 5946,
+ "!=": 5947,
+ "ascript": 5948,
+ ".open": 5949,
+ "Ġgrid": 5950,
+ "Ġbus": 5951,
+ "Ġrecogn": 5952,
+ "Ab": 5953,
+ "Ġhon": 5954,
+ "ĠCenter": 5955,
+ "Ġprec": 5956,
+ "build": 5957,
+ "73": 5958,
+ "HTML": 5959,
+ "ĠSan": 5960,
+ "Ġcountries": 5961,
+ "aled": 5962,
+ "token": 5963,
+ "kt": 5964,
+ "Ġqual": 5965,
+ "Last": 5966,
+ "adow": 5967,
+ "Ġmanufact": 5968,
+ "idad": 5969,
+ "jango": 5970,
+ "Next": 5971,
+ "xf": 5972,
+ ".a": 5973,
+ "Ġporno": 5974,
+ "ĠPM": 5975,
+ "erve": 5976,
+ "iting": 5977,
+ "_th": 5978,
+ "ci": 5979,
+ "=None": 5980,
+ "gs": 5981,
+ "Ġlogin": 5982,
+ "atives": 5983,
+ "']);Ċ": 5984,
+ "Äħ": 5985,
+ "Ġill": 5986,
+ "IA": 5987,
+ "children": 5988,
+ "DO": 5989,
+ "Ġlevels": 5990,
+ "Ġ{{": 5991,
+ "Ġlooks": 5992,
+ "Ġ\"#": 5993,
+ "ToString": 5994,
+ "Ġnecessary": 5995,
+ "ĠĠĠĊ": 5996,
+ "cell": 5997,
+ "Entry": 5998,
+ "Ġ'#": 5999,
+ "Ġextrem": 6000,
+ "Selector": 6001,
+ "Ġplaceholder": 6002,
+ "Load": 6003,
+ "Ġreleased": 6004,
+ "ORE": 6005,
+ "Enumer": 6006,
+ "ĠTV": 6007,
+ "SET": 6008,
+ "inq": 6009,
+ "Press": 6010,
+ "ĠDepartment": 6011,
+ "Ġproperties": 6012,
+ "Ġrespond": 6013,
+ "Search": 6014,
+ "ael": 6015,
+ "Ġrequ": 6016,
+ "ĠBook": 6017,
+ "/Ċ": 6018,
+ "(st": 6019,
+ "Ġfinancial": 6020,
+ "icket": 6021,
+ "_input": 6022,
+ "Ġthreat": 6023,
+ "(in": 6024,
+ "Strip": 6025,
+ "ìĿ": 6026,
+ "ção": 6027,
+ "71": 6028,
+ "Ġevidence": 6029,
+ "));": 6030,
+ "ĠBro": 6031,
+ "Ġ[];Ċ": 6032,
+ "Ġou": 6033,
+ "buf": 6034,
+ "Script": 6035,
+ "dat": 6036,
+ "Ġrule": 6037,
+ "#import": 6038,
+ "=\"/": 6039,
+ "Serial": 6040,
+ "Ġstarting": 6041,
+ "[index": 6042,
+ "ae": 6043,
+ "Ġcontrib": 6044,
+ "session": 6045,
+ "_new": 6046,
+ "utable": 6047,
+ "ober": 6048,
+ "Ġ\"./": 6049,
+ "Ġlogger": 6050,
+ "Ġrecently": 6051,
+ "Ġreturned": 6052,
+ "ččĊ": 6053,
+ ")))Ċ": 6054,
+ "itions": 6055,
+ "Ġseek": 6056,
+ "Ġcommunic": 6057,
+ "Ġ\".": 6058,
+ "Ġusername": 6059,
+ "ECT": 6060,
+ "DS": 6061,
+ "Ġotherwise": 6062,
+ "ĠGerman": 6063,
+ ".aw": 6064,
+ "Adapter": 6065,
+ "ixel": 6066,
+ "Ġsystems": 6067,
+ "Ġdrop": 6068,
+ "83": 6069,
+ "Ġstructure": 6070,
+ "Ġ$(\"#": 6071,
+ "encies": 6072,
+ "anning": 6073,
+ "ĠLink": 6074,
+ "ĠResponse": 6075,
+ "Ġstri": 6076,
+ "ż": 6077,
+ "ĠDB": 6078,
+ "æĹ": 6079,
+ "android": 6080,
+ "submit": 6081,
+ "otion": 6082,
+ "92": 6083,
+ "(@": 6084,
+ ".test": 6085,
+ "82": 6086,
+ "ĊĊĊĊĊĊĊĊ": 6087,
+ "];čĊ": 6088,
+ "Ġdirectly": 6089,
+ "Ġ\"%": 6090,
+ "ris": 6091,
+ "elta": 6092,
+ "AIL": 6093,
+ "){čĊ": 6094,
+ "mine": 6095,
+ "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 6096,
+ "(k": 6097,
+ "bon": 6098,
+ "asic": 6099,
+ "pite": 6100,
+ "___": 6101,
+ "Max": 6102,
+ "Ġerrors": 6103,
+ "ĠWhile": 6104,
+ "Ġarguments": 6105,
+ "Ġensure": 6106,
+ "Right": 6107,
+ "-based": 6108,
+ "Web": 6109,
+ "Ġ-=": 6110,
+ "Ġintrodu": 6111,
+ "ĠInst": 6112,
+ "ĠWash": 6113,
+ "ordin": 6114,
+ "join": 6115,
+ "Database": 6116,
+ "Ġgrad": 6117,
+ "Ġusually": 6118,
+ "ITE": 6119,
+ "Props": 6120,
+ "?>Ċ": 6121,
+ "ĠGo": 6122,
+ "@Override": 6123,
+ "REF": 6124,
+ "Ġip": 6125,
+ "ĠAustral": 6126,
+ "Ġist": 6127,
+ "ViewById": 6128,
+ "Ġserious": 6129,
+ "Ġcustomer": 6130,
+ ".prototype": 6131,
+ "odo": 6132,
+ "cor": 6133,
+ "Ġdoor": 6134,
+ "ĠWITHOUT": 6135,
+ "Ġplant": 6136,
+ "Ġbegan": 6137,
+ "Ġdistance": 6138,
+ "()).": 6139,
+ "Ġchance": 6140,
+ "Ġord": 6141,
+ "came": 6142,
+ "pragma": 6143,
+ "Ġprotect": 6144,
+ "ragment": 6145,
+ "ĠNode": 6146,
+ "ening": 6147,
+ "Ñĩ": 6148,
+ "Ġroute": 6149,
+ "ĠSchool": 6150,
+ "hi": 6151,
+ "Ġneighb": 6152,
+ "After": 6153,
+ "licit": 6154,
+ "Ġcontr": 6155,
+ "Ġprimary": 6156,
+ "AA": 6157,
+ ".WriteLine": 6158,
+ "utils": 6159,
+ "Ġbi": 6160,
+ "Red": 6161,
+ ".Linq": 6162,
+ ".object": 6163,
+ "Ġleaders": 6164,
+ "unities": 6165,
+ "Ġgun": 6166,
+ "onth": 6167,
+ "ĠDev": 6168,
+ "FILE": 6169,
+ "Ġcomments": 6170,
+ "_len": 6171,
+ "arrow": 6172,
+ "amount": 6173,
+ "Range": 6174,
+ "sert": 6175,
+ "GridView": 6176,
+ "Ġupdated": 6177,
+ "ĠMo": 6178,
+ "Ġinform": 6179,
+ "ociety": 6180,
+ "ala": 6181,
+ "Access": 6182,
+ "Ġhab": 6183,
+ "Ġcreat": 6184,
+ "_arg": 6185,
+ "ĠJanuary": 6186,
+ "ĠDay": 6187,
+ "\")čĊ": 6188,
+ "uple": 6189,
+ "document": 6190,
+ "gorith": 6191,
+ "menu": 6192,
+ "ĠOver": 6193,
+ "bb": 6194,
+ ".title": 6195,
+ "_out": 6196,
+ "Ġled": 6197,
+ "uri": 6198,
+ "Ġ?>": 6199,
+ "gl": 6200,
+ "Ġbank": 6201,
+ "ayment": 6202,
+ "ĉprintf": 6203,
+ "MD": 6204,
+ "Ġsample": 6205,
+ "Ġhands": 6206,
+ "ĠVersion": 6207,
+ "uario": 6208,
+ "Ġoffers": 6209,
+ "ityEngine": 6210,
+ "Ġshape": 6211,
+ "Ġsleep": 6212,
+ "_point": 6213,
+ "Settings": 6214,
+ "Ġachie": 6215,
+ "Ġsold": 6216,
+ "ota": 6217,
+ ".bind": 6218,
+ "Am": 6219,
+ "Ġsafe": 6220,
+ "Store": 6221,
+ "Ġshared": 6222,
+ "Ġpriv": 6223,
+ "_VAL": 6224,
+ "Ġsens": 6225,
+ "){": 6226,
+ "Ġremember": 6227,
+ "shared": 6228,
+ "element": 6229,
+ "Ġshoot": 6230,
+ "Vert": 6231,
+ "cout": 6232,
+ "Ġenv": 6233,
+ "_label": 6234,
+ "Ġ>Ċ": 6235,
+ "run": 6236,
+ "Ġscene": 6237,
+ "(array": 6238,
+ "device": 6239,
+ "_title": 6240,
+ "agon": 6241,
+ "]čĊ": 6242,
+ "aby": 6243,
+ "Ġbecame": 6244,
+ "boolean": 6245,
+ "Ġpark": 6246,
+ "ĠCode": 6247,
+ "upload": 6248,
+ "riday": 6249,
+ "ĠSeptember": 6250,
+ "Fe": 6251,
+ "Ġsen": 6252,
+ "cing": 6253,
+ "FL": 6254,
+ "Col": 6255,
+ "uts": 6256,
+ "_page": 6257,
+ "inn": 6258,
+ "Ġimplied": 6259,
+ "aling": 6260,
+ "Ġyourself": 6261,
+ ".Count": 6262,
+ "conf": 6263,
+ "Ġaud": 6264,
+ "_init": 6265,
+ ".)": 6266,
+ "Ġwrote": 6267,
+ "003": 6268,
+ "NG": 6269,
+ ".Error": 6270,
+ "ä»": 6271,
+ ".for": 6272,
+ "Ġequal": 6273,
+ "ĠRequest": 6274,
+ "Ġserial": 6275,
+ "Ġallows": 6276,
+ "XX": 6277,
+ "Ġmiddle": 6278,
+ "chor": 6279,
+ "195": 6280,
+ "94": 6281,
+ "ø": 6282,
+ "erval": 6283,
+ ".Column": 6284,
+ "reading": 6285,
+ "Ġescort": 6286,
+ "ĠAugust": 6287,
+ "Ġquickly": 6288,
+ "Ġweap": 6289,
+ "ĠCG": 6290,
+ "ropri": 6291,
+ "ho": 6292,
+ "Ġcop": 6293,
+ "(struct": 6294,
+ "ĠBig": 6295,
+ "Ġvs": 6296,
+ "Ġfrequ": 6297,
+ ".Value": 6298,
+ "Ġactions": 6299,
+ "Ġproper": 6300,
+ "Ġinn": 6301,
+ "Ġobjects": 6302,
+ "Ġmatrix": 6303,
+ "avascript": 6304,
+ "Ġones": 6305,
+ ".group": 6306,
+ "Ġgreen": 6307,
+ "Ġpaint": 6308,
+ "ools": 6309,
+ "ycl": 6310,
+ "encode": 6311,
+ "olt": 6312,
+ "comment": 6313,
+ ".api": 6314,
+ "Dir": 6315,
+ "Ġune": 6316,
+ "izont": 6317,
+ ".position": 6318,
+ "Ġdesigned": 6319,
+ "_val": 6320,
+ "avi": 6321,
+ "iring": 6322,
+ "tab": 6323,
+ "Ġlayer": 6324,
+ "Ġviews": 6325,
+ "Ġreve": 6326,
+ "rael": 6327,
+ "ĠON": 6328,
+ "rics": 6329,
+ "160": 6330,
+ "np": 6331,
+ "Ġcore": 6332,
+ "());čĊ": 6333,
+ "Main": 6334,
+ "Ġexpert": 6335,
+ "ĉĉčĊ": 6336,
+ "_en": 6337,
+ "Ġ/>": 6338,
+ "utter": 6339,
+ "IAL": 6340,
+ "ails": 6341,
+ "ĠKing": 6342,
+ "*/ĊĊ": 6343,
+ "ĠMet": 6344,
+ "_end": 6345,
+ "addr": 6346,
+ "ora": 6347,
+ "Ġir": 6348,
+ "Min": 6349,
+ "Ġsurpr": 6350,
+ "Ġrepe": 6351,
+ "Ġdirectory": 6352,
+ "PUT": 6353,
+ "-S": 6354,
+ "Ġelection": 6355,
+ "haps": 6356,
+ ".pre": 6357,
+ "cm": 6358,
+ "Values": 6359,
+ "Ġ\"Ċ": 6360,
+ "column": 6361,
+ "ivil": 6362,
+ "Login": 6363,
+ "inue": 6364,
+ "93": 6365,
+ "Ġbeautiful": 6366,
+ "Ġsecret": 6367,
+ "(event": 6368,
+ "Ġchat": 6369,
+ "ums": 6370,
+ "Ġorigin": 6371,
+ "Ġeffects": 6372,
+ "Ġmanagement": 6373,
+ "illa": 6374,
+ "tk": 6375,
+ "Ġsetting": 6376,
+ "ĠCour": 6377,
+ "Ġmassage": 6378,
+ "ĉend": 6379,
+ "Ġhappy": 6380,
+ "Ġfinish": 6381,
+ "Ġcamera": 6382,
+ "ĠVer": 6383,
+ "ĠDemocr": 6384,
+ "ĠHer": 6385,
+ "(Q": 6386,
+ "cons": 6387,
+ "ita": 6388,
+ "Ġ'.": 6389,
+ "{}": 6390,
+ "ĉC": 6391,
+ "Ġstuff": 6392,
+ "194": 6393,
+ "Ġ:Ċ": 6394,
+ "ĠAR": 6395,
+ "Task": 6396,
+ "hidden": 6397,
+ "eros": 6398,
+ "IGN": 6399,
+ "atio": 6400,
+ "ĠHealth": 6401,
+ "olute": 6402,
+ "Enter": 6403,
+ "'>": 6404,
+ "ĠTwitter": 6405,
+ "ĠCounty": 6406,
+ "scribe": 6407,
+ "Ġ=>Ċ": 6408,
+ "Ġhy": 6409,
+ "fit": 6410,
+ "Ġmilitary": 6411,
+ "Ġsale": 6412,
+ "required": 6413,
+ "non": 6414,
+ "bootstrap": 6415,
+ "hold": 6416,
+ "rim": 6417,
+ "-old": 6418,
+ "ĠDown": 6419,
+ "Ġmention": 6420,
+ "contact": 6421,
+ "_group": 6422,
+ "oday": 6423,
+ "Ġtown": 6424,
+ "Ġsolution": 6425,
+ "uate": 6426,
+ "elling": 6427,
+ "]->": 6428,
+ "otes": 6429,
+ "ental": 6430,
+ "omen": 6431,
+ "ospital": 6432,
+ "ĠSup": 6433,
+ "_EN": 6434,
+ "Ġslow": 6435,
+ "SESSION": 6436,
+ "Ġblue": 6437,
+ "ago": 6438,
+ "Ġlives": 6439,
+ "Ġ^": 6440,
+ ".un": 6441,
+ "inst": 6442,
+ "enge": 6443,
+ "Ġcustomers": 6444,
+ "Ġcast": 6445,
+ "udget": 6446,
+ "ï¼ģ": 6447,
+ "icens": 6448,
+ "Ġdetermin": 6449,
+ "Selected": 6450,
+ "_pl": 6451,
+ "ueue": 6452,
+ "Ġdark": 6453,
+ "//ĊĊ": 6454,
+ "si": 6455,
+ "thern": 6456,
+ "ĠJapan": 6457,
+ "/w": 6458,
+ "PU": 6459,
+ "ĠEast": 6460,
+ "ovie": 6461,
+ "Ġpackage": 6462,
+ "Ġnor": 6463,
+ "Ġapi": 6464,
+ "bot": 6465,
+ "\"];Ċ": 6466,
+ "_post": 6467,
+ "ulate": 6468,
+ "Ġclub": 6469,
+ "'));Ċ": 6470,
+ "Ġloop": 6471,
+ "PIO": 6472,
+ "ione": 6473,
+ "shot": 6474,
+ "Initial": 6475,
+ "Ġplayed": 6476,
+ "register": 6477,
+ "rought": 6478,
+ "_max": 6479,
+ "acement": 6480,
+ "match": 6481,
+ "raphics": 6482,
+ "AST": 6483,
+ "Ġexisting": 6484,
+ "Ġcomplex": 6485,
+ "DA": 6486,
+ ".Ch": 6487,
+ ".common": 6488,
+ "mo": 6489,
+ "Ġ'../../": 6490,
+ "ito": 6491,
+ "Ġanalysis": 6492,
+ "Ġdeliver": 6493,
+ "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĊ": 6494,
+ "idx": 6495,
+ "Ãł": 6496,
+ "ongo": 6497,
+ "ĠEnglish": 6498,
+ "Ċ": 10197,
+ "_default": 10198,
+ "ĠDatabase": 10199,
+ "rep": 10200,
+ "ESS": 10201,
+ "nergy": 10202,
+ ".Find": 10203,
+ "_mask": 10204,
+ "Ġrise": 10205,
+ "Ġkernel": 10206,
+ "::$": 10207,
+ ".Q": 10208,
+ "Ġoffering": 10209,
+ "decl": 10210,
+ "ĠCS": 10211,
+ "Ġlisted": 10212,
+ "Ġmostly": 10213,
+ "enger": 10214,
+ "Ġblocks": 10215,
+ "olo": 10216,
+ "Ġgoverning": 10217,
+ "\\F": 10218,
+ "Ġconcent": 10219,
+ ".getText": 10220,
+ "Ġmb": 10221,
+ "Ġoccurred": 10222,
+ "Ġchanging": 10223,
+ "Scene": 10224,
+ "_CODE": 10225,
+ "Beh": 10226,
+ "\"The": 10227,
+ "Ġtile": 10228,
+ "ĠAssociation": 10229,
+ "ĉP": 10230,
+ "alty": 10231,
+ "_ad": 10232,
+ "odies": 10233,
+ "iated": 10234,
+ "Ġprepared": 10235,
+ "possible": 10236,
+ "Ġmort": 10237,
+ "TEST": 10238,
+ "142": 10239,
+ "Ġignore": 10240,
+ "Ġcalc": 10241,
+ "Ġrs": 10242,
+ "ĠassertEquals": 10243,
+ "Ġsz": 10244,
+ "ĠTHIS": 10245,
+ ".\"Ċ": 10246,
+ "Ġcanvas": 10247,
+ "java": 10248,
+ "Ġdut": 10249,
+ "VALID": 10250,
+ ".sql": 10251,
+ ".input": 10252,
+ "Ġaux": 10253,
+ "Sup": 10254,
+ "Ġartist": 10255,
+ "Vec": 10256,
+ "_TIME": 10257,
+ ".stringify": 10258,
+ "etween": 10259,
+ "ĠCategory": 10260,
+ "Ġ[-": 10261,
+ "ĠDevExpress": 10262,
+ "ĠJul": 10263,
+ "Ġring": 10264,
+ ".ed": 10265,
+ "YY": 10266,
+ "Let": 10267,
+ "TextField": 10268,
+ "Ġflat": 10269,
+ "_print": 10270,
+ "ĠOTHER": 10271,
+ "adian": 10272,
+ "Ġchecked": 10273,
+ "ele": 10274,
+ "Align": 10275,
+ "standing": 10276,
+ "Ġ[],": 10277,
+ "Ġlab": 10278,
+ "ucky": 10279,
+ "ĠChristmas": 10280,
+ "(image": 10281,
+ ".module": 10282,
+ "Ġlots": 10283,
+ "Ġslightly": 10284,
+ "(final": 10285,
+ "erge": 10286,
+ "è¿": 10287,
+ "147": 10288,
+ "ĠPolice": 10289,
+ "143": 10290,
+ "ĠRight": 10291,
+ "Ġaward": 10292,
+ "ĠOS": 10293,
+ "Ġ{}ĊĊ": 10294,
+ "Ġptr": 10295,
+ "oves": 10296,
+ "icated": 10297,
+ "ем": 10298,
+ "Ġmanage": 10299,
+ "oliday": 10300,
+ "Amount": 10301,
+ "oolStrip": 10302,
+ "tbody": 10303,
+ "Nav": 10304,
+ "wrap": 10305,
+ "BB": 10306,
+ "Ġwatching": 10307,
+ "arios": 10308,
+ "Ġoptional": 10309,
+ "_K": 10310,
+ "ĠLicensed": 10311,
+ ".Map": 10312,
+ "Timer": 10313,
+ "ĠAP": 10314,
+ "ĠRev": 10315,
+ "(o": 10316,
+ ",c": 10317,
+ "umin": 10318,
+ "etailed": 10319,
+ "ĠHy": 10320,
+ "Ġblank": 10321,
+ "agger": 10322,
+ "ĠSelf": 10323,
+ "()[": 10324,
+ ".make": 10325,
+ "earn": 10326,
+ "channel": 10327,
+ ";Ċ": 10342,
+ "World": 10343,
+ "Ġpython": 10344,
+ "Ġlif": 10345,
+ "Ġtrav": 10346,
+ "Ġconven": 10347,
+ "company": 10348,
+ "ĠClub": 10349,
+ "138": 10350,
+ "Ver": 10351,
+ "Btn": 10352,
+ "Ġzone": 10353,
+ "products": 10354,
+ "ĠEduc": 10355,
+ "Ġverify": 10356,
+ "ĠMil": 10357,
+ "ono": 10358,
+ "]);ĊĊ": 10359,
+ "ENCE": 10360,
+ "Ġpacket": 10361,
+ "Ġcer": 10362,
+ "Ġenumer": 10363,
+ "Ġpars": 10364,
+ "formed": 10365,
+ "Ġoccup": 10366,
+ "tre": 10367,
+ "Ġexercise": 10368,
+ "Day": 10369,
+ "_sum": 10370,
+ "Ġasking": 10371,
+ "aption": 10372,
+ "Ġorders": 10373,
+ "Ġspending": 10374,
+ "ĠERR": 10375,
+ ".Dis": 10376,
+ "ĠUtil": 10377,
+ "âĢľI": 10378,
+ "\\'": 10379,
+ "?)": 10380,
+ "/>Ċ": 10381,
+ "Ġemot": 10382,
+ "Ġinfluence": 10383,
+ "ĠAfrica": 10384,
+ "atters": 10385,
+ "Ùħ": 10386,
+ ".session": 10387,
+ "Ġchief": 10388,
+ "ĉĉĉĉĉĉĉĉĉĉĉ": 10389,
+ "Ġtom": 10390,
+ "cluded": 10391,
+ "serial": 10392,
+ "_handler": 10393,
+ ".Type": 10394,
+ "aped": 10395,
+ "Ġpolicies": 10396,
+ "-ex": 10397,
+ "-tr": 10398,
+ "blank": 10399,
+ "merce": 10400,
+ "Ġcoverage": 10401,
+ "Ġrc": 10402,
+ "_matrix": 10403,
+ "_box": 10404,
+ "Ġcharges": 10405,
+ "ĠBoston": 10406,
+ "Pe": 10407,
+ "Ġcircum": 10408,
+ "Ġfilled": 10409,
+ "148": 10410,
+ "Ġnorth": 10411,
+ "ictureBox": 10412,
+ "ĉres": 10413,
+ "è®": 10414,
+ "Ġtermin": 10415,
+ "Ġ[â̦": 10416,
+ "IRECT": 10417,
+ "Ġber": 10418,
+ "Ġ\"../../": 10419,
+ "retch": 10420,
+ ".code": 10421,
+ "_col": 10422,
+ "ĠGovernment": 10423,
+ "Ġargv": 10424,
+ "ĠLord": 10425,
+ "asi": 10426,
+ "Exec": 10427,
+ "ĉlet": 10428,
+ "vertis": 10429,
+ "Ġdiscussion": 10430,
+ "enance": 10431,
+ "outube": 10432,
+ "typeof": 10433,
+ "Ġserved": 10434,
+ "ĠPut": 10435,
+ "ĉx": 10436,
+ "Ġsweet": 10437,
+ "Before": 10438,
+ "ategy": 10439,
+ ".of": 10440,
+ "ĠMaterial": 10441,
+ "Sort": 10442,
+ "ONT": 10443,
+ "igital": 10444,
+ "Why": 10445,
+ "Ġsust": 10446,
+ "Ġç": 10447,
+ "abet": 10448,
+ "Ġsegment": 10449,
+ "Ġ[],Ċ": 10450,
+ "ĠMuslim": 10451,
+ "ĠfindViewById": 10452,
+ "cut": 10453,
+ "_TEXT": 10454,
+ "ĠMary": 10455,
+ "Ġloved": 10456,
+ "Ġlie": 10457,
+ "ĠJO": 10458,
+ "Ġisset": 10459,
+ "month": 10460,
+ "Ġprime": 10461,
+ "ti": 10462,
+ "ĠCarol": 10463,
+ "Use": 10464,
+ "146": 10465,
+ "ĠPop": 10466,
+ "ĠSave": 10467,
+ "Interval": 10468,
+ "execute": 10469,
+ "dy": 10470,
+ "ĠIran": 10471,
+ "_cont": 10472,
+ "ĉT": 10473,
+ "Ġphase": 10474,
+ "checkbox": 10475,
+ "week": 10476,
+ "Ġhide": 10477,
+ "Ġtil": 10478,
+ "Ġju": 10479,
+ "Custom": 10480,
+ "burg": 10481,
+ "/M": 10482,
+ "TON": 10483,
+ "Ġquant": 10484,
+ "Ġrub": 10485,
+ "ixels": 10486,
+ "Ġinstalled": 10487,
+ "Ġdump": 10488,
+ "Ġproperly": 10489,
+ "(List": 10490,
+ "Ġdecide": 10491,
+ "apply": 10492,
+ "Has": 10493,
+ "Ġkeeping": 10494,
+ "Ġcitizens": 10495,
+ "Ġjoint": 10496,
+ "pool": 10497,
+ "Socket": 10498,
+ "_op": 10499,
+ "Ġweapon": 10500,
+ "gnore": 10501,
+ "ĠExec": 10502,
+ "otten": 10503,
+ "ĠMS": 10504,
+ "Ġ(-": 10505,
+ "ĠReview": 10506,
+ "Ġexamples": 10507,
+ "Ġtight": 10508,
+ "!(": 10509,
+ "DP": 10510,
+ "ĠMessageBox": 10511,
+ "Ġphotograph": 10512,
+ "164": 10513,
+ "URI": 10514,
+ "ét": 10515,
+ "low": 10516,
+ "ĠGrand": 10517,
+ ".persistence": 10518,
+ "Ġmaintain": 10519,
+ "Ġnums": 10520,
+ "Ġzip": 10521,
+ "ials": 10522,
+ "ĠGets": 10523,
+ "peg": 10524,
+ "ĠBuffer": 10525,
+ "~~~~": 10526,
+ "rastructure": 10527,
+ "ĠPL": 10528,
+ "uen": 10529,
+ "obby": 10530,
+ "sizeof": 10531,
+ "Ġpic": 10532,
+ "Ġseed": 10533,
+ "Ġexperienced": 10534,
+ "Ġodd": 10535,
+ "Ġkick": 10536,
+ "Ġprocedure": 10537,
+ "avigator": 10538,
+ "-on": 10539,
+ ",j": 10540,
+ "ĠAlthough": 10541,
+ "ĠuserId": 10542,
+ "accept": 10543,
+ "Blue": 10544,
+ "IColor": 10545,
+ "layer": 10546,
+ "available": 10547,
+ "Ġends": 10548,
+ ".table": 10549,
+ "Ġdataset": 10550,
+ "bus": 10551,
+ "Ġexplain": 10552,
+ "(pro": 10553,
+ "ĠCommittee": 10554,
+ "Ġnoted": 10555,
+ "]:Ċ": 10556,
+ "Dim": 10557,
+ "stdio": 10558,
+ "154": 10559,
+ ".\",Ċ": 10560,
+ "_source": 10561,
+ "181": 10562,
+ "ĠWeek": 10563,
+ "ĠEdge": 10564,
+ "Ġoperating": 10565,
+ "Ġeste": 10566,
+ "ipl": 10567,
+ "330": 10568,
+ "agination": 10569,
+ "Ġproceed": 10570,
+ "Ġanimation": 10571,
+ ".Models": 10572,
+ "ĠWatch": 10573,
+ "iat": 10574,
+ "Ġoppon": 10575,
+ "/A": 10576,
+ "Report": 10577,
+ "Ġsounds": 10578,
+ "_buf": 10579,
+ "IELD": 10580,
+ "Ġbund": 10581,
+ "ĉget": 10582,
+ ".pr": 10583,
+ "(tmp": 10584,
+ "Ġkid": 10585,
+ ">ĊĊĊ": 10586,
+ "Ġyang": 10587,
+ "NotFound": 10588,
+ "ÑĨ": 10589,
+ "math": 10590,
+ "@gmail": 10591,
+ "ĠLIMIT": 10592,
+ "redients": 10593,
+ "Ġvent": 10594,
+ "avigate": 10595,
+ "Look": 10596,
+ "Ġreligious": 10597,
+ "Ġrand": 10598,
+ "rio": 10599,
+ "(GL": 10600,
+ "_ip": 10601,
+ "uan": 10602,
+ "iciency": 10603,
+ "ĠChange": 10604,
+ ">čĊčĊ": 10605,
+ "ĠEntity": 10606,
+ "Ġrencontre": 10607,
+ "ĠRet": 10608,
+ "plan": 10609,
+ "én": 10610,
+ "BOOL": 10611,
+ "uries": 10612,
+ "train": 10613,
+ "Definition": 10614,
+ "============": 10615,
+ "zz": 10616,
+ "450": 10617,
+ "Animation": 10618,
+ "ĠOK": 10619,
+ "_menu": 10620,
+ ".bl": 10621,
+ "_score": 10622,
+ "Ġacad": 10623,
+ "(System": 10624,
+ "Ġrefresh": 10625,
+ "'=>$": 10626,
+ ".Graphics": 10627,
+ "amento": 10628,
+ "pid": 10629,
+ "tc": 10630,
+ "Ġtips": 10631,
+ "Ġhomes": 10632,
+ "Ġfuel": 10633,
+ "âĸ": 10634,
+ "_helper": 10635,
+ "ĠĠčĊ": 10636,
+ "ĠRoom": 10637,
+ ".Close": 10638,
+ "_attr": 10639,
+ "ĠMount": 10640,
+ "ĠEv": 10641,
+ "arser": 10642,
+ "_top": 10643,
+ "eah": 10644,
+ "ĠDelete": 10645,
+ "ãĢį": 10646,
+ "uke": 10647,
+ "Ġusage": 10648,
+ "aria": 10649,
+ "_dev": 10650,
+ "Ġtexture": 10651,
+ "Ġconversation": 10652,
+ "eper": 10653,
+ "Bean": 10654,
+ "done": 10655,
+ "nonatomic": 10656,
+ "ĠSecond": 10657,
+ "Ġshooting": 10658,
+ "_pre": 10659,
+ "Components": 10660,
+ "Ġ]ĊĊ": 10661,
+ "__,": 10662,
+ "stitution": 10663,
+ ".Char": 10664,
+ ">();ĊĊ": 10665,
+ "Ġpresented": 10666,
+ "Ġwa": 10667,
+ "oker": 10668,
+ "-ĊĊ": 10669,
+ "iner": 10670,
+ "Ġbecoming": 10671,
+ "Ġincident": 10672,
+ "Att": 10673,
+ "162": 10674,
+ "Ġrevealed": 10675,
+ "forc": 10676,
+ "Ġboot": 10677,
+ ".page": 10678,
+ "Enumerator": 10679,
+ "165": 10680,
+ "_->": 10681,
+ "Photo": 10682,
+ "Ġspring": 10683,
+ ".\",": 10684,
+ "ĠDictionary": 10685,
+ "BJECT": 10686,
+ "Ġlocations": 10687,
+ "Ġsamples": 10688,
+ "InputStream": 10689,
+ "ĠBrown": 10690,
+ "Ġstats": 10691,
+ "quality": 10692,
+ "Ñħ": 10693,
+ "-dis": 10694,
+ "Ġhelping": 10695,
+ "Ġped": 10696,
+ "224": 10697,
+ "(se": 10698,
+ "ĠWho": 10699,
+ "alian": 10700,
+ "internal": 10701,
+ "Ġft": 10702,
+ ">().": 10703,
+ "->{": 10704,
+ "Ġmine": 10705,
+ "Ġsector": 10706,
+ "Ġgro": 10707,
+ "Ġopportunities": 10708,
+ "Ġü": 10709,
+ "Ġmp": 10710,
+ "Ġalleged": 10711,
+ "Ġdoubt": 10712,
+ "Mouse": 10713,
+ "About": 10714,
+ "_part": 10715,
+ "Ġchair": 10716,
+ "Ġstopped": 10717,
+ "161": 10718,
+ "loop": 10719,
+ "entities": 10720,
+ "Ġapps": 10721,
+ "ansion": 10722,
+ "Ġmental": 10723,
+ "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 10724,
+ "FR": 10725,
+ "Ġdefend": 10726,
+ "care": 10727,
+ "Ġideal": 10728,
+ "/api": 10729,
+ "urface": 10730,
+ "011": 10731,
+ "Ġele": 10732,
+ "ulator": 10733,
+ "ĠRights": 10734,
+ "anguages": 10735,
+ "Ġfunds": 10736,
+ "Ġadapt": 10737,
+ "Attributes": 10738,
+ "Ġdeploy": 10739,
+ "opts": 10740,
+ "Ġvalidation": 10741,
+ "Ġconcerns": 10742,
+ "uce": 10743,
+ ".num": 10744,
+ "ulture": 10745,
+ "ila": 10746,
+ "Ġcup": 10747,
+ "Ġpure": 10748,
+ ".Fore": 10749,
+ "183": 10750,
+ "ĠHashMap": 10751,
+ ".valueOf": 10752,
+ "asm": 10753,
+ "MO": 10754,
+ "Ġcs": 10755,
+ "Ġstores": 10756,
+ "Ġ************************************************************************": 10757,
+ "Ġcommunication": 10758,
+ "mem": 10759,
+ ".EventHandler": 10760,
+ ".Status": 10761,
+ "_right": 10762,
+ ".setOn": 10763,
+ "Sheet": 10764,
+ "Ġidentify": 10765,
+ "enerated": 10766,
+ "ordered": 10767,
+ "Ġ\"[": 10768,
+ "Ġswe": 10769,
+ "Condition": 10770,
+ "ĠAccording": 10771,
+ "Ġprepare": 10772,
+ "Ġrob": 10773,
+ "Pool": 10774,
+ "Ġsport": 10775,
+ "rv": 10776,
+ "ĠRouter": 10777,
+ "Ġalternative": 10778,
+ "([]": 10779,
+ "ĠChicago": 10780,
+ "ipher": 10781,
+ "ische": 10782,
+ "ĠDirector": 10783,
+ "kl": 10784,
+ "ĠWil": 10785,
+ "keys": 10786,
+ "Ġmysql": 10787,
+ "Ġwelcome": 10788,
+ "king": 10789,
+ "ĠManager": 10790,
+ "Ġcaught": 10791,
+ ")}Ċ": 10792,
+ "Score": 10793,
+ "_PR": 10794,
+ "Ġsurvey": 10795,
+ "hab": 10796,
+ "Headers": 10797,
+ "ADER": 10798,
+ "Ġdecor": 10799,
+ "Ġturns": 10800,
+ "Ġradius": 10801,
+ "errupt": 10802,
+ "Cor": 10803,
+ "Ġmel": 10804,
+ "Ġintr": 10805,
+ "(q": 10806,
+ "ĠAC": 10807,
+ "amos": 10808,
+ "MAX": 10809,
+ "ĠGrid": 10810,
+ "ĠJesus": 10811,
+ "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 10812,
+ ".DE": 10813,
+ "Ġts": 10814,
+ "Ġlinked": 10815,
+ "free": 10816,
+ "ĠQt": 10817,
+ "Ġ/**čĊ": 10818,
+ "Ġfaster": 10819,
+ "ctr": 10820,
+ "_J": 10821,
+ "DT": 10822,
+ ".Check": 10823,
+ "Ġcombination": 10824,
+ "Ġintended": 10825,
+ "-the": 10826,
+ "-type": 10827,
+ "182": 10828,
+ "ectors": 10829,
+ "ami": 10830,
+ "uting": 10831,
+ "Ġuma": 10832,
+ "XML": 10833,
+ "UCT": 10834,
+ "Ap": 10835,
+ "ĠRandom": 10836,
+ "Ġran": 10837,
+ ".sort": 10838,
+ "Ġsorted": 10839,
+ ".Un": 10840,
+ "401": 10841,
+ "_PER": 10842,
+ "itory": 10843,
+ "Ġpriority": 10844,
+ "ĠGal": 10845,
+ "ĠOld": 10846,
+ "hot": 10847,
+ "ĠDisplay": 10848,
+ "(sub": 10849,
+ "_TH": 10850,
+ "_Y": 10851,
+ "ĠCare": 10852,
+ "loading": 10853,
+ "Kind": 10854,
+ "_handle": 10855,
+ ",,": 10856,
+ "rase": 10857,
+ "_replace": 10858,
+ ".addEventListener": 10859,
+ "ĠRT": 10860,
+ "172": 10861,
+ "Ġentered": 10862,
+ "gers": 10863,
+ "Ġich": 10864,
+ "(start": 10865,
+ "205": 10866,
+ "/app": 10867,
+ "Ġbrother": 10868,
+ "Memory": 10869,
+ "Outlet": 10870,
+ "Ġutf": 10871,
+ "prec": 10872,
+ "Ġnavigation": 10873,
+ "ORK": 10874,
+ "Ġdst": 10875,
+ "Detail": 10876,
+ "Ġaudience": 10877,
+ "Ġdur": 10878,
+ "Ġcluster": 10879,
+ "unched": 10880,
+ "Ġ],": 10881,
+ "Ġcomfortable": 10882,
+ ".values": 10883,
+ "ĠTotal": 10884,
+ "Ġsnap": 10885,
+ "Ġstandards": 10886,
+ "Ġperformed": 10887,
+ "hand": 10888,
+ "(\"@": 10889,
+ "åŃ": 10890,
+ "Ġphil": 10891,
+ "ibr": 10892,
+ "trim": 10893,
+ "Ġforget": 10894,
+ "157": 10895,
+ "Ġdoctor": 10896,
+ ".TextBox": 10897,
+ "377": 10898,
+ "icons": 10899,
+ ",s": 10900,
+ "ĠOp": 10901,
+ "Sm": 10902,
+ "Stop": 10903,
+ "ĉList": 10904,
+ "ĉu": 10905,
+ "Comment": 10906,
+ "_VERSION": 10907,
+ ".Xtra": 10908,
+ "Person": 10909,
+ "rb": 10910,
+ "LOB": 10911,
+ "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĊ": 10912,
+ "ĠCentral": 10913,
+ "270": 10914,
+ "ICK": 10915,
+ "raq": 10916,
+ "Ġputting": 10917,
+ "Ġmd": 10918,
+ "ĠLove": 10919,
+ "Program": 10920,
+ "Border": 10921,
+ "oor": 10922,
+ "Ġallowing": 10923,
+ "after": 10924,
+ "Ġentries": 10925,
+ "ĠMaybe": 10926,
+ "]).": 10927,
+ "ĠShort": 10928,
+ ")\\": 10929,
+ ".now": 10930,
+ "friend": 10931,
+ "Ġprefer": 10932,
+ "ĠGPIO": 10933,
+ "osis": 10934,
+ "ĠGameObject": 10935,
+ "Ġskip": 10936,
+ "Ġcompetition": 10937,
+ "_match": 10938,
+ "lications": 10939,
+ "_CONT": 10940,
+ ".groupBox": 10941,
+ "Ġals": 10942,
+ "666": 10943,
+ "\"We": 10944,
+ "_eq": 10945,
+ "lan": 10946,
+ "_search": 10947,
+ "ĠMusic": 10948,
+ "asis": 10949,
+ "Ġbind": 10950,
+ "ĠIsland": 10951,
+ "rum": 10952,
+ "(E": 10953,
+ "Ġseat": 10954,
+ "Video": 10955,
+ "Ġack": 10956,
+ "reek": 10957,
+ "={()": 10958,
+ "Ġrating": 10959,
+ "Ġrestaurant": 10960,
+ "456": 10961,
+ "DEX": 10962,
+ "(buf": 10963,
+ "pping": 10964,
+ "uality": 10965,
+ "Ġleague": 10966,
+ "176": 10967,
+ "Ġfocused": 10968,
+ "apon": 10969,
+ "$data": 10970,
+ "CLUD": 10971,
+ "CLUDING": 10972,
+ "Ġabsolute": 10973,
+ "(query": 10974,
+ "Ġtells": 10975,
+ "Ang": 10976,
+ "Ġcommunities": 10977,
+ "Ġhonest": 10978,
+ "oking": 10979,
+ "Ġapart": 10980,
+ "arity": 10981,
+ "/$": 10982,
+ "_module": 10983,
+ "ĠEnc": 10984,
+ ".an": 10985,
+ ".Config": 10986,
+ "Cre": 10987,
+ "Ġshock": 10988,
+ "ĠArab": 10989,
+ "IENT": 10990,
+ "/re": 10991,
+ "Ġretrie": 10992,
+ "ycler": 10993,
+ "isa": 10994,
+ "ĠOrgan": 10995,
+ ".graph": 10996,
+ "Ġí": 10997,
+ "ĠBAS": 10998,
+ "Enum": 10999,
+ "Ġpossibly": 11000,
+ "ÑĢаÐ": 11001,
+ "ĠJapanese": 11002,
+ "Ġcraft": 11003,
+ "ĠPlace": 11004,
+ "Ġtalent": 11005,
+ "Ġfunding": 11006,
+ "Ġconfirmed": 11007,
+ "Ġcycle": 11008,
+ "/x": 11009,
+ "GE": 11010,
+ "Ġhearing": 11011,
+ "Ġplants": 11012,
+ "Ġmouth": 11013,
+ "pages": 11014,
+ "oria": 11015,
+ "ĠRemove": 11016,
+ "_total": 11017,
+ "Ġod": 11018,
+ "ollapse": 11019,
+ "door": 11020,
+ "Ġbought": 11021,
+ "Ġaddr": 11022,
+ "ARCH": 11023,
+ "_dim": 11024,
+ "dden": 11025,
+ "Ġdecades": 11026,
+ "REQUEST": 11027,
+ "Ġversions": 11028,
+ "fire": 11029,
+ "006": 11030,
+ "Ġmoves": 11031,
+ "fb": 11032,
+ "Ġcoffee": 11033,
+ ".connect": 11034,
+ "ĠRow": 11035,
+ "Ġschema": 11036,
+ "Scope": 11037,
+ "-Type": 11038,
+ "Ġfighting": 11039,
+ "Ġretail": 11040,
+ "Ġmodified": 11041,
+ "TF": 11042,
+ "Files": 11043,
+ "nie": 11044,
+ "_command": 11045,
+ "stone": 11046,
+ "ĠÑĤ": 11047,
+ "_thread": 11048,
+ "Ġbond": 11049,
+ "ĠDevelopment": 11050,
+ "Ġpt": 11051,
+ "FORM": 11052,
+ "plet": 11053,
+ "Ġidentified": 11054,
+ "cpp": 11055,
+ "206": 11056,
+ "225": 11057,
+ "Ġcoding": 11058,
+ "oked": 11059,
+ "ĠMaster": 11060,
+ "IDTH": 11061,
+ "Ġresidents": 11062,
+ "redit": 11063,
+ "ĠPhoto": 11064,
+ "=-": 11065,
+ "unte": 11066,
+ "ateur": 11067,
+ "159": 11068,
+ "_STATE": 11069,
+ "ĠSing": 11070,
+ "Ġsheet": 11071,
+ ".val": 11072,
+ "orse": 11073,
+ "Ġhers": 11074,
+ "Ġdetermined": 11075,
+ "Common": 11076,
+ "Ġwed": 11077,
+ "_queue": 11078,
+ "PH": 11079,
+ "ĠAtl": 11080,
+ "cred": 11081,
+ "/LICENSE": 11082,
+ "Ġmes": 11083,
+ "Ġadvanced": 11084,
+ ".java": 11085,
+ ".Sh": 11086,
+ "Go": 11087,
+ "kill": 11088,
+ "fp": 11089,
+ "_settings": 11090,
+ "Ġpal": 11091,
+ "Ġtruck": 11092,
+ "Ġcombined": 11093,
+ "Ġ\"${": 11094,
+ "ĠCorpor": 11095,
+ "Ġjoined": 11096,
+ "ĠJose": 11097,
+ "ĠCup": 11098,
+ "uns": 11099,
+ "estival": 11100,
+ "levision": 11101,
+ "Ġbroken": 11102,
+ "Ġmarriage": 11103,
+ "ĠWestern": 11104,
+ "Ġrepresents": 11105,
+ "ĠTitle": 11106,
+ "Ġss": 11107,
+ ".Ass": 11108,
+ "ongoose": 11109,
+ "iento": 11110,
+ "<>();Ċ": 11111,
+ "Ġabsolutely": 11112,
+ "Ġsmooth": 11113,
+ "TERN": 11114,
+ "ĠUnless": 11115,
+ "Word": 11116,
+ "Ġmerge": 11117,
+ "igan": 11118,
+ "ĠVol": 11119,
+ "Ġnn": 11120,
+ ".getId": 11121,
+ "Ġз": 11122,
+ "171": 11123,
+ "Ġsexy": 11124,
+ "Ġseeking": 11125,
+ "Single": 11126,
+ ".this": 11127,
+ "179": 11128,
+ "Ġkom": 11129,
+ "bound": 11130,
+ ";\"": 11131,
+ "ĠfontSize": 11132,
+ "_df": 11133,
+ "Ġinjury": 11134,
+ "(H": 11135,
+ "Ġissued": 11136,
+ "_END": 11137,
+ ":self": 11138,
+ "020": 11139,
+ "Ġpatch": 11140,
+ "Ġleaves": 11141,
+ "Ġadopt": 11142,
+ "FileName": 11143,
+ "ãĢIJ": 11144,
+ "Ġexecutive": 11145,
+ "ĠByte": 11146,
+ "]))Ċ": 11147,
+ "Ġnu": 11148,
+ "outing": 11149,
+ "cluding": 11150,
+ "-R": 11151,
+ ".options": 11152,
+ "Ġsubstant": 11153,
+ "avax": 11154,
+ "ĠBUT": 11155,
+ "Ġtechnical": 11156,
+ "Ġtwice": 11157,
+ "Ġmás": 11158,
+ "Ġunivers": 11159,
+ "yr": 11160,
+ "Ġdrag": 11161,
+ "ĠDC": 11162,
+ "Ġsed": 11163,
+ "Ġbot": 11164,
+ "ĠPal": 11165,
+ "ĠHall": 11166,
+ "forcement": 11167,
+ "Ġauch": 11168,
+ ".mod": 11169,
+ "notation": 11170,
+ "_files": 11171,
+ ".line": 11172,
+ "_flag": 11173,
+ "[name": 11174,
+ "Ġresolution": 11175,
+ "Ġbott": 11176,
+ "(\"[": 11177,
+ "ende": 11178,
+ "(arr": 11179,
+ "Free": 11180,
+ "(@\"": 11181,
+ "ĠDistrict": 11182,
+ "PEC": 11183,
+ ":-": 11184,
+ "Picker": 11185,
+ "ĠJo": 11186,
+ "ĠĠĠĠĠĊ": 11187,
+ "ĠRiver": 11188,
+ "_rows": 11189,
+ "Ġhelpful": 11190,
+ "Ġmassive": 11191,
+ "---Ċ": 11192,
+ "Ġmeasures": 11193,
+ "007": 11194,
+ "ĠRuntime": 11195,
+ "Ġworry": 11196,
+ "ĠSpec": 11197,
+ "ĉD": 11198,
+ "ãĢij": 11199,
+ "Ġ){Ċ": 11200,
+ "Ġworse": 11201,
+ "(filename": 11202,
+ "Ġlay": 11203,
+ "Ġmagic": 11204,
+ "ĠTheir": 11205,
+ "oul": 11206,
+ "stroy": 11207,
+ "ĠWhere": 11208,
+ "280": 11209,
+ "Ġsudden": 11210,
+ "Ġdefe": 11211,
+ "Ġbinding": 11212,
+ "Ġflight": 11213,
+ "ĠOnInit": 11214,
+ "ĠWomen": 11215,
+ "ĠPolicy": 11216,
+ "Ġdrugs": 11217,
+ "ishing": 11218,
+ "('../": 11219,
+ "ĠMel": 11220,
+ "peat": 11221,
+ "tor": 11222,
+ "Ġproposed": 11223,
+ "Ġstated": 11224,
+ "_RES": 11225,
+ "Ġeast": 11226,
+ "212": 11227,
+ "ĠCONDITION": 11228,
+ "_desc": 11229,
+ "Ġwinning": 11230,
+ "folio": 11231,
+ "Mapper": 11232,
+ "ĠPan": 11233,
+ "ĠAnge": 11234,
+ ".servlet": 11235,
+ "Ġcopies": 11236,
+ "LM": 11237,
+ "Ġvm": 11238,
+ "åį": 11239,
+ "Ġdictionary": 11240,
+ "Seg": 11241,
+ "177": 11242,
+ "elines": 11243,
+ "ĠSend": 11244,
+ "Ġiron": 11245,
+ "ĠFort": 11246,
+ "166": 11247,
+ ".domain": 11248,
+ "Ġdebate": 11249,
+ "NotNull": 11250,
+ "eq": 11251,
+ "acher": 11252,
+ "lf": 11253,
+ "ĉfmt": 11254,
+ "Ġlawy": 11255,
+ "178": 11256,
+ "ÄŁ": 11257,
+ "ĠMen": 11258,
+ "Ġtrim": 11259,
+ "(NULL": 11260,
+ "Ġ!!": 11261,
+ "Ġpad": 11262,
+ "Ġfollows": 11263,
+ "\"][\"": 11264,
+ "requ": 11265,
+ "ĠEp": 11266,
+ ".github": 11267,
+ "(img": 11268,
+ "eto": 11269,
+ "('\\": 11270,
+ "Services": 11271,
+ "umbnail": 11272,
+ "_main": 11273,
+ "pleted": 11274,
+ "fortunately": 11275,
+ "Ġwindows": 11276,
+ "Ġplane": 11277,
+ "ĠConnection": 11278,
+ ".local": 11279,
+ "uard": 11280,
+ "}\\": 11281,
+ "==\"": 11282,
+ "andon": 11283,
+ "ĠRoy": 11284,
+ "west": 11285,
+ "158": 11286,
+ "iginal": 11287,
+ "emies": 11288,
+ "itz": 11289,
+ "'):Ċ": 11290,
+ "ĠPeter": 11291,
+ "Ġtough": 11292,
+ "Ġreduced": 11293,
+ "Ġcalculate": 11294,
+ "Ġrapid": 11295,
+ "customer": 11296,
+ "Ġefficient": 11297,
+ "Ġmedium": 11298,
+ "Ġfell": 11299,
+ ".ref": 11300,
+ "ĠCas": 11301,
+ "Ġfeedback": 11302,
+ "Speed": 11303,
+ "(output": 11304,
+ "aje": 11305,
+ "Ġcategories": 11306,
+ "Ġfee": 11307,
+ "};": 11308,
+ "Ġdeleted": 11309,
+ "reh": 11310,
+ "Ġproof": 11311,
+ "Desc": 11312,
+ "Build": 11313,
+ "Ġsides": 11314,
+ ".ArrayList": 11315,
+ "-%": 11316,
+ "ĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠĠ": 11317,
+ "ر": 11318,
+ ".match": 11319,
+ "ли": 11320,
+ "Ġfeels": 11321,
+ "Ġachieve": 11322,
+ "Ġclim": 11323,
+ "_ON": 11324,
+ "ĠCD": 11325,
+ "Ġteacher": 11326,
+ "_current": 11327,
+ "bn": 11328,
+ "_PL": 11329,
+ "isting": 11330,
+ "Enable": 11331,
+ "GEN": 11332,
+ "Ġtv": 11333,
+ "Ġsock": 11334,
+ "Ġplays": 11335,
+ "Ġdiscount": 11336,
+ "ĠKE": 11337,
+ "ĠDebug": 11338,
+ "Fore": 11339,
+ "ĠIraq": 11340,
+ "Ġappearance": 11341,
+ "Mon": 11342,
+ "Ġstyled": 11343,
+ "ĠHuman": 11344,
+ "iot": 11345,
+ "ĠHistory": 11346,
+ "Ġsac": 11347,
+ "ĠCollection": 11348,
+ "Ġrecommended": 11349,
+ ".Selected": 11350,
+ "Ġorganizations": 11351,
+ "Ġdiscovered": 11352,
+ "cohol": 11353,
+ "adas": 11354,
+ "ĠThomas": 11355,
+ "May": 11356,
+ "Ġconserv": 11357,
+ "Ġdomin": 11358,
+ "ĠFollow": 11359,
+ "ĠSection": 11360,
+ "ĠThanks": 11361,
+ "Username": 11362,
+ "Ġrecipe": 11363,
+ "Ġwonderful": 11364,
+ ".sleep": 11365,
+ "_if": 11366,
+ "ĉĊĉĊ": 11367,
+ "orno": 11368,
+ "Ġru": 11369,
+ "_target": 11370,
+ ".\"\"": 11371,
+ "à¦": 11372,
+ "EventArgs": 11373,
+ "Ġinputs": 11374,
+ "Ġfif": 11375,
+ "Ġvision": 11376,
+ "cy": 11377,
+ "ĠSeries": 11378,
+ ")(((": 11379,
+ "Ġtrading": 11380,
+ "Ġmarker": 11381,
+ "Begin": 11382,
+ "Ġtypically": 11383,
+ "Ġcauses": 11384,
+ "dropdown": 11385,
+ "_DEBUG": 11386,
+ "260": 11387,
+ "Ġdetect": 11388,
+ "country": 11389,
+ "!\");Ċ": 11390,
+ "ĉR": 11391,
+ "appy": 11392,
+ "Ġcref": 11393,
+ "('<": 11394,
+ "\"=>": 11395,
+ "ĠLE": 11396,
+ "reader": 11397,
+ "Ġadministr": 11398,
+ "õ": 11399,
+ "ucket": 11400,
+ "Ġfashion": 11401,
+ ".char": 11402,
+ "izar": 11403,
+ "Ġdisable": 11404,
+ "Ġsuc": 11405,
+ "ĠLive": 11406,
+ "issue": 11407,
+ "Ġmetadata": 11408,
+ "flags": 11409,
+ "ĠðŁ": 11410,
+ "Ġcommitted": 11411,
+ "Ġva": 11412,
+ "Ġrough": 11413,
+ "Ġ'''Ċ": 11414,
+ "Ġhighlight": 11415,
+ "_vars": 11416,
+ "VO": 11417,
+ "Ġencoding": 11418,
+ "-Z": 11419,
+ "_sign": 11420,
+ "$(\"#": 11421,
+ "Ġrain": 11422,
+ "reatest": 11423,
+ "ĠEND": 11424,
+ "Selection": 11425,
+ "Ġcandidates": 11426,
+ "Ġsav": 11427,
+ ".Empty": 11428,
+ "Ġdecisions": 11429,
+ "Ġcollabor": 11430,
+ "ridge": 11431,
+ "feed": 11432,
+ "ression": 11433,
+ "Ġpersons": 11434,
+ "VM": 11435,
+ "008": 11436,
+ "ega": 11437,
+ "_BIT": 11438,
+ "According": 11439,
+ "acked": 11440,
+ "Ġdollars": 11441,
+ "_loss": 11442,
+ "ĠCost": 11443,
+ "}\"Ċ": 11444,
+ "Notification": 11445,
+ "Ġprostit": 11446,
+ "Ġauthority": 11447,
+ ".rec": 11448,
+ "Ġspokes": 11449,
+ "ĠToday": 11450,
+ "istant": 11451,
+ "ĠHead": 11452,
+ "âĢĿ.": 11453,
+ "ertainment": 11454,
+ "cean": 11455,
+ "culate": 11456,
+ "Ġven": 11457,
+ "However": 11458,
+ "_arr": 11459,
+ "Ġtokens": 11460,
+ "Graph": 11461,
+ "ĠJud": 11462,
+ "ĠVirgin": 11463,
+ "ĠSerial": 11464,
+ "unning": 11465,
+ "Mutable": 11466,
+ "agers": 11467,
+ ".csv": 11468,
+ "Ġdeveloping": 11469,
+ "Ġinstructions": 11470,
+ "Ġpromise": 11471,
+ "Ġrequested": 11472,
+ "_encode": 11473,
+ "/\"": 11474,
+ "ĠIcon": 11475,
+ "uilt": 11476,
+ "-day": 11477,
+ "Ġintelligence": 11478,
+ ".IS": 11479,
+ "ĠObservable": 11480,
+ "ĠHard": 11481,
+ "Bool": 11482,
+ "211": 11483,
+ "idential": 11484,
+ ".Anchor": 11485,
+ "Ġselling": 11486,
+ "CI": 11487,
+ "AGES": 11488,
+ "tle": 11489,
+ "bur": 11490,
+ "UFFER": 11491,
+ "RY": 11492,
+ "Ġbigger": 11493,
+ "Ġrat": 11494,
+ "Ġfamous": 11495,
+ "Ġtypename": 11496,
+ "Ġexplained": 11497,
+ "}}Ċ": 11498,
+ "Ġnuclear": 11499,
+ "-N": 11500,
+ "Ġcrisis": 11501,
+ "ĠEnter": 11502,
+ "Ġanswers": 11503,
+ "/${": 11504,
+ "/pl": 11505,
+ "Ġsequ": 11506,
+ "_next": 11507,
+ "mask": 11508,
+ "Ġstanding": 11509,
+ "Ġplenty": 11510,
+ "ĠCross": 11511,
+ "ĉret": 11512,
+ "dro": 11513,
+ "ĠCast": 11514,
+ "167": 11515,
+ "=true": 11516,
+ "ĠChris": 11517,
+ "icio": 11518,
+ "ĠMike": 11519,
+ "Decimal": 11520,
+ "addComponent": 11521,
+ "Len": 11522,
+ "Ġcock": 11523,
+ "Ġ#{": 11524,
+ "URN": 11525,
+ "": 11657,
+ "Ġ*=": 11658,
+ "ĠPS": 11659,
+ "Ġdangerous": 11660,
+ "[p": 11661,
+ "OME": 11662,
+ "Other": 11663,
+ "ĠStringBuilder": 11664,
+ "Points": 11665,
+ "heading": 11666,
+ "Ġcurrency": 11667,
+ "Ġpercentage": 11668,
+ "_API": 11669,
+ "Ġclassic": 11670,
+ "thead": 11671,
+ "ĠMO": 11672,
+ "FE": 11673,
+ "Idx": 11674,
+ "await": 11675,
+ "Ġè": 11676,
+ "Ġaccident": 11677,
+ "Ġvariant": 11678,
+ "Ġmyst": 11679,
+ "ĠLand": 11680,
+ "ĠBre": 11681,
+ "Ġharm": 11682,
+ "ĠAcc": 11683,
+ "Ġcharged": 11684,
+ "iones": 11685,
+ "Visibility": 11686,
+ "arry": 11687,
+ "ĠLanguage": 11688,
+ "Ġwalking": 11689,
+ "\".ĊĊ": 11690,
+ "ifer": 11691,
+ "Ġleadership": 11692,
+ ".From": 11693,
+ "ynam": 11694,
+ "Ġtimestamp": 11695,
+ "ipt": 11696,
+ "ĠHas": 11697,
+ "REFER": 11698,
+ "ĠIts": 11699,
+ "Ġlistener": 11700,
+ "UTE": 11701,
+ "213": 11702,
+ "_description": 11703,
+ "Ġexperiences": 11704,
+ "Ġcreates": 11705,
+ "RS": 11706,
+ "cart": 11707,
+ "black": 11708,
+ "Ġchoices": 11709,
+ "war": 11710,
+ "750": 11711,
+ "Ġ'''": 11712,
+ "Ġordered": 11713,
+ "Ġevening": 11714,
+ "Ġpil": 11715,
+ "Ġtun": 11716,
+ "ĠBad": 11717,
+ "(app": 11718,
+ "random": 11719,
+ "Ġexplicit": 11720,
+ "Ġarrived": 11721,
+ "Ġfly": 11722,
+ "Ġeconom": 11723,
+ "-mail": 11724,
+ "Ġlists": 11725,
+ "Ġarchitect": 11726,
+ "234": 11727,
+ "ĠPay": 11728,
+ "Ġds": 11729,
+ "ĠSol": 11730,
+ "Ġvehicles": 11731,
+ "Hz": 11732,
+ "-com": 11733,
+ "Ġking": 11734,
+ "_equal": 11735,
+ "ĠHelp": 11736,
+ "Ġabuse": 11737,
+ "480": 11738,
+ "169": 11739,
+ "--;Ċ": 11740,
+ "Ġextr": 11741,
+ "Ġchemical": 11742,
+ "ä¿": 11743,
+ "Ġorient": 11744,
+ "Ġbreath": 11745,
+ "ĠSpace": 11746,
+ "(element": 11747,
+ "wait": 11748,
+ "DED": 11749,
+ "igma": 11750,
+ "Ġentr": 11751,
+ "Ġsob": 11752,
+ "-name": 11753,
+ "Ġaffected": 11754,
+ "ika": 11755,
+ "Ġcoal": 11756,
+ "_work": 11757,
+ "Ġhundreds": 11758,
+ "Ġpolitics": 11759,
+ "subject": 11760,
+ "Ġconsumer": 11761,
+ "ANGE": 11762,
+ "Ġrepeated": 11763,
+ "Send": 11764,
+ "Ġ#[": 11765,
+ "Ġprotocol": 11766,
+ "Ġleads": 11767,
+ "useum": 11768,
+ "Every": 11769,
+ "808": 11770,
+ "174": 11771,
+ "Import": 11772,
+ "(count": 11773,
+ "Ġchallenges": 11774,
+ "Ġnovel": 11775,
+ "Ġdepart": 11776,
+ "bits": 11777,
+ ".Current": 11778,
+ "Ġ`${": 11779,
+ "oting": 11780,
+ "(\\": 11781,
+ "Ġcreative": 11782,
+ "Ġbuff": 11783,
+ "Ġintroduced": 11784,
+ "usic": 11785,
+ "modules": 11786,
+ "Are": 11787,
+ "-doc": 11788,
+ "language": 11789,
+ "_cache": 11790,
+ "Ġtod": 11791,
+ "?>": 11792,
+ "omething": 11793,
+ "Ġhun": 11794,
+ "åº": 11795,
+ "aters": 11796,
+ "Intent": 11797,
+ "Ġimplemented": 11798,
+ "ĠCase": 11799,
+ "Children": 11800,
+ "Ġnotification": 11801,
+ "Renderer": 11802,
+ "Wrapper": 11803,
+ "Objects": 11804,
+ "tl": 11805,
+ ".Contains": 11806,
+ "Plugin": 11807,
+ ".row": 11808,
+ "Ġforg": 11809,
+ "Ġpermit": 11810,
+ "Ġtargets": 11811,
+ "ĠIF": 11812,
+ "Ġtip": 11813,
+ "sex": 11814,
+ "Ġsupports": 11815,
+ "Ġfold": 11816,
+ "photo": 11817,
+ "},čĊ": 11818,
+ "Ġgoogle": 11819,
+ "$('#": 11820,
+ "Ġsharing": 11821,
+ "Ġgoods": 11822,
+ "vs": 11823,
+ "ĠDan": 11824,
+ "Rate": 11825,
+ "ĠMartin": 11826,
+ "Ġmanner": 11827,
+ "lie": 11828,
+ ".The": 11829,
+ "Internal": 11830,
+ "ĠCONTR": 11831,
+ "Mock": 11832,
+ "RIGHT": 11833,
+ "Ġ'{": 11834,
+ "Ġcontrols": 11835,
+ "Mat": 11836,
+ "Ġmand": 11837,
+ "Ġextended": 11838,
+ "Ok": 11839,
+ "Ġembed": 11840,
+ "Ġplanet": 11841,
+ "ĠNon": 11842,
+ "-ch": 11843,
+ ")\",": 11844,
+ "epar": 11845,
+ "Ġbelieved": 11846,
+ "ĠEnvironment": 11847,
+ "ĠFriend": 11848,
+ "-res": 11849,
+ "Ġhandling": 11850,
+ "nic": 11851,
+ "-level": 11852,
+ "scri": 11853,
+ "Xml": 11854,
+ "BE": 11855,
+ "ungen": 11856,
+ "Ġalter": 11857,
+ "[idx": 11858,
+ "Pop": 11859,
+ "cam": 11860,
+ "Ġ(((": 11861,
+ "Ġshipping": 11862,
+ "Ġbattery": 11863,
+ "iddleware": 11864,
+ "MC": 11865,
+ "Ġimpl": 11866,
+ "otation": 11867,
+ "ĠLab": 11868,
+ "