Instructions to use ToluClassics/gtr-base with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- Transformers
How to use ToluClassics/gtr-base with Transformers:
```python
# Load model directly
from transformers import AutoTokenizer, AutoModel

tokenizer = AutoTokenizer.from_pretrained("ToluClassics/gtr-base")
model = AutoModel.from_pretrained("ToluClassics/gtr-base")
```
- Notebooks
- Google Colab
- Kaggle
| { | |
| "best_metric": null, | |
| "best_model_checkpoint": null, | |
| "epoch": 19.169274992015332, | |
| "global_step": 30000, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 0.01, | |
| "learning_rate": 6.389776357827476e-07, | |
| "loss": 11.1023, | |
| "step": 10 | |
| }, | |
| { | |
| "epoch": 0.01, | |
| "learning_rate": 1.2779552715654952e-06, | |
| "loss": 11.0812, | |
| "step": 20 | |
| }, | |
| { | |
| "epoch": 0.02, | |
| "learning_rate": 1.916932907348243e-06, | |
| "loss": 11.1009, | |
| "step": 30 | |
| }, | |
| { | |
| "epoch": 0.03, | |
| "learning_rate": 2.5559105431309904e-06, | |
| "loss": 11.1185, | |
| "step": 40 | |
| }, | |
| { | |
| "epoch": 0.03, | |
| "learning_rate": 3.194888178913738e-06, | |
| "loss": 11.0872, | |
| "step": 50 | |
| }, | |
| { | |
| "epoch": 0.04, | |
| "learning_rate": 3.833865814696486e-06, | |
| "loss": 11.0512, | |
| "step": 60 | |
| }, | |
| { | |
| "epoch": 0.04, | |
| "learning_rate": 4.472843450479234e-06, | |
| "loss": 11.0023, | |
| "step": 70 | |
| }, | |
| { | |
| "epoch": 0.05, | |
| "learning_rate": 5.111821086261981e-06, | |
| "loss": 10.9751, | |
| "step": 80 | |
| }, | |
| { | |
| "epoch": 0.06, | |
| "learning_rate": 5.750798722044729e-06, | |
| "loss": 10.9535, | |
| "step": 90 | |
| }, | |
| { | |
| "epoch": 0.06, | |
| "learning_rate": 6.389776357827476e-06, | |
| "loss": 10.9472, | |
| "step": 100 | |
| }, | |
| { | |
| "epoch": 0.07, | |
| "learning_rate": 7.028753993610224e-06, | |
| "loss": 10.922, | |
| "step": 110 | |
| }, | |
| { | |
| "epoch": 0.08, | |
| "learning_rate": 7.667731629392972e-06, | |
| "loss": 10.8773, | |
| "step": 120 | |
| }, | |
| { | |
| "epoch": 0.08, | |
| "learning_rate": 8.306709265175718e-06, | |
| "loss": 10.8485, | |
| "step": 130 | |
| }, | |
| { | |
| "epoch": 0.09, | |
| "learning_rate": 8.945686900958468e-06, | |
| "loss": 10.7794, | |
| "step": 140 | |
| }, | |
| { | |
| "epoch": 0.1, | |
| "learning_rate": 9.584664536741214e-06, | |
| "loss": 10.7876, | |
| "step": 150 | |
| }, | |
| { | |
| "epoch": 0.1, | |
| "learning_rate": 1.0223642172523962e-05, | |
| "loss": 10.7846, | |
| "step": 160 | |
| }, | |
| { | |
| "epoch": 0.11, | |
| "learning_rate": 1.0862619808306708e-05, | |
| "loss": 10.7546, | |
| "step": 170 | |
| }, | |
| { | |
| "epoch": 0.11, | |
| "learning_rate": 1.1501597444089457e-05, | |
| "loss": 10.6649, | |
| "step": 180 | |
| }, | |
| { | |
| "epoch": 0.12, | |
| "learning_rate": 1.2140575079872205e-05, | |
| "loss": 10.6765, | |
| "step": 190 | |
| }, | |
| { | |
| "epoch": 0.13, | |
| "learning_rate": 1.2779552715654951e-05, | |
| "loss": 10.6211, | |
| "step": 200 | |
| }, | |
| { | |
| "epoch": 0.13, | |
| "learning_rate": 1.3418530351437701e-05, | |
| "loss": 10.6008, | |
| "step": 210 | |
| }, | |
| { | |
| "epoch": 0.14, | |
| "learning_rate": 1.4057507987220449e-05, | |
| "loss": 10.5362, | |
| "step": 220 | |
| }, | |
| { | |
| "epoch": 0.15, | |
| "learning_rate": 1.4696485623003195e-05, | |
| "loss": 10.4825, | |
| "step": 230 | |
| }, | |
| { | |
| "epoch": 0.15, | |
| "learning_rate": 1.5335463258785944e-05, | |
| "loss": 10.449, | |
| "step": 240 | |
| }, | |
| { | |
| "epoch": 0.16, | |
| "learning_rate": 1.597444089456869e-05, | |
| "loss": 10.3695, | |
| "step": 250 | |
| }, | |
| { | |
| "epoch": 0.17, | |
| "learning_rate": 1.6613418530351437e-05, | |
| "loss": 10.3128, | |
| "step": 260 | |
| }, | |
| { | |
| "epoch": 0.17, | |
| "learning_rate": 1.7252396166134186e-05, | |
| "loss": 10.221, | |
| "step": 270 | |
| }, | |
| { | |
| "epoch": 0.18, | |
| "learning_rate": 1.7891373801916936e-05, | |
| "loss": 10.1125, | |
| "step": 280 | |
| }, | |
| { | |
| "epoch": 0.19, | |
| "learning_rate": 1.853035143769968e-05, | |
| "loss": 9.9933, | |
| "step": 290 | |
| }, | |
| { | |
| "epoch": 0.19, | |
| "learning_rate": 1.9169329073482428e-05, | |
| "loss": 9.7903, | |
| "step": 300 | |
| }, | |
| { | |
| "epoch": 0.2, | |
| "learning_rate": 1.9808306709265177e-05, | |
| "loss": 9.5898, | |
| "step": 310 | |
| }, | |
| { | |
| "epoch": 0.2, | |
| "learning_rate": 2.0447284345047924e-05, | |
| "loss": 9.4338, | |
| "step": 320 | |
| }, | |
| { | |
| "epoch": 0.21, | |
| "learning_rate": 2.1086261980830673e-05, | |
| "loss": 9.2167, | |
| "step": 330 | |
| }, | |
| { | |
| "epoch": 0.22, | |
| "learning_rate": 2.1725239616613416e-05, | |
| "loss": 8.9299, | |
| "step": 340 | |
| }, | |
| { | |
| "epoch": 0.22, | |
| "learning_rate": 2.2364217252396165e-05, | |
| "loss": 8.5451, | |
| "step": 350 | |
| }, | |
| { | |
| "epoch": 0.23, | |
| "learning_rate": 2.3003194888178915e-05, | |
| "loss": 8.377, | |
| "step": 360 | |
| }, | |
| { | |
| "epoch": 0.24, | |
| "learning_rate": 2.364217252396166e-05, | |
| "loss": 8.1605, | |
| "step": 370 | |
| }, | |
| { | |
| "epoch": 0.24, | |
| "learning_rate": 2.428115015974441e-05, | |
| "loss": 7.8136, | |
| "step": 380 | |
| }, | |
| { | |
| "epoch": 0.25, | |
| "learning_rate": 2.4920127795527157e-05, | |
| "loss": 7.4985, | |
| "step": 390 | |
| }, | |
| { | |
| "epoch": 0.26, | |
| "learning_rate": 2.5559105431309903e-05, | |
| "loss": 7.1695, | |
| "step": 400 | |
| }, | |
| { | |
| "epoch": 0.26, | |
| "learning_rate": 2.6198083067092652e-05, | |
| "loss": 6.9816, | |
| "step": 410 | |
| }, | |
| { | |
| "epoch": 0.27, | |
| "learning_rate": 2.6837060702875402e-05, | |
| "loss": 6.4929, | |
| "step": 420 | |
| }, | |
| { | |
| "epoch": 0.27, | |
| "learning_rate": 2.7476038338658148e-05, | |
| "loss": 6.3582, | |
| "step": 430 | |
| }, | |
| { | |
| "epoch": 0.28, | |
| "learning_rate": 2.8115015974440897e-05, | |
| "loss": 6.1947, | |
| "step": 440 | |
| }, | |
| { | |
| "epoch": 0.29, | |
| "learning_rate": 2.875399361022364e-05, | |
| "loss": 5.8765, | |
| "step": 450 | |
| }, | |
| { | |
| "epoch": 0.29, | |
| "learning_rate": 2.939297124600639e-05, | |
| "loss": 5.6917, | |
| "step": 460 | |
| }, | |
| { | |
| "epoch": 0.3, | |
| "learning_rate": 3.003194888178914e-05, | |
| "loss": 5.5349, | |
| "step": 470 | |
| }, | |
| { | |
| "epoch": 0.31, | |
| "learning_rate": 3.067092651757189e-05, | |
| "loss": 5.4405, | |
| "step": 480 | |
| }, | |
| { | |
| "epoch": 0.31, | |
| "learning_rate": 3.130990415335463e-05, | |
| "loss": 5.2719, | |
| "step": 490 | |
| }, | |
| { | |
| "epoch": 0.32, | |
| "learning_rate": 3.194888178913738e-05, | |
| "loss": 4.8337, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 0.33, | |
| "learning_rate": 3.258785942492013e-05, | |
| "loss": 4.8143, | |
| "step": 510 | |
| }, | |
| { | |
| "epoch": 0.33, | |
| "learning_rate": 3.322683706070287e-05, | |
| "loss": 4.5746, | |
| "step": 520 | |
| }, | |
| { | |
| "epoch": 0.34, | |
| "learning_rate": 3.386581469648562e-05, | |
| "loss": 4.348, | |
| "step": 530 | |
| }, | |
| { | |
| "epoch": 0.34, | |
| "learning_rate": 3.450479233226837e-05, | |
| "loss": 4.1607, | |
| "step": 540 | |
| }, | |
| { | |
| "epoch": 0.35, | |
| "learning_rate": 3.5143769968051115e-05, | |
| "loss": 4.0622, | |
| "step": 550 | |
| }, | |
| { | |
| "epoch": 0.36, | |
| "learning_rate": 3.578274760383387e-05, | |
| "loss": 3.9419, | |
| "step": 560 | |
| }, | |
| { | |
| "epoch": 0.36, | |
| "learning_rate": 3.6421725239616614e-05, | |
| "loss": 3.8112, | |
| "step": 570 | |
| }, | |
| { | |
| "epoch": 0.37, | |
| "learning_rate": 3.706070287539936e-05, | |
| "loss": 3.6399, | |
| "step": 580 | |
| }, | |
| { | |
| "epoch": 0.38, | |
| "learning_rate": 3.769968051118211e-05, | |
| "loss": 3.5703, | |
| "step": 590 | |
| }, | |
| { | |
| "epoch": 0.38, | |
| "learning_rate": 3.8338658146964856e-05, | |
| "loss": 3.4017, | |
| "step": 600 | |
| }, | |
| { | |
| "epoch": 0.39, | |
| "learning_rate": 3.8977635782747605e-05, | |
| "loss": 3.2633, | |
| "step": 610 | |
| }, | |
| { | |
| "epoch": 0.4, | |
| "learning_rate": 3.9616613418530355e-05, | |
| "loss": 3.0287, | |
| "step": 620 | |
| }, | |
| { | |
| "epoch": 0.4, | |
| "learning_rate": 4.02555910543131e-05, | |
| "loss": 3.0033, | |
| "step": 630 | |
| }, | |
| { | |
| "epoch": 0.41, | |
| "learning_rate": 4.089456869009585e-05, | |
| "loss": 3.0306, | |
| "step": 640 | |
| }, | |
| { | |
| "epoch": 0.42, | |
| "learning_rate": 4.15335463258786e-05, | |
| "loss": 2.8719, | |
| "step": 650 | |
| }, | |
| { | |
| "epoch": 0.42, | |
| "learning_rate": 4.2172523961661346e-05, | |
| "loss": 2.6886, | |
| "step": 660 | |
| }, | |
| { | |
| "epoch": 0.43, | |
| "learning_rate": 4.281150159744409e-05, | |
| "loss": 2.5607, | |
| "step": 670 | |
| }, | |
| { | |
| "epoch": 0.43, | |
| "learning_rate": 4.345047923322683e-05, | |
| "loss": 2.4779, | |
| "step": 680 | |
| }, | |
| { | |
| "epoch": 0.44, | |
| "learning_rate": 4.408945686900959e-05, | |
| "loss": 2.4884, | |
| "step": 690 | |
| }, | |
| { | |
| "epoch": 0.45, | |
| "learning_rate": 4.472843450479233e-05, | |
| "loss": 2.3248, | |
| "step": 700 | |
| }, | |
| { | |
| "epoch": 0.45, | |
| "learning_rate": 4.536741214057508e-05, | |
| "loss": 2.3108, | |
| "step": 710 | |
| }, | |
| { | |
| "epoch": 0.46, | |
| "learning_rate": 4.600638977635783e-05, | |
| "loss": 2.2866, | |
| "step": 720 | |
| }, | |
| { | |
| "epoch": 0.47, | |
| "learning_rate": 4.664536741214057e-05, | |
| "loss": 2.1556, | |
| "step": 730 | |
| }, | |
| { | |
| "epoch": 0.47, | |
| "learning_rate": 4.728434504792332e-05, | |
| "loss": 2.0662, | |
| "step": 740 | |
| }, | |
| { | |
| "epoch": 0.48, | |
| "learning_rate": 4.792332268370607e-05, | |
| "loss": 2.1048, | |
| "step": 750 | |
| }, | |
| { | |
| "epoch": 0.49, | |
| "learning_rate": 4.856230031948882e-05, | |
| "loss": 1.9392, | |
| "step": 760 | |
| }, | |
| { | |
| "epoch": 0.49, | |
| "learning_rate": 4.9201277955271564e-05, | |
| "loss": 1.9819, | |
| "step": 770 | |
| }, | |
| { | |
| "epoch": 0.5, | |
| "learning_rate": 4.984025559105431e-05, | |
| "loss": 1.9099, | |
| "step": 780 | |
| }, | |
| { | |
| "epoch": 0.5, | |
| "learning_rate": 5.047923322683706e-05, | |
| "loss": 1.8879, | |
| "step": 790 | |
| }, | |
| { | |
| "epoch": 0.51, | |
| "learning_rate": 5.1118210862619806e-05, | |
| "loss": 1.8877, | |
| "step": 800 | |
| }, | |
| { | |
| "epoch": 0.52, | |
| "learning_rate": 5.175718849840256e-05, | |
| "loss": 1.8067, | |
| "step": 810 | |
| }, | |
| { | |
| "epoch": 0.52, | |
| "learning_rate": 5.2396166134185305e-05, | |
| "loss": 1.74, | |
| "step": 820 | |
| }, | |
| { | |
| "epoch": 0.53, | |
| "learning_rate": 5.3035143769968054e-05, | |
| "loss": 1.705, | |
| "step": 830 | |
| }, | |
| { | |
| "epoch": 0.54, | |
| "learning_rate": 5.3674121405750804e-05, | |
| "loss": 1.5959, | |
| "step": 840 | |
| }, | |
| { | |
| "epoch": 0.54, | |
| "learning_rate": 5.4313099041533546e-05, | |
| "loss": 1.6158, | |
| "step": 850 | |
| }, | |
| { | |
| "epoch": 0.55, | |
| "learning_rate": 5.4952076677316296e-05, | |
| "loss": 1.6574, | |
| "step": 860 | |
| }, | |
| { | |
| "epoch": 0.56, | |
| "learning_rate": 5.559105431309904e-05, | |
| "loss": 1.5606, | |
| "step": 870 | |
| }, | |
| { | |
| "epoch": 0.56, | |
| "learning_rate": 5.6230031948881795e-05, | |
| "loss": 1.5595, | |
| "step": 880 | |
| }, | |
| { | |
| "epoch": 0.57, | |
| "learning_rate": 5.686900958466454e-05, | |
| "loss": 1.6025, | |
| "step": 890 | |
| }, | |
| { | |
| "epoch": 0.57, | |
| "learning_rate": 5.750798722044728e-05, | |
| "loss": 1.6317, | |
| "step": 900 | |
| }, | |
| { | |
| "epoch": 0.58, | |
| "learning_rate": 5.814696485623004e-05, | |
| "loss": 1.4737, | |
| "step": 910 | |
| }, | |
| { | |
| "epoch": 0.59, | |
| "learning_rate": 5.878594249201278e-05, | |
| "loss": 1.5243, | |
| "step": 920 | |
| }, | |
| { | |
| "epoch": 0.59, | |
| "learning_rate": 5.942492012779553e-05, | |
| "loss": 1.4923, | |
| "step": 930 | |
| }, | |
| { | |
| "epoch": 0.6, | |
| "learning_rate": 6.006389776357828e-05, | |
| "loss": 1.3972, | |
| "step": 940 | |
| }, | |
| { | |
| "epoch": 0.61, | |
| "learning_rate": 6.070287539936102e-05, | |
| "loss": 1.4433, | |
| "step": 950 | |
| }, | |
| { | |
| "epoch": 0.61, | |
| "learning_rate": 6.134185303514378e-05, | |
| "loss": 1.4677, | |
| "step": 960 | |
| }, | |
| { | |
| "epoch": 0.62, | |
| "learning_rate": 6.198083067092652e-05, | |
| "loss": 1.3918, | |
| "step": 970 | |
| }, | |
| { | |
| "epoch": 0.63, | |
| "learning_rate": 6.261980830670926e-05, | |
| "loss": 1.2902, | |
| "step": 980 | |
| }, | |
| { | |
| "epoch": 0.63, | |
| "learning_rate": 6.325878594249202e-05, | |
| "loss": 1.3005, | |
| "step": 990 | |
| }, | |
| { | |
| "epoch": 0.64, | |
| "learning_rate": 6.389776357827476e-05, | |
| "loss": 1.2544, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 0.65, | |
| "learning_rate": 6.45367412140575e-05, | |
| "loss": 1.2713, | |
| "step": 1010 | |
| }, | |
| { | |
| "epoch": 0.65, | |
| "learning_rate": 6.517571884984026e-05, | |
| "loss": 1.3027, | |
| "step": 1020 | |
| }, | |
| { | |
| "epoch": 0.66, | |
| "learning_rate": 6.5814696485623e-05, | |
| "loss": 1.2434, | |
| "step": 1030 | |
| }, | |
| { | |
| "epoch": 0.66, | |
| "learning_rate": 6.645367412140575e-05, | |
| "loss": 1.2283, | |
| "step": 1040 | |
| }, | |
| { | |
| "epoch": 0.67, | |
| "learning_rate": 6.70926517571885e-05, | |
| "loss": 1.2587, | |
| "step": 1050 | |
| }, | |
| { | |
| "epoch": 0.68, | |
| "learning_rate": 6.773162939297125e-05, | |
| "loss": 1.1828, | |
| "step": 1060 | |
| }, | |
| { | |
| "epoch": 0.68, | |
| "learning_rate": 6.8370607028754e-05, | |
| "loss": 1.1369, | |
| "step": 1070 | |
| }, | |
| { | |
| "epoch": 0.69, | |
| "learning_rate": 6.900958466453674e-05, | |
| "loss": 1.1307, | |
| "step": 1080 | |
| }, | |
| { | |
| "epoch": 0.7, | |
| "learning_rate": 6.964856230031949e-05, | |
| "loss": 1.1675, | |
| "step": 1090 | |
| }, | |
| { | |
| "epoch": 0.7, | |
| "learning_rate": 7.028753993610223e-05, | |
| "loss": 1.1872, | |
| "step": 1100 | |
| }, | |
| { | |
| "epoch": 0.71, | |
| "learning_rate": 7.092651757188499e-05, | |
| "loss": 1.1707, | |
| "step": 1110 | |
| }, | |
| { | |
| "epoch": 0.72, | |
| "learning_rate": 7.156549520766774e-05, | |
| "loss": 1.19, | |
| "step": 1120 | |
| }, | |
| { | |
| "epoch": 0.72, | |
| "learning_rate": 7.220447284345049e-05, | |
| "loss": 1.1268, | |
| "step": 1130 | |
| }, | |
| { | |
| "epoch": 0.73, | |
| "learning_rate": 7.284345047923323e-05, | |
| "loss": 1.0189, | |
| "step": 1140 | |
| }, | |
| { | |
| "epoch": 0.73, | |
| "learning_rate": 7.348242811501597e-05, | |
| "loss": 1.0764, | |
| "step": 1150 | |
| }, | |
| { | |
| "epoch": 0.74, | |
| "learning_rate": 7.412140575079871e-05, | |
| "loss": 1.073, | |
| "step": 1160 | |
| }, | |
| { | |
| "epoch": 0.75, | |
| "learning_rate": 7.476038338658147e-05, | |
| "loss": 0.9837, | |
| "step": 1170 | |
| }, | |
| { | |
| "epoch": 0.75, | |
| "learning_rate": 7.539936102236423e-05, | |
| "loss": 1.014, | |
| "step": 1180 | |
| }, | |
| { | |
| "epoch": 0.76, | |
| "learning_rate": 7.603833865814697e-05, | |
| "loss": 1.0643, | |
| "step": 1190 | |
| }, | |
| { | |
| "epoch": 0.77, | |
| "learning_rate": 7.667731629392971e-05, | |
| "loss": 1.0439, | |
| "step": 1200 | |
| }, | |
| { | |
| "epoch": 0.77, | |
| "learning_rate": 7.731629392971245e-05, | |
| "loss": 1.0419, | |
| "step": 1210 | |
| }, | |
| { | |
| "epoch": 0.78, | |
| "learning_rate": 7.795527156549521e-05, | |
| "loss": 1.01, | |
| "step": 1220 | |
| }, | |
| { | |
| "epoch": 0.79, | |
| "learning_rate": 7.859424920127795e-05, | |
| "loss": 0.9829, | |
| "step": 1230 | |
| }, | |
| { | |
| "epoch": 0.79, | |
| "learning_rate": 7.923322683706071e-05, | |
| "loss": 1.0113, | |
| "step": 1240 | |
| }, | |
| { | |
| "epoch": 0.8, | |
| "learning_rate": 7.987220447284345e-05, | |
| "loss": 0.9818, | |
| "step": 1250 | |
| }, | |
| { | |
| "epoch": 0.8, | |
| "learning_rate": 8.05111821086262e-05, | |
| "loss": 0.9299, | |
| "step": 1260 | |
| }, | |
| { | |
| "epoch": 0.81, | |
| "learning_rate": 8.115015974440895e-05, | |
| "loss": 0.9891, | |
| "step": 1270 | |
| }, | |
| { | |
| "epoch": 0.82, | |
| "learning_rate": 8.17891373801917e-05, | |
| "loss": 0.9429, | |
| "step": 1280 | |
| }, | |
| { | |
| "epoch": 0.82, | |
| "learning_rate": 8.242811501597444e-05, | |
| "loss": 0.8778, | |
| "step": 1290 | |
| }, | |
| { | |
| "epoch": 0.83, | |
| "learning_rate": 8.30670926517572e-05, | |
| "loss": 0.8918, | |
| "step": 1300 | |
| }, | |
| { | |
| "epoch": 0.84, | |
| "learning_rate": 8.370607028753994e-05, | |
| "loss": 0.8873, | |
| "step": 1310 | |
| }, | |
| { | |
| "epoch": 0.84, | |
| "learning_rate": 8.434504792332269e-05, | |
| "loss": 0.9026, | |
| "step": 1320 | |
| }, | |
| { | |
| "epoch": 0.85, | |
| "learning_rate": 8.498402555910544e-05, | |
| "loss": 0.9084, | |
| "step": 1330 | |
| }, | |
| { | |
| "epoch": 0.86, | |
| "learning_rate": 8.562300319488818e-05, | |
| "loss": 0.9513, | |
| "step": 1340 | |
| }, | |
| { | |
| "epoch": 0.86, | |
| "learning_rate": 8.626198083067092e-05, | |
| "loss": 0.8507, | |
| "step": 1350 | |
| }, | |
| { | |
| "epoch": 0.87, | |
| "learning_rate": 8.690095846645366e-05, | |
| "loss": 0.9136, | |
| "step": 1360 | |
| }, | |
| { | |
| "epoch": 0.88, | |
| "learning_rate": 8.753993610223643e-05, | |
| "loss": 0.8661, | |
| "step": 1370 | |
| }, | |
| { | |
| "epoch": 0.88, | |
| "learning_rate": 8.817891373801918e-05, | |
| "loss": 0.8559, | |
| "step": 1380 | |
| }, | |
| { | |
| "epoch": 0.89, | |
| "learning_rate": 8.881789137380192e-05, | |
| "loss": 0.8322, | |
| "step": 1390 | |
| }, | |
| { | |
| "epoch": 0.89, | |
| "learning_rate": 8.945686900958466e-05, | |
| "loss": 0.829, | |
| "step": 1400 | |
| }, | |
| { | |
| "epoch": 0.9, | |
| "learning_rate": 9.00958466453674e-05, | |
| "loss": 0.9206, | |
| "step": 1410 | |
| }, | |
| { | |
| "epoch": 0.91, | |
| "learning_rate": 9.073482428115016e-05, | |
| "loss": 0.788, | |
| "step": 1420 | |
| }, | |
| { | |
| "epoch": 0.91, | |
| "learning_rate": 9.137380191693292e-05, | |
| "loss": 0.8313, | |
| "step": 1430 | |
| }, | |
| { | |
| "epoch": 0.92, | |
| "learning_rate": 9.201277955271566e-05, | |
| "loss": 0.8072, | |
| "step": 1440 | |
| }, | |
| { | |
| "epoch": 0.93, | |
| "learning_rate": 9.26517571884984e-05, | |
| "loss": 0.8115, | |
| "step": 1450 | |
| }, | |
| { | |
| "epoch": 0.93, | |
| "learning_rate": 9.329073482428115e-05, | |
| "loss": 0.7849, | |
| "step": 1460 | |
| }, | |
| { | |
| "epoch": 0.94, | |
| "learning_rate": 9.39297124600639e-05, | |
| "loss": 0.8003, | |
| "step": 1470 | |
| }, | |
| { | |
| "epoch": 0.95, | |
| "learning_rate": 9.456869009584664e-05, | |
| "loss": 0.7835, | |
| "step": 1480 | |
| }, | |
| { | |
| "epoch": 0.95, | |
| "learning_rate": 9.52076677316294e-05, | |
| "loss": 0.8598, | |
| "step": 1490 | |
| }, | |
| { | |
| "epoch": 0.96, | |
| "learning_rate": 9.584664536741214e-05, | |
| "loss": 0.746, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 0.96, | |
| "learning_rate": 9.648562300319489e-05, | |
| "loss": 0.8485, | |
| "step": 1510 | |
| }, | |
| { | |
| "epoch": 0.97, | |
| "learning_rate": 9.712460063897764e-05, | |
| "loss": 0.7976, | |
| "step": 1520 | |
| }, | |
| { | |
| "epoch": 0.98, | |
| "learning_rate": 9.776357827476038e-05, | |
| "loss": 0.7023, | |
| "step": 1530 | |
| }, | |
| { | |
| "epoch": 0.98, | |
| "learning_rate": 9.840255591054313e-05, | |
| "loss": 0.7586, | |
| "step": 1540 | |
| }, | |
| { | |
| "epoch": 0.99, | |
| "learning_rate": 9.904153354632587e-05, | |
| "loss": 0.771, | |
| "step": 1550 | |
| }, | |
| { | |
| "epoch": 1.0, | |
| "learning_rate": 9.968051118210863e-05, | |
| "loss": 0.7551, | |
| "step": 1560 | |
| }, | |
| { | |
| "epoch": 1.0, | |
| "learning_rate": 0.00010031948881789138, | |
| "loss": 0.7311, | |
| "step": 1570 | |
| }, | |
| { | |
| "epoch": 1.01, | |
| "learning_rate": 0.00010095846645367413, | |
| "loss": 0.7774, | |
| "step": 1580 | |
| }, | |
| { | |
| "epoch": 1.02, | |
| "learning_rate": 0.00010159744408945687, | |
| "loss": 0.7289, | |
| "step": 1590 | |
| }, | |
| { | |
| "epoch": 1.02, | |
| "learning_rate": 0.00010223642172523961, | |
| "loss": 0.7326, | |
| "step": 1600 | |
| }, | |
| { | |
| "epoch": 1.03, | |
| "learning_rate": 0.00010287539936102237, | |
| "loss": 0.7089, | |
| "step": 1610 | |
| }, | |
| { | |
| "epoch": 1.04, | |
| "learning_rate": 0.00010351437699680512, | |
| "loss": 0.6825, | |
| "step": 1620 | |
| }, | |
| { | |
| "epoch": 1.04, | |
| "learning_rate": 0.00010415335463258787, | |
| "loss": 0.7002, | |
| "step": 1630 | |
| }, | |
| { | |
| "epoch": 1.05, | |
| "learning_rate": 0.00010479233226837061, | |
| "loss": 0.6959, | |
| "step": 1640 | |
| }, | |
| { | |
| "epoch": 1.05, | |
| "learning_rate": 0.00010543130990415335, | |
| "loss": 0.713, | |
| "step": 1650 | |
| }, | |
| { | |
| "epoch": 1.06, | |
| "learning_rate": 0.00010607028753993611, | |
| "loss": 0.6884, | |
| "step": 1660 | |
| }, | |
| { | |
| "epoch": 1.07, | |
| "learning_rate": 0.00010670926517571885, | |
| "loss": 0.6914, | |
| "step": 1670 | |
| }, | |
| { | |
| "epoch": 1.07, | |
| "learning_rate": 0.00010734824281150161, | |
| "loss": 0.6628, | |
| "step": 1680 | |
| }, | |
| { | |
| "epoch": 1.08, | |
| "learning_rate": 0.00010798722044728435, | |
| "loss": 0.7524, | |
| "step": 1690 | |
| }, | |
| { | |
| "epoch": 1.09, | |
| "learning_rate": 0.00010862619808306709, | |
| "loss": 0.6824, | |
| "step": 1700 | |
| }, | |
| { | |
| "epoch": 1.09, | |
| "learning_rate": 0.00010926517571884985, | |
| "loss": 0.6922, | |
| "step": 1710 | |
| }, | |
| { | |
| "epoch": 1.1, | |
| "learning_rate": 0.00010990415335463259, | |
| "loss": 0.6298, | |
| "step": 1720 | |
| }, | |
| { | |
| "epoch": 1.11, | |
| "learning_rate": 0.00011054313099041533, | |
| "loss": 0.6545, | |
| "step": 1730 | |
| }, | |
| { | |
| "epoch": 1.11, | |
| "learning_rate": 0.00011118210862619808, | |
| "loss": 0.6842, | |
| "step": 1740 | |
| }, | |
| { | |
| "epoch": 1.12, | |
| "learning_rate": 0.00011182108626198083, | |
| "loss": 0.6909, | |
| "step": 1750 | |
| }, | |
| { | |
| "epoch": 1.12, | |
| "learning_rate": 0.00011246006389776359, | |
| "loss": 0.687, | |
| "step": 1760 | |
| }, | |
| { | |
| "epoch": 1.13, | |
| "learning_rate": 0.00011309904153354633, | |
| "loss": 0.6096, | |
| "step": 1770 | |
| }, | |
| { | |
| "epoch": 1.14, | |
| "learning_rate": 0.00011373801916932908, | |
| "loss": 0.6599, | |
| "step": 1780 | |
| }, | |
| { | |
| "epoch": 1.14, | |
| "learning_rate": 0.00011437699680511182, | |
| "loss": 0.7088, | |
| "step": 1790 | |
| }, | |
| { | |
| "epoch": 1.15, | |
| "learning_rate": 0.00011501597444089456, | |
| "loss": 0.7042, | |
| "step": 1800 | |
| }, | |
| { | |
| "epoch": 1.16, | |
| "learning_rate": 0.00011565495207667733, | |
| "loss": 0.6482, | |
| "step": 1810 | |
| }, | |
| { | |
| "epoch": 1.16, | |
| "learning_rate": 0.00011629392971246007, | |
| "loss": 0.6221, | |
| "step": 1820 | |
| }, | |
| { | |
| "epoch": 1.17, | |
| "learning_rate": 0.00011693290734824282, | |
| "loss": 0.6134, | |
| "step": 1830 | |
| }, | |
| { | |
| "epoch": 1.18, | |
| "learning_rate": 0.00011757188498402556, | |
| "loss": 0.5959, | |
| "step": 1840 | |
| }, | |
| { | |
| "epoch": 1.18, | |
| "learning_rate": 0.0001182108626198083, | |
| "loss": 0.6201, | |
| "step": 1850 | |
| }, | |
| { | |
| "epoch": 1.19, | |
| "learning_rate": 0.00011884984025559106, | |
| "loss": 0.6298, | |
| "step": 1860 | |
| }, | |
| { | |
| "epoch": 1.19, | |
| "learning_rate": 0.00011948881789137381, | |
| "loss": 0.5908, | |
| "step": 1870 | |
| }, | |
| { | |
| "epoch": 1.2, | |
| "learning_rate": 0.00012012779552715656, | |
| "loss": 0.5862, | |
| "step": 1880 | |
| }, | |
| { | |
| "epoch": 1.21, | |
| "learning_rate": 0.0001207667731629393, | |
| "loss": 0.6449, | |
| "step": 1890 | |
| }, | |
| { | |
| "epoch": 1.21, | |
| "learning_rate": 0.00012140575079872204, | |
| "loss": 0.5922, | |
| "step": 1900 | |
| }, | |
| { | |
| "epoch": 1.22, | |
| "learning_rate": 0.0001220447284345048, | |
| "loss": 0.604, | |
| "step": 1910 | |
| }, | |
| { | |
| "epoch": 1.23, | |
| "learning_rate": 0.00012268370607028756, | |
| "loss": 0.6396, | |
| "step": 1920 | |
| }, | |
| { | |
| "epoch": 1.23, | |
| "learning_rate": 0.00012332268370607028, | |
| "loss": 0.6068, | |
| "step": 1930 | |
| }, | |
| { | |
| "epoch": 1.24, | |
| "learning_rate": 0.00012396166134185304, | |
| "loss": 0.6454, | |
| "step": 1940 | |
| }, | |
| { | |
| "epoch": 1.25, | |
| "learning_rate": 0.00012460063897763577, | |
| "loss": 0.5194, | |
| "step": 1950 | |
| }, | |
| { | |
| "epoch": 1.25, | |
| "learning_rate": 0.00012523961661341853, | |
| "loss": 0.5865, | |
| "step": 1960 | |
| }, | |
| { | |
| "epoch": 1.26, | |
| "learning_rate": 0.00012587859424920128, | |
| "loss": 0.5784, | |
| "step": 1970 | |
| }, | |
| { | |
| "epoch": 1.27, | |
| "learning_rate": 0.00012651757188498404, | |
| "loss": 0.559, | |
| "step": 1980 | |
| }, | |
| { | |
| "epoch": 1.27, | |
| "learning_rate": 0.00012715654952076677, | |
| "loss": 0.5501, | |
| "step": 1990 | |
| }, | |
| { | |
| "epoch": 1.28, | |
| "learning_rate": 0.00012779552715654952, | |
| "loss": 0.6316, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 1.28, | |
| "learning_rate": 0.00012843450479233225, | |
| "loss": 0.593, | |
| "step": 2010 | |
| }, | |
| { | |
| "epoch": 1.29, | |
| "learning_rate": 0.000129073482428115, | |
| "loss": 0.5946, | |
| "step": 2020 | |
| }, | |
| { | |
| "epoch": 1.3, | |
| "learning_rate": 0.00012971246006389777, | |
| "loss": 0.5813, | |
| "step": 2030 | |
| }, | |
| { | |
| "epoch": 1.3, | |
| "learning_rate": 0.00013035143769968052, | |
| "loss": 0.5541, | |
| "step": 2040 | |
| }, | |
| { | |
| "epoch": 1.31, | |
| "learning_rate": 0.00013099041533546328, | |
| "loss": 0.5761, | |
| "step": 2050 | |
| }, | |
| { | |
| "epoch": 1.32, | |
| "learning_rate": 0.000131629392971246, | |
| "loss": 0.557, | |
| "step": 2060 | |
| }, | |
| { | |
| "epoch": 1.32, | |
| "learning_rate": 0.00013226837060702876, | |
| "loss": 0.5663, | |
| "step": 2070 | |
| }, | |
| { | |
| "epoch": 1.33, | |
| "learning_rate": 0.0001329073482428115, | |
| "loss": 0.5496, | |
| "step": 2080 | |
| }, | |
| { | |
| "epoch": 1.34, | |
| "learning_rate": 0.00013354632587859425, | |
| "loss": 0.5291, | |
| "step": 2090 | |
| }, | |
| { | |
| "epoch": 1.34, | |
| "learning_rate": 0.000134185303514377, | |
| "loss": 0.565, | |
| "step": 2100 | |
| }, | |
| { | |
| "epoch": 1.35, | |
| "learning_rate": 0.00013482428115015973, | |
| "loss": 0.5763, | |
| "step": 2110 | |
| }, | |
| { | |
| "epoch": 1.35, | |
| "learning_rate": 0.0001354632587859425, | |
| "loss": 0.6175, | |
| "step": 2120 | |
| }, | |
| { | |
| "epoch": 1.36, | |
| "learning_rate": 0.00013610223642172525, | |
| "loss": 0.5378, | |
| "step": 2130 | |
| }, | |
| { | |
| "epoch": 1.37, | |
| "learning_rate": 0.000136741214057508, | |
| "loss": 0.574, | |
| "step": 2140 | |
| }, | |
| { | |
| "epoch": 1.37, | |
| "learning_rate": 0.00013738019169329073, | |
| "loss": 0.561, | |
| "step": 2150 | |
| }, | |
| { | |
| "epoch": 1.38, | |
| "learning_rate": 0.0001380191693290735, | |
| "loss": 0.5277, | |
| "step": 2160 | |
| }, | |
| { | |
| "epoch": 1.39, | |
| "learning_rate": 0.00013865814696485625, | |
| "loss": 0.5662, | |
| "step": 2170 | |
| }, | |
| { | |
| "epoch": 1.39, | |
| "learning_rate": 0.00013929712460063897, | |
| "loss": 0.526, | |
| "step": 2180 | |
| }, | |
| { | |
| "epoch": 1.4, | |
| "learning_rate": 0.00013993610223642173, | |
| "loss": 0.4969, | |
| "step": 2190 | |
| }, | |
| { | |
| "epoch": 1.41, | |
| "learning_rate": 0.00014057507987220446, | |
| "loss": 0.5275, | |
| "step": 2200 | |
| }, | |
| { | |
| "epoch": 1.41, | |
| "learning_rate": 0.00014121405750798722, | |
| "loss": 0.553, | |
| "step": 2210 | |
| }, | |
| { | |
| "epoch": 1.42, | |
| "learning_rate": 0.00014185303514376997, | |
| "loss": 0.5598, | |
| "step": 2220 | |
| }, | |
| { | |
| "epoch": 1.42, | |
| "learning_rate": 0.00014249201277955273, | |
| "loss": 0.5127, | |
| "step": 2230 | |
| }, | |
| { | |
| "epoch": 1.43, | |
| "learning_rate": 0.00014313099041533549, | |
| "loss": 0.5606, | |
| "step": 2240 | |
| }, | |
| { | |
| "epoch": 1.44, | |
| "learning_rate": 0.00014376996805111821, | |
| "loss": 0.5499, | |
| "step": 2250 | |
| }, | |
| { | |
| "epoch": 1.44, | |
| "learning_rate": 0.00014440894568690097, | |
| "loss": 0.5118, | |
| "step": 2260 | |
| }, | |
| { | |
| "epoch": 1.45, | |
| "learning_rate": 0.0001450479233226837, | |
| "loss": 0.5638, | |
| "step": 2270 | |
| }, | |
| { | |
| "epoch": 1.46, | |
| "learning_rate": 0.00014568690095846646, | |
| "loss": 0.5235, | |
| "step": 2280 | |
| }, | |
| { | |
| "epoch": 1.46, | |
| "learning_rate": 0.0001463258785942492, | |
| "loss": 0.5114, | |
| "step": 2290 | |
| }, | |
| { | |
| "epoch": 1.47, | |
| "learning_rate": 0.00014696485623003194, | |
| "loss": 0.5375, | |
| "step": 2300 | |
| }, | |
| { | |
| "epoch": 1.48, | |
| "learning_rate": 0.0001476038338658147, | |
| "loss": 0.5737, | |
| "step": 2310 | |
| }, | |
| { | |
| "epoch": 1.48, | |
| "learning_rate": 0.00014824281150159743, | |
| "loss": 0.541, | |
| "step": 2320 | |
| }, | |
| { | |
| "epoch": 1.49, | |
| "learning_rate": 0.0001488817891373802, | |
| "loss": 0.5112, | |
| "step": 2330 | |
| }, | |
| { | |
| "epoch": 1.5, | |
| "learning_rate": 0.00014952076677316294, | |
| "loss": 0.4936, | |
| "step": 2340 | |
| }, | |
| { | |
| "epoch": 1.5, | |
| "learning_rate": 0.0001501597444089457, | |
| "loss": 0.515, | |
| "step": 2350 | |
| }, | |
| { | |
| "epoch": 1.51, | |
| "learning_rate": 0.00015079872204472845, | |
| "loss": 0.507, | |
| "step": 2360 | |
| }, | |
| { | |
| "epoch": 1.51, | |
| "learning_rate": 0.00015143769968051118, | |
| "loss": 0.4934, | |
| "step": 2370 | |
| }, | |
| { | |
| "epoch": 1.52, | |
| "learning_rate": 0.00015207667731629394, | |
| "loss": 0.5081, | |
| "step": 2380 | |
| }, | |
| { | |
| "epoch": 1.53, | |
| "learning_rate": 0.00015271565495207667, | |
| "loss": 0.4726, | |
| "step": 2390 | |
| }, | |
| { | |
| "epoch": 1.53, | |
| "learning_rate": 0.00015335463258785942, | |
| "loss": 0.5149, | |
| "step": 2400 | |
| }, | |
| { | |
| "epoch": 1.54, | |
| "learning_rate": 0.00015399361022364218, | |
| "loss": 0.4544, | |
| "step": 2410 | |
| }, | |
| { | |
| "epoch": 1.55, | |
| "learning_rate": 0.0001546325878594249, | |
| "loss": 0.5026, | |
| "step": 2420 | |
| }, | |
| { | |
| "epoch": 1.55, | |
| "learning_rate": 0.0001552715654952077, | |
| "loss": 0.4987, | |
| "step": 2430 | |
| }, | |
| { | |
| "epoch": 1.56, | |
| "learning_rate": 0.00015591054313099042, | |
| "loss": 0.4715, | |
| "step": 2440 | |
| }, | |
| { | |
| "epoch": 1.57, | |
| "learning_rate": 0.00015654952076677318, | |
| "loss": 0.5137, | |
| "step": 2450 | |
| }, | |
| { | |
| "epoch": 1.57, | |
| "learning_rate": 0.0001571884984025559, | |
| "loss": 0.4659, | |
| "step": 2460 | |
| }, | |
| { | |
| "epoch": 1.58, | |
| "learning_rate": 0.00015782747603833866, | |
| "loss": 0.5293, | |
| "step": 2470 | |
| }, | |
| { | |
| "epoch": 1.58, | |
| "learning_rate": 0.00015846645367412142, | |
| "loss": 0.4848, | |
| "step": 2480 | |
| }, | |
| { | |
| "epoch": 1.59, | |
| "learning_rate": 0.00015910543130990415, | |
| "loss": 0.5464, | |
| "step": 2490 | |
| }, | |
| { | |
| "epoch": 1.6, | |
| "learning_rate": 0.0001597444089456869, | |
| "loss": 0.4918, | |
| "step": 2500 | |
| }, | |
| { | |
| "epoch": 1.6, | |
| "learning_rate": 0.00016038338658146963, | |
| "loss": 0.4821, | |
| "step": 2510 | |
| }, | |
| { | |
| "epoch": 1.61, | |
| "learning_rate": 0.0001610223642172524, | |
| "loss": 0.4464, | |
| "step": 2520 | |
| }, | |
| { | |
| "epoch": 1.62, | |
| "learning_rate": 0.00016166134185303515, | |
| "loss": 0.5041, | |
| "step": 2530 | |
| }, | |
| { | |
| "epoch": 1.62, | |
| "learning_rate": 0.0001623003194888179, | |
| "loss": 0.5254, | |
| "step": 2540 | |
| }, | |
| { | |
| "epoch": 1.63, | |
| "learning_rate": 0.00016293929712460066, | |
| "loss": 0.4722, | |
| "step": 2550 | |
| }, | |
| { | |
| "epoch": 1.64, | |
| "learning_rate": 0.0001635782747603834, | |
| "loss": 0.5127, | |
| "step": 2560 | |
| }, | |
| { | |
| "epoch": 1.64, | |
| "learning_rate": 0.00016421725239616614, | |
| "loss": 0.4978, | |
| "step": 2570 | |
| }, | |
| { | |
| "epoch": 1.65, | |
| "learning_rate": 0.00016485623003194887, | |
| "loss": 0.5174, | |
| "step": 2580 | |
| }, | |
| { | |
| "epoch": 1.65, | |
| "learning_rate": 0.00016549520766773163, | |
| "loss": 0.528, | |
| "step": 2590 | |
| }, | |
| { | |
| "epoch": 1.66, | |
| "learning_rate": 0.0001661341853035144, | |
| "loss": 0.5612, | |
| "step": 2600 | |
| }, | |
| { | |
| "epoch": 1.67, | |
| "learning_rate": 0.00016677316293929712, | |
| "loss": 0.4953, | |
| "step": 2610 | |
| }, | |
| { | |
| "epoch": 1.67, | |
| "learning_rate": 0.00016741214057507987, | |
| "loss": 0.475, | |
| "step": 2620 | |
| }, | |
| { | |
| "epoch": 1.68, | |
| "learning_rate": 0.00016805111821086263, | |
| "loss": 0.476, | |
| "step": 2630 | |
| }, | |
| { | |
| "epoch": 1.69, | |
| "learning_rate": 0.00016869009584664538, | |
| "loss": 0.4799, | |
| "step": 2640 | |
| }, | |
| { | |
| "epoch": 1.69, | |
| "learning_rate": 0.00016932907348242811, | |
| "loss": 0.4838, | |
| "step": 2650 | |
| }, | |
| { | |
| "epoch": 1.7, | |
| "learning_rate": 0.00016996805111821087, | |
| "loss": 0.5215, | |
| "step": 2660 | |
| }, | |
| { | |
| "epoch": 1.71, | |
| "learning_rate": 0.00017060702875399363, | |
| "loss": 0.4927, | |
| "step": 2670 | |
| }, | |
| { | |
| "epoch": 1.71, | |
| "learning_rate": 0.00017124600638977636, | |
| "loss": 0.4973, | |
| "step": 2680 | |
| }, | |
| { | |
| "epoch": 1.72, | |
| "learning_rate": 0.0001718849840255591, | |
| "loss": 0.4703, | |
| "step": 2690 | |
| }, | |
| { | |
| "epoch": 1.73, | |
| "learning_rate": 0.00017252396166134184, | |
| "loss": 0.5073, | |
| "step": 2700 | |
| }, | |
| { | |
| "epoch": 1.73, | |
| "learning_rate": 0.0001731629392971246, | |
| "loss": 0.4445, | |
| "step": 2710 | |
| }, | |
| { | |
| "epoch": 1.74, | |
| "learning_rate": 0.00017380191693290733, | |
| "loss": 0.463, | |
| "step": 2720 | |
| }, | |
| { | |
| "epoch": 1.74, | |
| "learning_rate": 0.0001744408945686901, | |
| "loss": 0.4289, | |
| "step": 2730 | |
| }, | |
| { | |
| "epoch": 1.75, | |
| "learning_rate": 0.00017507987220447287, | |
| "loss": 0.4378, | |
| "step": 2740 | |
| }, | |
| { | |
| "epoch": 1.76, | |
| "learning_rate": 0.0001757188498402556, | |
| "loss": 0.4408, | |
| "step": 2750 | |
| }, | |
| { | |
| "epoch": 1.76, | |
| "learning_rate": 0.00017635782747603835, | |
| "loss": 0.518, | |
| "step": 2760 | |
| }, | |
| { | |
| "epoch": 1.77, | |
| "learning_rate": 0.00017699680511182108, | |
| "loss": 0.4583, | |
| "step": 2770 | |
| }, | |
| { | |
| "epoch": 1.78, | |
| "learning_rate": 0.00017763578274760384, | |
| "loss": 0.4415, | |
| "step": 2780 | |
| }, | |
| { | |
| "epoch": 1.78, | |
| "learning_rate": 0.0001782747603833866, | |
| "loss": 0.4543, | |
| "step": 2790 | |
| }, | |
| { | |
| "epoch": 1.79, | |
| "learning_rate": 0.00017891373801916932, | |
| "loss": 0.4353, | |
| "step": 2800 | |
| }, | |
| { | |
| "epoch": 1.8, | |
| "learning_rate": 0.00017955271565495208, | |
| "loss": 0.5315, | |
| "step": 2810 | |
| }, | |
| { | |
| "epoch": 1.8, | |
| "learning_rate": 0.0001801916932907348, | |
| "loss": 0.468, | |
| "step": 2820 | |
| }, | |
| { | |
| "epoch": 1.81, | |
| "learning_rate": 0.0001808306709265176, | |
| "loss": 0.4915, | |
| "step": 2830 | |
| }, | |
| { | |
| "epoch": 1.81, | |
| "learning_rate": 0.00018146964856230032, | |
| "loss": 0.4684, | |
| "step": 2840 | |
| }, | |
| { | |
| "epoch": 1.82, | |
| "learning_rate": 0.00018210862619808308, | |
| "loss": 0.4367, | |
| "step": 2850 | |
| }, | |
| { | |
| "epoch": 1.83, | |
| "learning_rate": 0.00018274760383386583, | |
| "loss": 0.3751, | |
| "step": 2860 | |
| }, | |
| { | |
| "epoch": 1.83, | |
| "learning_rate": 0.00018338658146964856, | |
| "loss": 0.4347, | |
| "step": 2870 | |
| }, | |
| { | |
| "epoch": 1.84, | |
| "learning_rate": 0.00018402555910543132, | |
| "loss": 0.4611, | |
| "step": 2880 | |
| }, | |
| { | |
| "epoch": 1.85, | |
| "learning_rate": 0.00018466453674121405, | |
| "loss": 0.4425, | |
| "step": 2890 | |
| }, | |
| { | |
| "epoch": 1.85, | |
| "learning_rate": 0.0001853035143769968, | |
| "loss": 0.4483, | |
| "step": 2900 | |
| }, | |
| { | |
| "epoch": 1.86, | |
| "learning_rate": 0.00018594249201277953, | |
| "loss": 0.4603, | |
| "step": 2910 | |
| }, | |
| { | |
| "epoch": 1.87, | |
| "learning_rate": 0.0001865814696485623, | |
| "loss": 0.4369, | |
| "step": 2920 | |
| }, | |
| { | |
| "epoch": 1.87, | |
| "learning_rate": 0.00018722044728434507, | |
| "loss": 0.4521, | |
| "step": 2930 | |
| }, | |
| { | |
| "epoch": 1.88, | |
| "learning_rate": 0.0001878594249201278, | |
| "loss": 0.4239, | |
| "step": 2940 | |
| }, | |
| { | |
| "epoch": 1.88, | |
| "learning_rate": 0.00018849840255591056, | |
| "loss": 0.3795, | |
| "step": 2950 | |
| }, | |
| { | |
| "epoch": 1.89, | |
| "learning_rate": 0.0001891373801916933, | |
| "loss": 0.477, | |
| "step": 2960 | |
| }, | |
| { | |
| "epoch": 1.9, | |
| "learning_rate": 0.00018977635782747604, | |
| "loss": 0.4273, | |
| "step": 2970 | |
| }, | |
| { | |
| "epoch": 1.9, | |
| "learning_rate": 0.0001904153354632588, | |
| "loss": 0.4786, | |
| "step": 2980 | |
| }, | |
| { | |
| "epoch": 1.91, | |
| "learning_rate": 0.00019105431309904153, | |
| "loss": 0.4803, | |
| "step": 2990 | |
| }, | |
| { | |
| "epoch": 1.92, | |
| "learning_rate": 0.00019169329073482429, | |
| "loss": 0.4497, | |
| "step": 3000 | |
| }, | |
| { | |
| "epoch": 1.92, | |
| "learning_rate": 0.00019233226837060702, | |
| "loss": 0.4749, | |
| "step": 3010 | |
| }, | |
| { | |
| "epoch": 1.93, | |
| "learning_rate": 0.00019297124600638977, | |
| "loss": 0.4231, | |
| "step": 3020 | |
| }, | |
| { | |
| "epoch": 1.94, | |
| "learning_rate": 0.00019361022364217253, | |
| "loss": 0.4618, | |
| "step": 3030 | |
| }, | |
| { | |
| "epoch": 1.94, | |
| "learning_rate": 0.00019424920127795528, | |
| "loss": 0.4265, | |
| "step": 3040 | |
| }, | |
| { | |
| "epoch": 1.95, | |
| "learning_rate": 0.00019488817891373804, | |
| "loss": 0.39, | |
| "step": 3050 | |
| }, | |
| { | |
| "epoch": 1.95, | |
| "learning_rate": 0.00019552715654952077, | |
| "loss": 0.4346, | |
| "step": 3060 | |
| }, | |
| { | |
| "epoch": 1.96, | |
| "learning_rate": 0.00019616613418530353, | |
| "loss": 0.4079, | |
| "step": 3070 | |
| }, | |
| { | |
| "epoch": 1.97, | |
| "learning_rate": 0.00019680511182108626, | |
| "loss": 0.4351, | |
| "step": 3080 | |
| }, | |
| { | |
| "epoch": 1.97, | |
| "learning_rate": 0.000197444089456869, | |
| "loss": 0.4402, | |
| "step": 3090 | |
| }, | |
| { | |
| "epoch": 1.98, | |
| "learning_rate": 0.00019808306709265174, | |
| "loss": 0.4294, | |
| "step": 3100 | |
| }, | |
| { | |
| "epoch": 1.99, | |
| "learning_rate": 0.0001987220447284345, | |
| "loss": 0.4079, | |
| "step": 3110 | |
| }, | |
| { | |
| "epoch": 1.99, | |
| "learning_rate": 0.00019936102236421725, | |
| "loss": 0.398, | |
| "step": 3120 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "learning_rate": 0.0002, | |
| "loss": 0.3759, | |
| "step": 3130 | |
| }, | |
| { | |
| "epoch": 2.01, | |
| "learning_rate": 0.00020063897763578277, | |
| "loss": 0.408, | |
| "step": 3140 | |
| }, | |
| { | |
| "epoch": 2.01, | |
| "learning_rate": 0.0002012779552715655, | |
| "loss": 0.4261, | |
| "step": 3150 | |
| }, | |
| { | |
| "epoch": 2.02, | |
| "learning_rate": 0.00020191693290734825, | |
| "loss": 0.3951, | |
| "step": 3160 | |
| }, | |
| { | |
| "epoch": 2.03, | |
| "learning_rate": 0.000202555910543131, | |
| "loss": 0.3488, | |
| "step": 3170 | |
| }, | |
| { | |
| "epoch": 2.03, | |
| "learning_rate": 0.00020319488817891374, | |
| "loss": 0.3529, | |
| "step": 3180 | |
| }, | |
| { | |
| "epoch": 2.04, | |
| "learning_rate": 0.0002038338658146965, | |
| "loss": 0.3806, | |
| "step": 3190 | |
| }, | |
| { | |
| "epoch": 2.04, | |
| "learning_rate": 0.00020447284345047922, | |
| "loss": 0.3641, | |
| "step": 3200 | |
| }, | |
| { | |
| "epoch": 2.05, | |
| "learning_rate": 0.00020511182108626198, | |
| "loss": 0.4043, | |
| "step": 3210 | |
| }, | |
| { | |
| "epoch": 2.06, | |
| "learning_rate": 0.00020575079872204473, | |
| "loss": 0.3598, | |
| "step": 3220 | |
| }, | |
| { | |
| "epoch": 2.06, | |
| "learning_rate": 0.0002063897763578275, | |
| "loss": 0.3858, | |
| "step": 3230 | |
| }, | |
| { | |
| "epoch": 2.07, | |
| "learning_rate": 0.00020702875399361025, | |
| "loss": 0.3666, | |
| "step": 3240 | |
| }, | |
| { | |
| "epoch": 2.08, | |
| "learning_rate": 0.00020766773162939298, | |
| "loss": 0.3702, | |
| "step": 3250 | |
| }, | |
| { | |
| "epoch": 2.08, | |
| "learning_rate": 0.00020830670926517573, | |
| "loss": 0.3782, | |
| "step": 3260 | |
| }, | |
| { | |
| "epoch": 2.09, | |
| "learning_rate": 0.00020894568690095846, | |
| "loss": 0.3782, | |
| "step": 3270 | |
| }, | |
| { | |
| "epoch": 2.1, | |
| "learning_rate": 0.00020958466453674122, | |
| "loss": 0.3474, | |
| "step": 3280 | |
| }, | |
| { | |
| "epoch": 2.1, | |
| "learning_rate": 0.00021022364217252395, | |
| "loss": 0.3645, | |
| "step": 3290 | |
| }, | |
| { | |
| "epoch": 2.11, | |
| "learning_rate": 0.0002108626198083067, | |
| "loss": 0.4034, | |
| "step": 3300 | |
| }, | |
| { | |
| "epoch": 2.11, | |
| "learning_rate": 0.00021150159744408946, | |
| "loss": 0.3892, | |
| "step": 3310 | |
| }, | |
| { | |
| "epoch": 2.12, | |
| "learning_rate": 0.00021214057507987222, | |
| "loss": 0.3843, | |
| "step": 3320 | |
| }, | |
| { | |
| "epoch": 2.13, | |
| "learning_rate": 0.00021277955271565497, | |
| "loss": 0.3667, | |
| "step": 3330 | |
| }, | |
| { | |
| "epoch": 2.13, | |
| "learning_rate": 0.0002134185303514377, | |
| "loss": 0.3954, | |
| "step": 3340 | |
| }, | |
| { | |
| "epoch": 2.14, | |
| "learning_rate": 0.00021405750798722046, | |
| "loss": 0.3733, | |
| "step": 3350 | |
| }, | |
| { | |
| "epoch": 2.15, | |
| "learning_rate": 0.00021469648562300321, | |
| "loss": 0.3801, | |
| "step": 3360 | |
| }, | |
| { | |
| "epoch": 2.15, | |
| "learning_rate": 0.00021533546325878594, | |
| "loss": 0.3813, | |
| "step": 3370 | |
| }, | |
| { | |
| "epoch": 2.16, | |
| "learning_rate": 0.0002159744408945687, | |
| "loss": 0.382, | |
| "step": 3380 | |
| }, | |
| { | |
| "epoch": 2.17, | |
| "learning_rate": 0.00021661341853035143, | |
| "loss": 0.3959, | |
| "step": 3390 | |
| }, | |
| { | |
| "epoch": 2.17, | |
| "learning_rate": 0.00021725239616613419, | |
| "loss": 0.338, | |
| "step": 3400 | |
| }, | |
| { | |
| "epoch": 2.18, | |
| "learning_rate": 0.00021789137380191691, | |
| "loss": 0.3884, | |
| "step": 3410 | |
| }, | |
| { | |
| "epoch": 2.19, | |
| "learning_rate": 0.0002185303514376997, | |
| "loss": 0.3583, | |
| "step": 3420 | |
| }, | |
| { | |
| "epoch": 2.19, | |
| "learning_rate": 0.00021916932907348245, | |
| "loss": 0.3224, | |
| "step": 3430 | |
| }, | |
| { | |
| "epoch": 2.2, | |
| "learning_rate": 0.00021980830670926518, | |
| "loss": 0.3587, | |
| "step": 3440 | |
| }, | |
| { | |
| "epoch": 2.2, | |
| "learning_rate": 0.00022044728434504794, | |
| "loss": 0.3493, | |
| "step": 3450 | |
| }, | |
| { | |
| "epoch": 2.21, | |
| "learning_rate": 0.00022108626198083067, | |
| "loss": 0.392, | |
| "step": 3460 | |
| }, | |
| { | |
| "epoch": 2.22, | |
| "learning_rate": 0.00022172523961661343, | |
| "loss": 0.3555, | |
| "step": 3470 | |
| }, | |
| { | |
| "epoch": 2.22, | |
| "learning_rate": 0.00022236421725239615, | |
| "loss": 0.4006, | |
| "step": 3480 | |
| }, | |
| { | |
| "epoch": 2.23, | |
| "learning_rate": 0.0002230031948881789, | |
| "loss": 0.3817, | |
| "step": 3490 | |
| }, | |
| { | |
| "epoch": 2.24, | |
| "learning_rate": 0.00022364217252396167, | |
| "loss": 0.3957, | |
| "step": 3500 | |
| }, | |
| { | |
| "epoch": 2.24, | |
| "learning_rate": 0.0002242811501597444, | |
| "loss": 0.3538, | |
| "step": 3510 | |
| }, | |
| { | |
| "epoch": 2.25, | |
| "learning_rate": 0.00022492012779552718, | |
| "loss": 0.3811, | |
| "step": 3520 | |
| }, | |
| { | |
| "epoch": 2.26, | |
| "learning_rate": 0.0002255591054313099, | |
| "loss": 0.3615, | |
| "step": 3530 | |
| }, | |
| { | |
| "epoch": 2.26, | |
| "learning_rate": 0.00022619808306709267, | |
| "loss": 0.3491, | |
| "step": 3540 | |
| }, | |
| { | |
| "epoch": 2.27, | |
| "learning_rate": 0.00022683706070287542, | |
| "loss": 0.3904, | |
| "step": 3550 | |
| }, | |
| { | |
| "epoch": 2.27, | |
| "learning_rate": 0.00022747603833865815, | |
| "loss": 0.3692, | |
| "step": 3560 | |
| }, | |
| { | |
| "epoch": 2.28, | |
| "learning_rate": 0.0002281150159744409, | |
| "loss": 0.3764, | |
| "step": 3570 | |
| }, | |
| { | |
| "epoch": 2.29, | |
| "learning_rate": 0.00022875399361022364, | |
| "loss": 0.3189, | |
| "step": 3580 | |
| }, | |
| { | |
| "epoch": 2.29, | |
| "learning_rate": 0.0002293929712460064, | |
| "loss": 0.3437, | |
| "step": 3590 | |
| }, | |
| { | |
| "epoch": 2.3, | |
| "learning_rate": 0.00023003194888178912, | |
| "loss": 0.38, | |
| "step": 3600 | |
| }, | |
| { | |
| "epoch": 2.31, | |
| "learning_rate": 0.00023067092651757188, | |
| "loss": 0.3694, | |
| "step": 3610 | |
| }, | |
| { | |
| "epoch": 2.31, | |
| "learning_rate": 0.00023130990415335466, | |
| "loss": 0.3297, | |
| "step": 3620 | |
| }, | |
| { | |
| "epoch": 2.32, | |
| "learning_rate": 0.0002319488817891374, | |
| "loss": 0.391, | |
| "step": 3630 | |
| }, | |
| { | |
| "epoch": 2.33, | |
| "learning_rate": 0.00023258785942492015, | |
| "loss": 0.3465, | |
| "step": 3640 | |
| }, | |
| { | |
| "epoch": 2.33, | |
| "learning_rate": 0.00023322683706070288, | |
| "loss": 0.3879, | |
| "step": 3650 | |
| }, | |
| { | |
| "epoch": 2.34, | |
| "learning_rate": 0.00023386581469648563, | |
| "loss": 0.3551, | |
| "step": 3660 | |
| }, | |
| { | |
| "epoch": 2.34, | |
| "learning_rate": 0.00023450479233226836, | |
| "loss": 0.3383, | |
| "step": 3670 | |
| }, | |
| { | |
| "epoch": 2.35, | |
| "learning_rate": 0.00023514376996805112, | |
| "loss": 0.3284, | |
| "step": 3680 | |
| }, | |
| { | |
| "epoch": 2.36, | |
| "learning_rate": 0.00023578274760383387, | |
| "loss": 0.3362, | |
| "step": 3690 | |
| }, | |
| { | |
| "epoch": 2.36, | |
| "learning_rate": 0.0002364217252396166, | |
| "loss": 0.349, | |
| "step": 3700 | |
| }, | |
| { | |
| "epoch": 2.37, | |
| "learning_rate": 0.00023706070287539936, | |
| "loss": 0.357, | |
| "step": 3710 | |
| }, | |
| { | |
| "epoch": 2.38, | |
| "learning_rate": 0.00023769968051118212, | |
| "loss": 0.3993, | |
| "step": 3720 | |
| }, | |
| { | |
| "epoch": 2.38, | |
| "learning_rate": 0.00023833865814696487, | |
| "loss": 0.3611, | |
| "step": 3730 | |
| }, | |
| { | |
| "epoch": 2.39, | |
| "learning_rate": 0.00023897763578274763, | |
| "loss": 0.3989, | |
| "step": 3740 | |
| }, | |
| { | |
| "epoch": 2.4, | |
| "learning_rate": 0.00023961661341853036, | |
| "loss": 0.3792, | |
| "step": 3750 | |
| }, | |
| { | |
| "epoch": 2.4, | |
| "learning_rate": 0.00024025559105431311, | |
| "loss": 0.3434, | |
| "step": 3760 | |
| }, | |
| { | |
| "epoch": 2.41, | |
| "learning_rate": 0.00024089456869009584, | |
| "loss": 0.3669, | |
| "step": 3770 | |
| }, | |
| { | |
| "epoch": 2.42, | |
| "learning_rate": 0.0002415335463258786, | |
| "loss": 0.3858, | |
| "step": 3780 | |
| }, | |
| { | |
| "epoch": 2.42, | |
| "learning_rate": 0.00024217252396166133, | |
| "loss": 0.3016, | |
| "step": 3790 | |
| }, | |
| { | |
| "epoch": 2.43, | |
| "learning_rate": 0.00024281150159744408, | |
| "loss": 0.3253, | |
| "step": 3800 | |
| }, | |
| { | |
| "epoch": 2.43, | |
| "learning_rate": 0.00024345047923322684, | |
| "loss": 0.3811, | |
| "step": 3810 | |
| }, | |
| { | |
| "epoch": 2.44, | |
| "learning_rate": 0.0002440894568690096, | |
| "loss": 0.338, | |
| "step": 3820 | |
| }, | |
| { | |
| "epoch": 2.45, | |
| "learning_rate": 0.0002447284345047923, | |
| "loss": 0.3214, | |
| "step": 3830 | |
| }, | |
| { | |
| "epoch": 2.45, | |
| "learning_rate": 0.0002453674121405751, | |
| "loss": 0.3696, | |
| "step": 3840 | |
| }, | |
| { | |
| "epoch": 2.46, | |
| "learning_rate": 0.00024600638977635784, | |
| "loss": 0.3624, | |
| "step": 3850 | |
| }, | |
| { | |
| "epoch": 2.47, | |
| "learning_rate": 0.00024664536741214057, | |
| "loss": 0.3538, | |
| "step": 3860 | |
| }, | |
| { | |
| "epoch": 2.47, | |
| "learning_rate": 0.00024728434504792335, | |
| "loss": 0.372, | |
| "step": 3870 | |
| }, | |
| { | |
| "epoch": 2.48, | |
| "learning_rate": 0.0002479233226837061, | |
| "loss": 0.3884, | |
| "step": 3880 | |
| }, | |
| { | |
| "epoch": 2.49, | |
| "learning_rate": 0.0002485623003194888, | |
| "loss": 0.325, | |
| "step": 3890 | |
| }, | |
| { | |
| "epoch": 2.49, | |
| "learning_rate": 0.00024920127795527154, | |
| "loss": 0.3567, | |
| "step": 3900 | |
| }, | |
| { | |
| "epoch": 2.5, | |
| "learning_rate": 0.0002498402555910543, | |
| "loss": 0.379, | |
| "step": 3910 | |
| }, | |
| { | |
| "epoch": 2.5, | |
| "learning_rate": 0.00025047923322683705, | |
| "loss": 0.3542, | |
| "step": 3920 | |
| }, | |
| { | |
| "epoch": 2.51, | |
| "learning_rate": 0.00025111821086261984, | |
| "loss": 0.3739, | |
| "step": 3930 | |
| }, | |
| { | |
| "epoch": 2.52, | |
| "learning_rate": 0.00025175718849840256, | |
| "loss": 0.3657, | |
| "step": 3940 | |
| }, | |
| { | |
| "epoch": 2.52, | |
| "learning_rate": 0.0002523961661341853, | |
| "loss": 0.3499, | |
| "step": 3950 | |
| }, | |
| { | |
| "epoch": 2.53, | |
| "learning_rate": 0.0002530351437699681, | |
| "loss": 0.3428, | |
| "step": 3960 | |
| }, | |
| { | |
| "epoch": 2.54, | |
| "learning_rate": 0.0002536741214057508, | |
| "loss": 0.3369, | |
| "step": 3970 | |
| }, | |
| { | |
| "epoch": 2.54, | |
| "learning_rate": 0.00025431309904153354, | |
| "loss": 0.4055, | |
| "step": 3980 | |
| }, | |
| { | |
| "epoch": 2.55, | |
| "learning_rate": 0.00025495207667731626, | |
| "loss": 0.365, | |
| "step": 3990 | |
| }, | |
| { | |
| "epoch": 2.56, | |
| "learning_rate": 0.00025559105431309905, | |
| "loss": 0.3533, | |
| "step": 4000 | |
| }, | |
| { | |
| "epoch": 2.56, | |
| "learning_rate": 0.0002562300319488818, | |
| "loss": 0.3223, | |
| "step": 4010 | |
| }, | |
| { | |
| "epoch": 2.57, | |
| "learning_rate": 0.0002568690095846645, | |
| "loss": 0.3176, | |
| "step": 4020 | |
| }, | |
| { | |
| "epoch": 2.57, | |
| "learning_rate": 0.0002575079872204473, | |
| "loss": 0.3098, | |
| "step": 4030 | |
| }, | |
| { | |
| "epoch": 2.58, | |
| "learning_rate": 0.00025814696485623, | |
| "loss": 0.3792, | |
| "step": 4040 | |
| }, | |
| { | |
| "epoch": 2.59, | |
| "learning_rate": 0.00025878594249201275, | |
| "loss": 0.357, | |
| "step": 4050 | |
| }, | |
| { | |
| "epoch": 2.59, | |
| "learning_rate": 0.00025942492012779553, | |
| "loss": 0.3706, | |
| "step": 4060 | |
| }, | |
| { | |
| "epoch": 2.6, | |
| "learning_rate": 0.0002600638977635783, | |
| "loss": 0.346, | |
| "step": 4070 | |
| }, | |
| { | |
| "epoch": 2.61, | |
| "learning_rate": 0.00026070287539936104, | |
| "loss": 0.341, | |
| "step": 4080 | |
| }, | |
| { | |
| "epoch": 2.61, | |
| "learning_rate": 0.0002613418530351438, | |
| "loss": 0.3352, | |
| "step": 4090 | |
| }, | |
| { | |
| "epoch": 2.62, | |
| "learning_rate": 0.00026198083067092656, | |
| "loss": 0.3219, | |
| "step": 4100 | |
| }, | |
| { | |
| "epoch": 2.63, | |
| "learning_rate": 0.0002626198083067093, | |
| "loss": 0.3638, | |
| "step": 4110 | |
| }, | |
| { | |
| "epoch": 2.63, | |
| "learning_rate": 0.000263258785942492, | |
| "loss": 0.3356, | |
| "step": 4120 | |
| }, | |
| { | |
| "epoch": 2.64, | |
| "learning_rate": 0.0002638977635782748, | |
| "loss": 0.3309, | |
| "step": 4130 | |
| }, | |
| { | |
| "epoch": 2.65, | |
| "learning_rate": 0.00026453674121405753, | |
| "loss": 0.3649, | |
| "step": 4140 | |
| }, | |
| { | |
| "epoch": 2.65, | |
| "learning_rate": 0.00026517571884984026, | |
| "loss": 0.3334, | |
| "step": 4150 | |
| }, | |
| { | |
| "epoch": 2.66, | |
| "learning_rate": 0.000265814696485623, | |
| "loss": 0.3279, | |
| "step": 4160 | |
| }, | |
| { | |
| "epoch": 2.66, | |
| "learning_rate": 0.00026645367412140577, | |
| "loss": 0.3603, | |
| "step": 4170 | |
| }, | |
| { | |
| "epoch": 2.67, | |
| "learning_rate": 0.0002670926517571885, | |
| "loss": 0.3207, | |
| "step": 4180 | |
| }, | |
| { | |
| "epoch": 2.68, | |
| "learning_rate": 0.00026773162939297123, | |
| "loss": 0.2887, | |
| "step": 4190 | |
| }, | |
| { | |
| "epoch": 2.68, | |
| "learning_rate": 0.000268370607028754, | |
| "loss": 0.343, | |
| "step": 4200 | |
| }, | |
| { | |
| "epoch": 2.69, | |
| "learning_rate": 0.00026900958466453674, | |
| "loss": 0.3347, | |
| "step": 4210 | |
| }, | |
| { | |
| "epoch": 2.7, | |
| "learning_rate": 0.00026964856230031947, | |
| "loss": 0.3013, | |
| "step": 4220 | |
| }, | |
| { | |
| "epoch": 2.7, | |
| "learning_rate": 0.0002702875399361022, | |
| "loss": 0.3681, | |
| "step": 4230 | |
| }, | |
| { | |
| "epoch": 2.71, | |
| "learning_rate": 0.000270926517571885, | |
| "loss": 0.313, | |
| "step": 4240 | |
| }, | |
| { | |
| "epoch": 2.72, | |
| "learning_rate": 0.0002715654952076677, | |
| "loss": 0.3769, | |
| "step": 4250 | |
| }, | |
| { | |
| "epoch": 2.72, | |
| "learning_rate": 0.0002722044728434505, | |
| "loss": 0.346, | |
| "step": 4260 | |
| }, | |
| { | |
| "epoch": 2.73, | |
| "learning_rate": 0.0002728434504792333, | |
| "loss": 0.321, | |
| "step": 4270 | |
| }, | |
| { | |
| "epoch": 2.73, | |
| "learning_rate": 0.000273482428115016, | |
| "loss": 0.3783, | |
| "step": 4280 | |
| }, | |
| { | |
| "epoch": 2.74, | |
| "learning_rate": 0.00027412140575079874, | |
| "loss": 0.3621, | |
| "step": 4290 | |
| }, | |
| { | |
| "epoch": 2.75, | |
| "learning_rate": 0.00027476038338658147, | |
| "loss": 0.3509, | |
| "step": 4300 | |
| }, | |
| { | |
| "epoch": 2.75, | |
| "learning_rate": 0.00027539936102236425, | |
| "loss": 0.3836, | |
| "step": 4310 | |
| }, | |
| { | |
| "epoch": 2.76, | |
| "learning_rate": 0.000276038338658147, | |
| "loss": 0.3595, | |
| "step": 4320 | |
| }, | |
| { | |
| "epoch": 2.77, | |
| "learning_rate": 0.0002766773162939297, | |
| "loss": 0.3375, | |
| "step": 4330 | |
| }, | |
| { | |
| "epoch": 2.77, | |
| "learning_rate": 0.0002773162939297125, | |
| "loss": 0.3343, | |
| "step": 4340 | |
| }, | |
| { | |
| "epoch": 2.78, | |
| "learning_rate": 0.0002779552715654952, | |
| "loss": 0.3306, | |
| "step": 4350 | |
| }, | |
| { | |
| "epoch": 2.79, | |
| "learning_rate": 0.00027859424920127795, | |
| "loss": 0.3474, | |
| "step": 4360 | |
| }, | |
| { | |
| "epoch": 2.79, | |
| "learning_rate": 0.0002792332268370607, | |
| "loss": 0.3696, | |
| "step": 4370 | |
| }, | |
| { | |
| "epoch": 2.8, | |
| "learning_rate": 0.00027987220447284346, | |
| "loss": 0.35, | |
| "step": 4380 | |
| }, | |
| { | |
| "epoch": 2.8, | |
| "learning_rate": 0.0002805111821086262, | |
| "loss": 0.3887, | |
| "step": 4390 | |
| }, | |
| { | |
| "epoch": 2.81, | |
| "learning_rate": 0.0002811501597444089, | |
| "loss": 0.3449, | |
| "step": 4400 | |
| }, | |
| { | |
| "epoch": 2.82, | |
| "learning_rate": 0.0002817891373801917, | |
| "loss": 0.369, | |
| "step": 4410 | |
| }, | |
| { | |
| "epoch": 2.82, | |
| "learning_rate": 0.00028242811501597443, | |
| "loss": 0.373, | |
| "step": 4420 | |
| }, | |
| { | |
| "epoch": 2.83, | |
| "learning_rate": 0.00028306709265175716, | |
| "loss": 0.3299, | |
| "step": 4430 | |
| }, | |
| { | |
| "epoch": 2.84, | |
| "learning_rate": 0.00028370607028753995, | |
| "loss": 0.3233, | |
| "step": 4440 | |
| }, | |
| { | |
| "epoch": 2.84, | |
| "learning_rate": 0.0002843450479233227, | |
| "loss": 0.3629, | |
| "step": 4450 | |
| }, | |
| { | |
| "epoch": 2.85, | |
| "learning_rate": 0.00028498402555910546, | |
| "loss": 0.3576, | |
| "step": 4460 | |
| }, | |
| { | |
| "epoch": 2.86, | |
| "learning_rate": 0.0002856230031948882, | |
| "loss": 0.3053, | |
| "step": 4470 | |
| }, | |
| { | |
| "epoch": 2.86, | |
| "learning_rate": 0.00028626198083067097, | |
| "loss": 0.3185, | |
| "step": 4480 | |
| }, | |
| { | |
| "epoch": 2.87, | |
| "learning_rate": 0.0002869009584664537, | |
| "loss": 0.3423, | |
| "step": 4490 | |
| }, | |
| { | |
| "epoch": 2.88, | |
| "learning_rate": 0.00028753993610223643, | |
| "loss": 0.3727, | |
| "step": 4500 | |
| }, | |
| { | |
| "epoch": 2.88, | |
| "learning_rate": 0.0002881789137380192, | |
| "loss": 0.3121, | |
| "step": 4510 | |
| }, | |
| { | |
| "epoch": 2.89, | |
| "learning_rate": 0.00028881789137380194, | |
| "loss": 0.322, | |
| "step": 4520 | |
| }, | |
| { | |
| "epoch": 2.89, | |
| "learning_rate": 0.00028945686900958467, | |
| "loss": 0.3581, | |
| "step": 4530 | |
| }, | |
| { | |
| "epoch": 2.9, | |
| "learning_rate": 0.0002900958466453674, | |
| "loss": 0.339, | |
| "step": 4540 | |
| }, | |
| { | |
| "epoch": 2.91, | |
| "learning_rate": 0.0002907348242811502, | |
| "loss": 0.3226, | |
| "step": 4550 | |
| }, | |
| { | |
| "epoch": 2.91, | |
| "learning_rate": 0.0002913738019169329, | |
| "loss": 0.2947, | |
| "step": 4560 | |
| }, | |
| { | |
| "epoch": 2.92, | |
| "learning_rate": 0.00029201277955271564, | |
| "loss": 0.3572, | |
| "step": 4570 | |
| }, | |
| { | |
| "epoch": 2.93, | |
| "learning_rate": 0.0002926517571884984, | |
| "loss": 0.3029, | |
| "step": 4580 | |
| }, | |
| { | |
| "epoch": 2.93, | |
| "learning_rate": 0.00029329073482428115, | |
| "loss": 0.3149, | |
| "step": 4590 | |
| }, | |
| { | |
| "epoch": 2.94, | |
| "learning_rate": 0.0002939297124600639, | |
| "loss": 0.3521, | |
| "step": 4600 | |
| }, | |
| { | |
| "epoch": 2.95, | |
| "learning_rate": 0.0002945686900958466, | |
| "loss": 0.3207, | |
| "step": 4610 | |
| }, | |
| { | |
| "epoch": 2.95, | |
| "learning_rate": 0.0002952076677316294, | |
| "loss": 0.2926, | |
| "step": 4620 | |
| }, | |
| { | |
| "epoch": 2.96, | |
| "learning_rate": 0.0002958466453674121, | |
| "loss": 0.3318, | |
| "step": 4630 | |
| }, | |
| { | |
| "epoch": 2.96, | |
| "learning_rate": 0.00029648562300319485, | |
| "loss": 0.2907, | |
| "step": 4640 | |
| }, | |
| { | |
| "epoch": 2.97, | |
| "learning_rate": 0.00029712460063897764, | |
| "loss": 0.3876, | |
| "step": 4650 | |
| }, | |
| { | |
| "epoch": 2.98, | |
| "learning_rate": 0.0002977635782747604, | |
| "loss": 0.3375, | |
| "step": 4660 | |
| }, | |
| { | |
| "epoch": 2.98, | |
| "learning_rate": 0.00029840255591054315, | |
| "loss": 0.3327, | |
| "step": 4670 | |
| }, | |
| { | |
| "epoch": 2.99, | |
| "learning_rate": 0.0002990415335463259, | |
| "loss": 0.2991, | |
| "step": 4680 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "learning_rate": 0.00029968051118210866, | |
| "loss": 0.3027, | |
| "step": 4690 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "learning_rate": 0.0003003194888178914, | |
| "loss": 0.3189, | |
| "step": 4700 | |
| }, | |
| { | |
| "epoch": 3.01, | |
| "learning_rate": 0.0003009584664536741, | |
| "loss": 0.3073, | |
| "step": 4710 | |
| }, | |
| { | |
| "epoch": 3.02, | |
| "learning_rate": 0.0003015974440894569, | |
| "loss": 0.2792, | |
| "step": 4720 | |
| }, | |
| { | |
| "epoch": 3.02, | |
| "learning_rate": 0.00030223642172523963, | |
| "loss": 0.2776, | |
| "step": 4730 | |
| }, | |
| { | |
| "epoch": 3.03, | |
| "learning_rate": 0.00030287539936102236, | |
| "loss": 0.3064, | |
| "step": 4740 | |
| }, | |
| { | |
| "epoch": 3.04, | |
| "learning_rate": 0.0003035143769968051, | |
| "loss": 0.2736, | |
| "step": 4750 | |
| }, | |
| { | |
| "epoch": 3.04, | |
| "learning_rate": 0.0003041533546325879, | |
| "loss": 0.2906, | |
| "step": 4760 | |
| }, | |
| { | |
| "epoch": 3.05, | |
| "learning_rate": 0.0003047923322683706, | |
| "loss": 0.2766, | |
| "step": 4770 | |
| }, | |
| { | |
| "epoch": 3.05, | |
| "learning_rate": 0.00030543130990415333, | |
| "loss": 0.3055, | |
| "step": 4780 | |
| }, | |
| { | |
| "epoch": 3.06, | |
| "learning_rate": 0.0003060702875399361, | |
| "loss": 0.2889, | |
| "step": 4790 | |
| }, | |
| { | |
| "epoch": 3.07, | |
| "learning_rate": 0.00030670926517571885, | |
| "loss": 0.2952, | |
| "step": 4800 | |
| }, | |
| { | |
| "epoch": 3.07, | |
| "learning_rate": 0.0003073482428115016, | |
| "loss": 0.3135, | |
| "step": 4810 | |
| }, | |
| { | |
| "epoch": 3.08, | |
| "learning_rate": 0.00030798722044728436, | |
| "loss": 0.3029, | |
| "step": 4820 | |
| }, | |
| { | |
| "epoch": 3.09, | |
| "learning_rate": 0.0003086261980830671, | |
| "loss": 0.2786, | |
| "step": 4830 | |
| }, | |
| { | |
| "epoch": 3.09, | |
| "learning_rate": 0.0003092651757188498, | |
| "loss": 0.2854, | |
| "step": 4840 | |
| }, | |
| { | |
| "epoch": 3.1, | |
| "learning_rate": 0.00030990415335463255, | |
| "loss": 0.2851, | |
| "step": 4850 | |
| }, | |
| { | |
| "epoch": 3.11, | |
| "learning_rate": 0.0003105431309904154, | |
| "loss": 0.2715, | |
| "step": 4860 | |
| }, | |
| { | |
| "epoch": 3.11, | |
| "learning_rate": 0.0003111821086261981, | |
| "loss": 0.2966, | |
| "step": 4870 | |
| }, | |
| { | |
| "epoch": 3.12, | |
| "learning_rate": 0.00031182108626198084, | |
| "loss": 0.2524, | |
| "step": 4880 | |
| }, | |
| { | |
| "epoch": 3.12, | |
| "learning_rate": 0.0003124600638977636, | |
| "loss": 0.3158, | |
| "step": 4890 | |
| }, | |
| { | |
| "epoch": 3.13, | |
| "learning_rate": 0.00031309904153354636, | |
| "loss": 0.2955, | |
| "step": 4900 | |
| }, | |
| { | |
| "epoch": 3.14, | |
| "learning_rate": 0.0003137380191693291, | |
| "loss": 0.3291, | |
| "step": 4910 | |
| }, | |
| { | |
| "epoch": 3.14, | |
| "learning_rate": 0.0003143769968051118, | |
| "loss": 0.3231, | |
| "step": 4920 | |
| }, | |
| { | |
| "epoch": 3.15, | |
| "learning_rate": 0.0003150159744408946, | |
| "loss": 0.3137, | |
| "step": 4930 | |
| }, | |
| { | |
| "epoch": 3.16, | |
| "learning_rate": 0.0003156549520766773, | |
| "loss": 0.2828, | |
| "step": 4940 | |
| }, | |
| { | |
| "epoch": 3.16, | |
| "learning_rate": 0.00031629392971246006, | |
| "loss": 0.2963, | |
| "step": 4950 | |
| }, | |
| { | |
| "epoch": 3.17, | |
| "learning_rate": 0.00031693290734824284, | |
| "loss": 0.281, | |
| "step": 4960 | |
| }, | |
| { | |
| "epoch": 3.18, | |
| "learning_rate": 0.00031757188498402557, | |
| "loss": 0.2507, | |
| "step": 4970 | |
| }, | |
| { | |
| "epoch": 3.18, | |
| "learning_rate": 0.0003182108626198083, | |
| "loss": 0.2772, | |
| "step": 4980 | |
| }, | |
| { | |
| "epoch": 3.19, | |
| "learning_rate": 0.000318849840255591, | |
| "loss": 0.2989, | |
| "step": 4990 | |
| }, | |
| { | |
| "epoch": 3.19, | |
| "learning_rate": 0.0003194888178913738, | |
| "loss": 0.2848, | |
| "step": 5000 | |
| }, | |
| { | |
| "epoch": 3.2, | |
| "learning_rate": 0.00032012779552715654, | |
| "loss": 0.2925, | |
| "step": 5010 | |
| }, | |
| { | |
| "epoch": 3.21, | |
| "learning_rate": 0.00032076677316293927, | |
| "loss": 0.2756, | |
| "step": 5020 | |
| }, | |
| { | |
| "epoch": 3.21, | |
| "learning_rate": 0.00032140575079872205, | |
| "loss": 0.2793, | |
| "step": 5030 | |
| }, | |
| { | |
| "epoch": 3.22, | |
| "learning_rate": 0.0003220447284345048, | |
| "loss": 0.3096, | |
| "step": 5040 | |
| }, | |
| { | |
| "epoch": 3.23, | |
| "learning_rate": 0.0003226837060702875, | |
| "loss": 0.3056, | |
| "step": 5050 | |
| }, | |
| { | |
| "epoch": 3.23, | |
| "learning_rate": 0.0003233226837060703, | |
| "loss": 0.2636, | |
| "step": 5060 | |
| }, | |
| { | |
| "epoch": 3.24, | |
| "learning_rate": 0.0003239616613418531, | |
| "loss": 0.362, | |
| "step": 5070 | |
| }, | |
| { | |
| "epoch": 3.25, | |
| "learning_rate": 0.0003246006389776358, | |
| "loss": 0.294, | |
| "step": 5080 | |
| }, | |
| { | |
| "epoch": 3.25, | |
| "learning_rate": 0.00032523961661341854, | |
| "loss": 0.2913, | |
| "step": 5090 | |
| }, | |
| { | |
| "epoch": 3.26, | |
| "learning_rate": 0.0003258785942492013, | |
| "loss": 0.3018, | |
| "step": 5100 | |
| }, | |
| { | |
| "epoch": 3.27, | |
| "learning_rate": 0.00032651757188498405, | |
| "loss": 0.3096, | |
| "step": 5110 | |
| }, | |
| { | |
| "epoch": 3.27, | |
| "learning_rate": 0.0003271565495207668, | |
| "loss": 0.2857, | |
| "step": 5120 | |
| }, | |
| { | |
| "epoch": 3.28, | |
| "learning_rate": 0.0003277955271565495, | |
| "loss": 0.2586, | |
| "step": 5130 | |
| }, | |
| { | |
| "epoch": 3.28, | |
| "learning_rate": 0.0003284345047923323, | |
| "loss": 0.2943, | |
| "step": 5140 | |
| }, | |
| { | |
| "epoch": 3.29, | |
| "learning_rate": 0.000329073482428115, | |
| "loss": 0.2719, | |
| "step": 5150 | |
| }, | |
| { | |
| "epoch": 3.3, | |
| "learning_rate": 0.00032971246006389775, | |
| "loss": 0.2682, | |
| "step": 5160 | |
| }, | |
| { | |
| "epoch": 3.3, | |
| "learning_rate": 0.00033035143769968053, | |
| "loss": 0.2883, | |
| "step": 5170 | |
| }, | |
| { | |
| "epoch": 3.31, | |
| "learning_rate": 0.00033099041533546326, | |
| "loss": 0.286, | |
| "step": 5180 | |
| }, | |
| { | |
| "epoch": 3.32, | |
| "learning_rate": 0.000331629392971246, | |
| "loss": 0.3188, | |
| "step": 5190 | |
| }, | |
| { | |
| "epoch": 3.32, | |
| "learning_rate": 0.0003322683706070288, | |
| "loss": 0.2683, | |
| "step": 5200 | |
| }, | |
| { | |
| "epoch": 3.33, | |
| "learning_rate": 0.0003329073482428115, | |
| "loss": 0.2782, | |
| "step": 5210 | |
| }, | |
| { | |
| "epoch": 3.34, | |
| "learning_rate": 0.00033354632587859423, | |
| "loss": 0.2968, | |
| "step": 5220 | |
| }, | |
| { | |
| "epoch": 3.34, | |
| "learning_rate": 0.00033418530351437696, | |
| "loss": 0.2765, | |
| "step": 5230 | |
| }, | |
| { | |
| "epoch": 3.35, | |
| "learning_rate": 0.00033482428115015974, | |
| "loss": 0.2481, | |
| "step": 5240 | |
| }, | |
| { | |
| "epoch": 3.35, | |
| "learning_rate": 0.00033546325878594253, | |
| "loss": 0.301, | |
| "step": 5250 | |
| }, | |
| { | |
| "epoch": 3.36, | |
| "learning_rate": 0.00033610223642172526, | |
| "loss": 0.2576, | |
| "step": 5260 | |
| }, | |
| { | |
| "epoch": 3.37, | |
| "learning_rate": 0.00033674121405750804, | |
| "loss": 0.3013, | |
| "step": 5270 | |
| }, | |
| { | |
| "epoch": 3.37, | |
| "learning_rate": 0.00033738019169329077, | |
| "loss": 0.3062, | |
| "step": 5280 | |
| }, | |
| { | |
| "epoch": 3.38, | |
| "learning_rate": 0.0003380191693290735, | |
| "loss": 0.2969, | |
| "step": 5290 | |
| }, | |
| { | |
| "epoch": 3.39, | |
| "learning_rate": 0.00033865814696485623, | |
| "loss": 0.3039, | |
| "step": 5300 | |
| }, | |
| { | |
| "epoch": 3.39, | |
| "learning_rate": 0.000339297124600639, | |
| "loss": 0.2954, | |
| "step": 5310 | |
| }, | |
| { | |
| "epoch": 3.4, | |
| "learning_rate": 0.00033993610223642174, | |
| "loss": 0.2835, | |
| "step": 5320 | |
| }, | |
| { | |
| "epoch": 3.41, | |
| "learning_rate": 0.00034057507987220447, | |
| "loss": 0.3215, | |
| "step": 5330 | |
| }, | |
| { | |
| "epoch": 3.41, | |
| "learning_rate": 0.00034121405750798725, | |
| "loss": 0.2902, | |
| "step": 5340 | |
| }, | |
| { | |
| "epoch": 3.42, | |
| "learning_rate": 0.00034185303514377, | |
| "loss": 0.2957, | |
| "step": 5350 | |
| }, | |
| { | |
| "epoch": 3.42, | |
| "learning_rate": 0.0003424920127795527, | |
| "loss": 0.2844, | |
| "step": 5360 | |
| }, | |
| { | |
| "epoch": 3.43, | |
| "learning_rate": 0.00034313099041533544, | |
| "loss": 0.2502, | |
| "step": 5370 | |
| }, | |
| { | |
| "epoch": 3.44, | |
| "learning_rate": 0.0003437699680511182, | |
| "loss": 0.2757, | |
| "step": 5380 | |
| }, | |
| { | |
| "epoch": 3.44, | |
| "learning_rate": 0.00034440894568690095, | |
| "loss": 0.3069, | |
| "step": 5390 | |
| }, | |
| { | |
| "epoch": 3.45, | |
| "learning_rate": 0.0003450479233226837, | |
| "loss": 0.2948, | |
| "step": 5400 | |
| }, | |
| { | |
| "epoch": 3.46, | |
| "learning_rate": 0.00034568690095846647, | |
| "loss": 0.2886, | |
| "step": 5410 | |
| }, | |
| { | |
| "epoch": 3.46, | |
| "learning_rate": 0.0003463258785942492, | |
| "loss": 0.2625, | |
| "step": 5420 | |
| }, | |
| { | |
| "epoch": 3.47, | |
| "learning_rate": 0.0003469648562300319, | |
| "loss": 0.3224, | |
| "step": 5430 | |
| }, | |
| { | |
| "epoch": 3.48, | |
| "learning_rate": 0.00034760383386581465, | |
| "loss": 0.3151, | |
| "step": 5440 | |
| }, | |
| { | |
| "epoch": 3.48, | |
| "learning_rate": 0.0003482428115015975, | |
| "loss": 0.3082, | |
| "step": 5450 | |
| }, | |
| { | |
| "epoch": 3.49, | |
| "learning_rate": 0.0003488817891373802, | |
| "loss": 0.2851, | |
| "step": 5460 | |
| }, | |
| { | |
| "epoch": 3.5, | |
| "learning_rate": 0.00034952076677316295, | |
| "loss": 0.2495, | |
| "step": 5470 | |
| }, | |
| { | |
| "epoch": 3.5, | |
| "learning_rate": 0.00035015974440894573, | |
| "loss": 0.3161, | |
| "step": 5480 | |
| }, | |
| { | |
| "epoch": 3.51, | |
| "learning_rate": 0.00035079872204472846, | |
| "loss": 0.3085, | |
| "step": 5490 | |
| }, | |
| { | |
| "epoch": 3.51, | |
| "learning_rate": 0.0003514376996805112, | |
| "loss": 0.2806, | |
| "step": 5500 | |
| }, | |
| { | |
| "epoch": 3.52, | |
| "learning_rate": 0.0003520766773162939, | |
| "loss": 0.2427, | |
| "step": 5510 | |
| }, | |
| { | |
| "epoch": 3.53, | |
| "learning_rate": 0.0003527156549520767, | |
| "loss": 0.2567, | |
| "step": 5520 | |
| }, | |
| { | |
| "epoch": 3.53, | |
| "learning_rate": 0.00035335463258785943, | |
| "loss": 0.2581, | |
| "step": 5530 | |
| }, | |
| { | |
| "epoch": 3.54, | |
| "learning_rate": 0.00035399361022364216, | |
| "loss": 0.3021, | |
| "step": 5540 | |
| }, | |
| { | |
| "epoch": 3.55, | |
| "learning_rate": 0.00035463258785942495, | |
| "loss": 0.2633, | |
| "step": 5550 | |
| }, | |
| { | |
| "epoch": 3.55, | |
| "learning_rate": 0.0003552715654952077, | |
| "loss": 0.2753, | |
| "step": 5560 | |
| }, | |
| { | |
| "epoch": 3.56, | |
| "learning_rate": 0.0003559105431309904, | |
| "loss": 0.2755, | |
| "step": 5570 | |
| }, | |
| { | |
| "epoch": 3.57, | |
| "learning_rate": 0.0003565495207667732, | |
| "loss": 0.297, | |
| "step": 5580 | |
| }, | |
| { | |
| "epoch": 3.57, | |
| "learning_rate": 0.0003571884984025559, | |
| "loss": 0.2739, | |
| "step": 5590 | |
| }, | |
| { | |
| "epoch": 3.58, | |
| "learning_rate": 0.00035782747603833865, | |
| "loss": 0.2994, | |
| "step": 5600 | |
| }, | |
| { | |
| "epoch": 3.58, | |
| "learning_rate": 0.0003584664536741214, | |
| "loss": 0.3026, | |
| "step": 5610 | |
| }, | |
| { | |
| "epoch": 3.59, | |
| "learning_rate": 0.00035910543130990416, | |
| "loss": 0.2724, | |
| "step": 5620 | |
| }, | |
| { | |
| "epoch": 3.6, | |
| "learning_rate": 0.0003597444089456869, | |
| "loss": 0.2863, | |
| "step": 5630 | |
| }, | |
| { | |
| "epoch": 3.6, | |
| "learning_rate": 0.0003603833865814696, | |
| "loss": 0.3245, | |
| "step": 5640 | |
| }, | |
| { | |
| "epoch": 3.61, | |
| "learning_rate": 0.00036102236421725245, | |
| "loss": 0.2751, | |
| "step": 5650 | |
| }, | |
| { | |
| "epoch": 3.62, | |
| "learning_rate": 0.0003616613418530352, | |
| "loss": 0.2783, | |
| "step": 5660 | |
| }, | |
| { | |
| "epoch": 3.62, | |
| "learning_rate": 0.0003623003194888179, | |
| "loss": 0.3159, | |
| "step": 5670 | |
| }, | |
| { | |
| "epoch": 3.63, | |
| "learning_rate": 0.00036293929712460064, | |
| "loss": 0.3649, | |
| "step": 5680 | |
| }, | |
| { | |
| "epoch": 3.64, | |
| "learning_rate": 0.0003635782747603834, | |
| "loss": 0.2486, | |
| "step": 5690 | |
| }, | |
| { | |
| "epoch": 3.64, | |
| "learning_rate": 0.00036421725239616615, | |
| "loss": 0.319, | |
| "step": 5700 | |
| }, | |
| { | |
| "epoch": 3.65, | |
| "learning_rate": 0.0003648562300319489, | |
| "loss": 0.2897, | |
| "step": 5710 | |
| }, | |
| { | |
| "epoch": 3.65, | |
| "learning_rate": 0.00036549520766773167, | |
| "loss": 0.2648, | |
| "step": 5720 | |
| }, | |
| { | |
| "epoch": 3.66, | |
| "learning_rate": 0.0003661341853035144, | |
| "loss": 0.3063, | |
| "step": 5730 | |
| }, | |
| { | |
| "epoch": 3.67, | |
| "learning_rate": 0.0003667731629392971, | |
| "loss": 0.2459, | |
| "step": 5740 | |
| }, | |
| { | |
| "epoch": 3.67, | |
| "learning_rate": 0.00036741214057507985, | |
| "loss": 0.3034, | |
| "step": 5750 | |
| }, | |
| { | |
| "epoch": 3.68, | |
| "learning_rate": 0.00036805111821086264, | |
| "loss": 0.2805, | |
| "step": 5760 | |
| }, | |
| { | |
| "epoch": 3.69, | |
| "learning_rate": 0.00036869009584664537, | |
| "loss": 0.2748, | |
| "step": 5770 | |
| }, | |
| { | |
| "epoch": 3.69, | |
| "learning_rate": 0.0003693290734824281, | |
| "loss": 0.2738, | |
| "step": 5780 | |
| }, | |
| { | |
| "epoch": 3.7, | |
| "learning_rate": 0.0003699680511182109, | |
| "loss": 0.2739, | |
| "step": 5790 | |
| }, | |
| { | |
| "epoch": 3.71, | |
| "learning_rate": 0.0003706070287539936, | |
| "loss": 0.3178, | |
| "step": 5800 | |
| }, | |
| { | |
| "epoch": 3.71, | |
| "learning_rate": 0.00037124600638977634, | |
| "loss": 0.2705, | |
| "step": 5810 | |
| }, | |
| { | |
| "epoch": 3.72, | |
| "learning_rate": 0.00037188498402555907, | |
| "loss": 0.3111, | |
| "step": 5820 | |
| }, | |
| { | |
| "epoch": 3.73, | |
| "learning_rate": 0.00037252396166134185, | |
| "loss": 0.2781, | |
| "step": 5830 | |
| }, | |
| { | |
| "epoch": 3.73, | |
| "learning_rate": 0.0003731629392971246, | |
| "loss": 0.2899, | |
| "step": 5840 | |
| }, | |
| { | |
| "epoch": 3.74, | |
| "learning_rate": 0.00037380191693290736, | |
| "loss": 0.316, | |
| "step": 5850 | |
| }, | |
| { | |
| "epoch": 3.74, | |
| "learning_rate": 0.00037444089456869015, | |
| "loss": 0.3097, | |
| "step": 5860 | |
| }, | |
| { | |
| "epoch": 3.75, | |
| "learning_rate": 0.0003750798722044729, | |
| "loss": 0.2693, | |
| "step": 5870 | |
| }, | |
| { | |
| "epoch": 3.76, | |
| "learning_rate": 0.0003757188498402556, | |
| "loss": 0.2846, | |
| "step": 5880 | |
| }, | |
| { | |
| "epoch": 3.76, | |
| "learning_rate": 0.00037635782747603833, | |
| "loss": 0.2892, | |
| "step": 5890 | |
| }, | |
| { | |
| "epoch": 3.77, | |
| "learning_rate": 0.0003769968051118211, | |
| "loss": 0.313, | |
| "step": 5900 | |
| }, | |
| { | |
| "epoch": 3.78, | |
| "learning_rate": 0.00037763578274760385, | |
| "loss": 0.2979, | |
| "step": 5910 | |
| }, | |
| { | |
| "epoch": 3.78, | |
| "learning_rate": 0.0003782747603833866, | |
| "loss": 0.2734, | |
| "step": 5920 | |
| }, | |
| { | |
| "epoch": 3.79, | |
| "learning_rate": 0.00037891373801916936, | |
| "loss": 0.2706, | |
| "step": 5930 | |
| }, | |
| { | |
| "epoch": 3.8, | |
| "learning_rate": 0.0003795527156549521, | |
| "loss": 0.2963, | |
| "step": 5940 | |
| }, | |
| { | |
| "epoch": 3.8, | |
| "learning_rate": 0.0003801916932907348, | |
| "loss": 0.2532, | |
| "step": 5950 | |
| }, | |
| { | |
| "epoch": 3.81, | |
| "learning_rate": 0.0003808306709265176, | |
| "loss": 0.3183, | |
| "step": 5960 | |
| }, | |
| { | |
| "epoch": 3.81, | |
| "learning_rate": 0.00038146964856230033, | |
| "loss": 0.3032, | |
| "step": 5970 | |
| }, | |
| { | |
| "epoch": 3.82, | |
| "learning_rate": 0.00038210862619808306, | |
| "loss": 0.3129, | |
| "step": 5980 | |
| }, | |
| { | |
| "epoch": 3.83, | |
| "learning_rate": 0.0003827476038338658, | |
| "loss": 0.267, | |
| "step": 5990 | |
| }, | |
| { | |
| "epoch": 3.83, | |
| "learning_rate": 0.00038338658146964857, | |
| "loss": 0.2766, | |
| "step": 6000 | |
| }, | |
| { | |
| "epoch": 3.84, | |
| "learning_rate": 0.0003840255591054313, | |
| "loss": 0.2861, | |
| "step": 6010 | |
| }, | |
| { | |
| "epoch": 3.85, | |
| "learning_rate": 0.00038466453674121403, | |
| "loss": 0.2807, | |
| "step": 6020 | |
| }, | |
| { | |
| "epoch": 3.85, | |
| "learning_rate": 0.0003853035143769968, | |
| "loss": 0.3118, | |
| "step": 6030 | |
| }, | |
| { | |
| "epoch": 3.86, | |
| "learning_rate": 0.00038594249201277954, | |
| "loss": 0.286, | |
| "step": 6040 | |
| }, | |
| { | |
| "epoch": 3.87, | |
| "learning_rate": 0.0003865814696485623, | |
| "loss": 0.2676, | |
| "step": 6050 | |
| }, | |
| { | |
| "epoch": 3.87, | |
| "learning_rate": 0.00038722044728434506, | |
| "loss": 0.3028, | |
| "step": 6060 | |
| }, | |
| { | |
| "epoch": 3.88, | |
| "learning_rate": 0.00038785942492012784, | |
| "loss": 0.2564, | |
| "step": 6070 | |
| }, | |
| { | |
| "epoch": 3.88, | |
| "learning_rate": 0.00038849840255591057, | |
| "loss": 0.2974, | |
| "step": 6080 | |
| }, | |
| { | |
| "epoch": 3.89, | |
| "learning_rate": 0.0003891373801916933, | |
| "loss": 0.2727, | |
| "step": 6090 | |
| }, | |
| { | |
| "epoch": 3.9, | |
| "learning_rate": 0.0003897763578274761, | |
| "loss": 0.2673, | |
| "step": 6100 | |
| }, | |
| { | |
| "epoch": 3.9, | |
| "learning_rate": 0.0003904153354632588, | |
| "loss": 0.27, | |
| "step": 6110 | |
| }, | |
| { | |
| "epoch": 3.91, | |
| "learning_rate": 0.00039105431309904154, | |
| "loss": 0.2758, | |
| "step": 6120 | |
| }, | |
| { | |
| "epoch": 3.92, | |
| "learning_rate": 0.00039169329073482427, | |
| "loss": 0.2891, | |
| "step": 6130 | |
| }, | |
| { | |
| "epoch": 3.92, | |
| "learning_rate": 0.00039233226837060705, | |
| "loss": 0.2904, | |
| "step": 6140 | |
| }, | |
| { | |
| "epoch": 3.93, | |
| "learning_rate": 0.0003929712460063898, | |
| "loss": 0.3009, | |
| "step": 6150 | |
| }, | |
| { | |
| "epoch": 3.94, | |
| "learning_rate": 0.0003936102236421725, | |
| "loss": 0.314, | |
| "step": 6160 | |
| }, | |
| { | |
| "epoch": 3.94, | |
| "learning_rate": 0.0003942492012779553, | |
| "loss": 0.289, | |
| "step": 6170 | |
| }, | |
| { | |
| "epoch": 3.95, | |
| "learning_rate": 0.000394888178913738, | |
| "loss": 0.3163, | |
| "step": 6180 | |
| }, | |
| { | |
| "epoch": 3.95, | |
| "learning_rate": 0.00039552715654952075, | |
| "loss": 0.2605, | |
| "step": 6190 | |
| }, | |
| { | |
| "epoch": 3.96, | |
| "learning_rate": 0.0003961661341853035, | |
| "loss": 0.2758, | |
| "step": 6200 | |
| }, | |
| { | |
| "epoch": 3.97, | |
| "learning_rate": 0.00039680511182108626, | |
| "loss": 0.3064, | |
| "step": 6210 | |
| }, | |
| { | |
| "epoch": 3.97, | |
| "learning_rate": 0.000397444089456869, | |
| "loss": 0.2991, | |
| "step": 6220 | |
| }, | |
| { | |
| "epoch": 3.98, | |
| "learning_rate": 0.0003980830670926517, | |
| "loss": 0.307, | |
| "step": 6230 | |
| }, | |
| { | |
| "epoch": 3.99, | |
| "learning_rate": 0.0003987220447284345, | |
| "loss": 0.285, | |
| "step": 6240 | |
| }, | |
| { | |
| "epoch": 3.99, | |
| "learning_rate": 0.0003993610223642173, | |
| "loss": 0.2797, | |
| "step": 6250 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "learning_rate": 0.0004, | |
| "loss": 0.2737, | |
| "step": 6260 | |
| }, | |
| { | |
| "epoch": 4.01, | |
| "learning_rate": 0.00040063897763578275, | |
| "loss": 0.2392, | |
| "step": 6270 | |
| }, | |
| { | |
| "epoch": 4.01, | |
| "learning_rate": 0.00040127795527156553, | |
| "loss": 0.2275, | |
| "step": 6280 | |
| }, | |
| { | |
| "epoch": 4.02, | |
| "learning_rate": 0.00040191693290734826, | |
| "loss": 0.2617, | |
| "step": 6290 | |
| }, | |
| { | |
| "epoch": 4.03, | |
| "learning_rate": 0.000402555910543131, | |
| "loss": 0.2528, | |
| "step": 6300 | |
| }, | |
| { | |
| "epoch": 4.03, | |
| "learning_rate": 0.0004031948881789138, | |
| "loss": 0.2262, | |
| "step": 6310 | |
| }, | |
| { | |
| "epoch": 4.04, | |
| "learning_rate": 0.0004038338658146965, | |
| "loss": 0.259, | |
| "step": 6320 | |
| }, | |
| { | |
| "epoch": 4.04, | |
| "learning_rate": 0.00040447284345047923, | |
| "loss": 0.2519, | |
| "step": 6330 | |
| }, | |
| { | |
| "epoch": 4.05, | |
| "learning_rate": 0.000405111821086262, | |
| "loss": 0.2259, | |
| "step": 6340 | |
| }, | |
| { | |
| "epoch": 4.06, | |
| "learning_rate": 0.00040575079872204474, | |
| "loss": 0.2386, | |
| "step": 6350 | |
| }, | |
| { | |
| "epoch": 4.06, | |
| "learning_rate": 0.0004063897763578275, | |
| "loss": 0.2217, | |
| "step": 6360 | |
| }, | |
| { | |
| "epoch": 4.07, | |
| "learning_rate": 0.0004070287539936102, | |
| "loss": 0.2309, | |
| "step": 6370 | |
| }, | |
| { | |
| "epoch": 4.08, | |
| "learning_rate": 0.000407667731629393, | |
| "loss": 0.211, | |
| "step": 6380 | |
| }, | |
| { | |
| "epoch": 4.08, | |
| "learning_rate": 0.0004083067092651757, | |
| "loss": 0.2459, | |
| "step": 6390 | |
| }, | |
| { | |
| "epoch": 4.09, | |
| "learning_rate": 0.00040894568690095844, | |
| "loss": 0.2603, | |
| "step": 6400 | |
| }, | |
| { | |
| "epoch": 4.1, | |
| "learning_rate": 0.00040958466453674123, | |
| "loss": 0.2343, | |
| "step": 6410 | |
| }, | |
| { | |
| "epoch": 4.1, | |
| "learning_rate": 0.00041022364217252396, | |
| "loss": 0.2562, | |
| "step": 6420 | |
| }, | |
| { | |
| "epoch": 4.11, | |
| "learning_rate": 0.0004108626198083067, | |
| "loss": 0.2148, | |
| "step": 6430 | |
| }, | |
| { | |
| "epoch": 4.11, | |
| "learning_rate": 0.00041150159744408947, | |
| "loss": 0.2349, | |
| "step": 6440 | |
| }, | |
| { | |
| "epoch": 4.12, | |
| "learning_rate": 0.00041214057507987225, | |
| "loss": 0.2975, | |
| "step": 6450 | |
| }, | |
| { | |
| "epoch": 4.13, | |
| "learning_rate": 0.000412779552715655, | |
| "loss": 0.2541, | |
| "step": 6460 | |
| }, | |
| { | |
| "epoch": 4.13, | |
| "learning_rate": 0.0004134185303514377, | |
| "loss": 0.2555, | |
| "step": 6470 | |
| }, | |
| { | |
| "epoch": 4.14, | |
| "learning_rate": 0.0004140575079872205, | |
| "loss": 0.2818, | |
| "step": 6480 | |
| }, | |
| { | |
| "epoch": 4.15, | |
| "learning_rate": 0.0004146964856230032, | |
| "loss": 0.2577, | |
| "step": 6490 | |
| }, | |
| { | |
| "epoch": 4.15, | |
| "learning_rate": 0.00041533546325878595, | |
| "loss": 0.2433, | |
| "step": 6500 | |
| }, | |
| { | |
| "epoch": 4.16, | |
| "learning_rate": 0.0004159744408945687, | |
| "loss": 0.2231, | |
| "step": 6510 | |
| }, | |
| { | |
| "epoch": 4.17, | |
| "learning_rate": 0.00041661341853035147, | |
| "loss": 0.2841, | |
| "step": 6520 | |
| }, | |
| { | |
| "epoch": 4.17, | |
| "learning_rate": 0.0004172523961661342, | |
| "loss": 0.2048, | |
| "step": 6530 | |
| }, | |
| { | |
| "epoch": 4.18, | |
| "learning_rate": 0.0004178913738019169, | |
| "loss": 0.2484, | |
| "step": 6540 | |
| }, | |
| { | |
| "epoch": 4.19, | |
| "learning_rate": 0.0004185303514376997, | |
| "loss": 0.2542, | |
| "step": 6550 | |
| }, | |
| { | |
| "epoch": 4.19, | |
| "learning_rate": 0.00041916932907348244, | |
| "loss": 0.2293, | |
| "step": 6560 | |
| }, | |
| { | |
| "epoch": 4.2, | |
| "learning_rate": 0.00041980830670926517, | |
| "loss": 0.2545, | |
| "step": 6570 | |
| }, | |
| { | |
| "epoch": 4.2, | |
| "learning_rate": 0.0004204472843450479, | |
| "loss": 0.2565, | |
| "step": 6580 | |
| }, | |
| { | |
| "epoch": 4.21, | |
| "learning_rate": 0.0004210862619808307, | |
| "loss": 0.2441, | |
| "step": 6590 | |
| }, | |
| { | |
| "epoch": 4.22, | |
| "learning_rate": 0.0004217252396166134, | |
| "loss": 0.2623, | |
| "step": 6600 | |
| }, | |
| { | |
| "epoch": 4.22, | |
| "learning_rate": 0.00042236421725239614, | |
| "loss": 0.2542, | |
| "step": 6610 | |
| }, | |
| { | |
| "epoch": 4.23, | |
| "learning_rate": 0.0004230031948881789, | |
| "loss": 0.2368, | |
| "step": 6620 | |
| }, | |
| { | |
| "epoch": 4.24, | |
| "learning_rate": 0.00042364217252396165, | |
| "loss": 0.2683, | |
| "step": 6630 | |
| }, | |
| { | |
| "epoch": 4.24, | |
| "learning_rate": 0.00042428115015974443, | |
| "loss": 0.2468, | |
| "step": 6640 | |
| }, | |
| { | |
| "epoch": 4.25, | |
| "learning_rate": 0.00042492012779552716, | |
| "loss": 0.226, | |
| "step": 6650 | |
| }, | |
| { | |
| "epoch": 4.26, | |
| "learning_rate": 0.00042555910543130995, | |
| "loss": 0.2362, | |
| "step": 6660 | |
| }, | |
| { | |
| "epoch": 4.26, | |
| "learning_rate": 0.0004261980830670927, | |
| "loss": 0.2606, | |
| "step": 6670 | |
| }, | |
| { | |
| "epoch": 4.27, | |
| "learning_rate": 0.0004268370607028754, | |
| "loss": 0.2436, | |
| "step": 6680 | |
| }, | |
| { | |
| "epoch": 4.27, | |
| "learning_rate": 0.0004274760383386582, | |
| "loss": 0.2501, | |
| "step": 6690 | |
| }, | |
| { | |
| "epoch": 4.28, | |
| "learning_rate": 0.0004281150159744409, | |
| "loss": 0.2367, | |
| "step": 6700 | |
| }, | |
| { | |
| "epoch": 4.29, | |
| "learning_rate": 0.00042875399361022365, | |
| "loss": 0.248, | |
| "step": 6710 | |
| }, | |
| { | |
| "epoch": 4.29, | |
| "learning_rate": 0.00042939297124600643, | |
| "loss": 0.2475, | |
| "step": 6720 | |
| }, | |
| { | |
| "epoch": 4.3, | |
| "learning_rate": 0.00043003194888178916, | |
| "loss": 0.2544, | |
| "step": 6730 | |
| }, | |
| { | |
| "epoch": 4.31, | |
| "learning_rate": 0.0004306709265175719, | |
| "loss": 0.2127, | |
| "step": 6740 | |
| }, | |
| { | |
| "epoch": 4.31, | |
| "learning_rate": 0.0004313099041533546, | |
| "loss": 0.2495, | |
| "step": 6750 | |
| }, | |
| { | |
| "epoch": 4.32, | |
| "learning_rate": 0.0004319488817891374, | |
| "loss": 0.2434, | |
| "step": 6760 | |
| }, | |
| { | |
| "epoch": 4.33, | |
| "learning_rate": 0.00043258785942492013, | |
| "loss": 0.2641, | |
| "step": 6770 | |
| }, | |
| { | |
| "epoch": 4.33, | |
| "learning_rate": 0.00043322683706070286, | |
| "loss": 0.2549, | |
| "step": 6780 | |
| }, | |
| { | |
| "epoch": 4.34, | |
| "learning_rate": 0.00043386581469648564, | |
| "loss": 0.2748, | |
| "step": 6790 | |
| }, | |
| { | |
| "epoch": 4.34, | |
| "learning_rate": 0.00043450479233226837, | |
| "loss": 0.2991, | |
| "step": 6800 | |
| }, | |
| { | |
| "epoch": 4.35, | |
| "learning_rate": 0.0004351437699680511, | |
| "loss": 0.2217, | |
| "step": 6810 | |
| }, | |
| { | |
| "epoch": 4.36, | |
| "learning_rate": 0.00043578274760383383, | |
| "loss": 0.2307, | |
| "step": 6820 | |
| }, | |
| { | |
| "epoch": 4.36, | |
| "learning_rate": 0.0004364217252396166, | |
| "loss": 0.234, | |
| "step": 6830 | |
| }, | |
| { | |
| "epoch": 4.37, | |
| "learning_rate": 0.0004370607028753994, | |
| "loss": 0.2637, | |
| "step": 6840 | |
| }, | |
| { | |
| "epoch": 4.38, | |
| "learning_rate": 0.0004376996805111821, | |
| "loss": 0.2285, | |
| "step": 6850 | |
| }, | |
| { | |
| "epoch": 4.38, | |
| "learning_rate": 0.0004383386581469649, | |
| "loss": 0.2585, | |
| "step": 6860 | |
| }, | |
| { | |
| "epoch": 4.39, | |
| "learning_rate": 0.00043897763578274764, | |
| "loss": 0.2358, | |
| "step": 6870 | |
| }, | |
| { | |
| "epoch": 4.4, | |
| "learning_rate": 0.00043961661341853037, | |
| "loss": 0.246, | |
| "step": 6880 | |
| }, | |
| { | |
| "epoch": 4.4, | |
| "learning_rate": 0.0004402555910543131, | |
| "loss": 0.2672, | |
| "step": 6890 | |
| }, | |
| { | |
| "epoch": 4.41, | |
| "learning_rate": 0.0004408945686900959, | |
| "loss": 0.2606, | |
| "step": 6900 | |
| }, | |
| { | |
| "epoch": 4.42, | |
| "learning_rate": 0.0004415335463258786, | |
| "loss": 0.2397, | |
| "step": 6910 | |
| }, | |
| { | |
| "epoch": 4.42, | |
| "learning_rate": 0.00044217252396166134, | |
| "loss": 0.2539, | |
| "step": 6920 | |
| }, | |
| { | |
| "epoch": 4.43, | |
| "learning_rate": 0.0004428115015974441, | |
| "loss": 0.2348, | |
| "step": 6930 | |
| }, | |
| { | |
| "epoch": 4.43, | |
| "learning_rate": 0.00044345047923322685, | |
| "loss": 0.2845, | |
| "step": 6940 | |
| }, | |
| { | |
| "epoch": 4.44, | |
| "learning_rate": 0.0004440894568690096, | |
| "loss": 0.2402, | |
| "step": 6950 | |
| }, | |
| { | |
| "epoch": 4.45, | |
| "learning_rate": 0.0004447284345047923, | |
| "loss": 0.2678, | |
| "step": 6960 | |
| }, | |
| { | |
| "epoch": 4.45, | |
| "learning_rate": 0.0004453674121405751, | |
| "loss": 0.2653, | |
| "step": 6970 | |
| }, | |
| { | |
| "epoch": 4.46, | |
| "learning_rate": 0.0004460063897763578, | |
| "loss": 0.2813, | |
| "step": 6980 | |
| }, | |
| { | |
| "epoch": 4.47, | |
| "learning_rate": 0.00044664536741214055, | |
| "loss": 0.262, | |
| "step": 6990 | |
| }, | |
| { | |
| "epoch": 4.47, | |
| "learning_rate": 0.00044728434504792333, | |
| "loss": 0.2247, | |
| "step": 7000 | |
| }, | |
| { | |
| "epoch": 4.48, | |
| "learning_rate": 0.00044792332268370606, | |
| "loss": 0.2547, | |
| "step": 7010 | |
| }, | |
| { | |
| "epoch": 4.49, | |
| "learning_rate": 0.0004485623003194888, | |
| "loss": 0.2627, | |
| "step": 7020 | |
| }, | |
| { | |
| "epoch": 4.49, | |
| "learning_rate": 0.0004492012779552715, | |
| "loss": 0.277, | |
| "step": 7030 | |
| }, | |
| { | |
| "epoch": 4.5, | |
| "learning_rate": 0.00044984025559105436, | |
| "loss": 0.2467, | |
| "step": 7040 | |
| }, | |
| { | |
| "epoch": 4.5, | |
| "learning_rate": 0.0004504792332268371, | |
| "loss": 0.2437, | |
| "step": 7050 | |
| }, | |
| { | |
| "epoch": 4.51, | |
| "learning_rate": 0.0004511182108626198, | |
| "loss": 0.2605, | |
| "step": 7060 | |
| }, | |
| { | |
| "epoch": 4.52, | |
| "learning_rate": 0.0004517571884984026, | |
| "loss": 0.2649, | |
| "step": 7070 | |
| }, | |
| { | |
| "epoch": 4.52, | |
| "learning_rate": 0.00045239616613418533, | |
| "loss": 0.283, | |
| "step": 7080 | |
| }, | |
| { | |
| "epoch": 4.53, | |
| "learning_rate": 0.00045303514376996806, | |
| "loss": 0.2337, | |
| "step": 7090 | |
| }, | |
| { | |
| "epoch": 4.54, | |
| "learning_rate": 0.00045367412140575084, | |
| "loss": 0.2756, | |
| "step": 7100 | |
| }, | |
| { | |
| "epoch": 4.54, | |
| "learning_rate": 0.00045431309904153357, | |
| "loss": 0.2699, | |
| "step": 7110 | |
| }, | |
| { | |
| "epoch": 4.55, | |
| "learning_rate": 0.0004549520766773163, | |
| "loss": 0.2649, | |
| "step": 7120 | |
| }, | |
| { | |
| "epoch": 4.56, | |
| "learning_rate": 0.00045559105431309903, | |
| "loss": 0.2685, | |
| "step": 7130 | |
| }, | |
| { | |
| "epoch": 4.56, | |
| "learning_rate": 0.0004562300319488818, | |
| "loss": 0.2451, | |
| "step": 7140 | |
| }, | |
| { | |
| "epoch": 4.57, | |
| "learning_rate": 0.00045686900958466454, | |
| "loss": 0.2614, | |
| "step": 7150 | |
| }, | |
| { | |
| "epoch": 4.57, | |
| "learning_rate": 0.00045750798722044727, | |
| "loss": 0.2484, | |
| "step": 7160 | |
| }, | |
| { | |
| "epoch": 4.58, | |
| "learning_rate": 0.00045814696485623006, | |
| "loss": 0.2642, | |
| "step": 7170 | |
| }, | |
| { | |
| "epoch": 4.59, | |
| "learning_rate": 0.0004587859424920128, | |
| "loss": 0.2413, | |
| "step": 7180 | |
| }, | |
| { | |
| "epoch": 4.59, | |
| "learning_rate": 0.0004594249201277955, | |
| "loss": 0.2324, | |
| "step": 7190 | |
| }, | |
| { | |
| "epoch": 4.6, | |
| "learning_rate": 0.00046006389776357824, | |
| "loss": 0.2632, | |
| "step": 7200 | |
| }, | |
| { | |
| "epoch": 4.61, | |
| "learning_rate": 0.000460702875399361, | |
| "loss": 0.2472, | |
| "step": 7210 | |
| }, | |
| { | |
| "epoch": 4.61, | |
| "learning_rate": 0.00046134185303514376, | |
| "loss": 0.276, | |
| "step": 7220 | |
| }, | |
| { | |
| "epoch": 4.62, | |
| "learning_rate": 0.0004619808306709265, | |
| "loss": 0.2647, | |
| "step": 7230 | |
| }, | |
| { | |
| "epoch": 4.63, | |
| "learning_rate": 0.0004626198083067093, | |
| "loss": 0.2409, | |
| "step": 7240 | |
| }, | |
| { | |
| "epoch": 4.63, | |
| "learning_rate": 0.00046325878594249205, | |
| "loss": 0.2568, | |
| "step": 7250 | |
| }, | |
| { | |
| "epoch": 4.64, | |
| "learning_rate": 0.0004638977635782748, | |
| "loss": 0.2856, | |
| "step": 7260 | |
| }, | |
| { | |
| "epoch": 4.65, | |
| "learning_rate": 0.0004645367412140575, | |
| "loss": 0.249, | |
| "step": 7270 | |
| }, | |
| { | |
| "epoch": 4.65, | |
| "learning_rate": 0.0004651757188498403, | |
| "loss": 0.2779, | |
| "step": 7280 | |
| }, | |
| { | |
| "epoch": 4.66, | |
| "learning_rate": 0.000465814696485623, | |
| "loss": 0.2317, | |
| "step": 7290 | |
| }, | |
| { | |
| "epoch": 4.66, | |
| "learning_rate": 0.00046645367412140575, | |
| "loss": 0.2889, | |
| "step": 7300 | |
| }, | |
| { | |
| "epoch": 4.67, | |
| "learning_rate": 0.00046709265175718854, | |
| "loss": 0.2711, | |
| "step": 7310 | |
| }, | |
| { | |
| "epoch": 4.68, | |
| "learning_rate": 0.00046773162939297126, | |
| "loss": 0.2467, | |
| "step": 7320 | |
| }, | |
| { | |
| "epoch": 4.68, | |
| "learning_rate": 0.000468370607028754, | |
| "loss": 0.2422, | |
| "step": 7330 | |
| }, | |
| { | |
| "epoch": 4.69, | |
| "learning_rate": 0.0004690095846645367, | |
| "loss": 0.2018, | |
| "step": 7340 | |
| }, | |
| { | |
| "epoch": 4.7, | |
| "learning_rate": 0.0004696485623003195, | |
| "loss": 0.2285, | |
| "step": 7350 | |
| }, | |
| { | |
| "epoch": 4.7, | |
| "learning_rate": 0.00047028753993610224, | |
| "loss": 0.2277, | |
| "step": 7360 | |
| }, | |
| { | |
| "epoch": 4.71, | |
| "learning_rate": 0.00047092651757188496, | |
| "loss": 0.2734, | |
| "step": 7370 | |
| }, | |
| { | |
| "epoch": 4.72, | |
| "learning_rate": 0.00047156549520766775, | |
| "loss": 0.2438, | |
| "step": 7380 | |
| }, | |
| { | |
| "epoch": 4.72, | |
| "learning_rate": 0.0004722044728434505, | |
| "loss": 0.2769, | |
| "step": 7390 | |
| }, | |
| { | |
| "epoch": 4.73, | |
| "learning_rate": 0.0004728434504792332, | |
| "loss": 0.2448, | |
| "step": 7400 | |
| }, | |
| { | |
| "epoch": 4.73, | |
| "learning_rate": 0.00047348242811501594, | |
| "loss": 0.2272, | |
| "step": 7410 | |
| }, | |
| { | |
| "epoch": 4.74, | |
| "learning_rate": 0.0004741214057507987, | |
| "loss": 0.2935, | |
| "step": 7420 | |
| }, | |
| { | |
| "epoch": 4.75, | |
| "learning_rate": 0.0004747603833865815, | |
| "loss": 0.2244, | |
| "step": 7430 | |
| }, | |
| { | |
| "epoch": 4.75, | |
| "learning_rate": 0.00047539936102236423, | |
| "loss": 0.2567, | |
| "step": 7440 | |
| }, | |
| { | |
| "epoch": 4.76, | |
| "learning_rate": 0.000476038338658147, | |
| "loss": 0.2725, | |
| "step": 7450 | |
| }, | |
| { | |
| "epoch": 4.77, | |
| "learning_rate": 0.00047667731629392974, | |
| "loss": 0.2912, | |
| "step": 7460 | |
| }, | |
| { | |
| "epoch": 4.77, | |
| "learning_rate": 0.0004773162939297125, | |
| "loss": 0.2618, | |
| "step": 7470 | |
| }, | |
| { | |
| "epoch": 4.78, | |
| "learning_rate": 0.00047795527156549526, | |
| "loss": 0.2646, | |
| "step": 7480 | |
| }, | |
| { | |
| "epoch": 4.79, | |
| "learning_rate": 0.000478594249201278, | |
| "loss": 0.2548, | |
| "step": 7490 | |
| }, | |
| { | |
| "epoch": 4.79, | |
| "learning_rate": 0.0004792332268370607, | |
| "loss": 0.2626, | |
| "step": 7500 | |
| }, | |
| { | |
| "epoch": 4.8, | |
| "learning_rate": 0.00047987220447284344, | |
| "loss": 0.2671, | |
| "step": 7510 | |
| }, | |
| { | |
| "epoch": 4.8, | |
| "learning_rate": 0.00048051118210862623, | |
| "loss": 0.2704, | |
| "step": 7520 | |
| }, | |
| { | |
| "epoch": 4.81, | |
| "learning_rate": 0.00048115015974440896, | |
| "loss": 0.2659, | |
| "step": 7530 | |
| }, | |
| { | |
| "epoch": 4.82, | |
| "learning_rate": 0.0004817891373801917, | |
| "loss": 0.2804, | |
| "step": 7540 | |
| }, | |
| { | |
| "epoch": 4.82, | |
| "learning_rate": 0.00048242811501597447, | |
| "loss": 0.2503, | |
| "step": 7550 | |
| }, | |
| { | |
| "epoch": 4.83, | |
| "learning_rate": 0.0004830670926517572, | |
| "loss": 0.2489, | |
| "step": 7560 | |
| }, | |
| { | |
| "epoch": 4.84, | |
| "learning_rate": 0.00048370607028753993, | |
| "loss": 0.2837, | |
| "step": 7570 | |
| }, | |
| { | |
| "epoch": 4.84, | |
| "learning_rate": 0.00048434504792332266, | |
| "loss": 0.2364, | |
| "step": 7580 | |
| }, | |
| { | |
| "epoch": 4.85, | |
| "learning_rate": 0.00048498402555910544, | |
| "loss": 0.2508, | |
| "step": 7590 | |
| }, | |
| { | |
| "epoch": 4.86, | |
| "learning_rate": 0.00048562300319488817, | |
| "loss": 0.2279, | |
| "step": 7600 | |
| }, | |
| { | |
| "epoch": 4.86, | |
| "learning_rate": 0.0004862619808306709, | |
| "loss": 0.2174, | |
| "step": 7610 | |
| }, | |
| { | |
| "epoch": 4.87, | |
| "learning_rate": 0.0004869009584664537, | |
| "loss": 0.2837, | |
| "step": 7620 | |
| }, | |
| { | |
| "epoch": 4.88, | |
| "learning_rate": 0.00048753993610223647, | |
| "loss": 0.2414, | |
| "step": 7630 | |
| }, | |
| { | |
| "epoch": 4.88, | |
| "learning_rate": 0.0004881789137380192, | |
| "loss": 0.2452, | |
| "step": 7640 | |
| }, | |
| { | |
| "epoch": 4.89, | |
| "learning_rate": 0.0004888178913738019, | |
| "loss": 0.2854, | |
| "step": 7650 | |
| }, | |
| { | |
| "epoch": 4.89, | |
| "learning_rate": 0.0004894568690095847, | |
| "loss": 0.2593, | |
| "step": 7660 | |
| }, | |
| { | |
| "epoch": 4.9, | |
| "learning_rate": 0.0004900958466453675, | |
| "loss": 0.2507, | |
| "step": 7670 | |
| }, | |
| { | |
| "epoch": 4.91, | |
| "learning_rate": 0.0004907348242811502, | |
| "loss": 0.2407, | |
| "step": 7680 | |
| }, | |
| { | |
| "epoch": 4.91, | |
| "learning_rate": 0.000491373801916933, | |
| "loss": 0.2345, | |
| "step": 7690 | |
| }, | |
| { | |
| "epoch": 4.92, | |
| "learning_rate": 0.0004920127795527157, | |
| "loss": 0.2786, | |
| "step": 7700 | |
| }, | |
| { | |
| "epoch": 4.93, | |
| "learning_rate": 0.0004926517571884984, | |
| "loss": 0.2639, | |
| "step": 7710 | |
| }, | |
| { | |
| "epoch": 4.93, | |
| "learning_rate": 0.0004932907348242811, | |
| "loss": 0.2819, | |
| "step": 7720 | |
| }, | |
| { | |
| "epoch": 4.94, | |
| "learning_rate": 0.0004939297124600639, | |
| "loss": 0.2602, | |
| "step": 7730 | |
| }, | |
| { | |
| "epoch": 4.95, | |
| "learning_rate": 0.0004945686900958467, | |
| "loss": 0.2647, | |
| "step": 7740 | |
| }, | |
| { | |
| "epoch": 4.95, | |
| "learning_rate": 0.0004952076677316294, | |
| "loss": 0.2126, | |
| "step": 7750 | |
| }, | |
| { | |
| "epoch": 4.96, | |
| "learning_rate": 0.0004958466453674122, | |
| "loss": 0.2694, | |
| "step": 7760 | |
| }, | |
| { | |
| "epoch": 4.96, | |
| "learning_rate": 0.0004964856230031949, | |
| "loss": 0.2193, | |
| "step": 7770 | |
| }, | |
| { | |
| "epoch": 4.97, | |
| "learning_rate": 0.0004971246006389776, | |
| "loss": 0.2219, | |
| "step": 7780 | |
| }, | |
| { | |
| "epoch": 4.98, | |
| "learning_rate": 0.0004977635782747603, | |
| "loss": 0.2674, | |
| "step": 7790 | |
| }, | |
| { | |
| "epoch": 4.98, | |
| "learning_rate": 0.0004984025559105431, | |
| "loss": 0.2368, | |
| "step": 7800 | |
| }, | |
| { | |
| "epoch": 4.99, | |
| "learning_rate": 0.0004990415335463259, | |
| "loss": 0.2356, | |
| "step": 7810 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "learning_rate": 0.0004996805111821086, | |
| "loss": 0.2548, | |
| "step": 7820 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "learning_rate": 0.0005003194888178914, | |
| "loss": 0.277, | |
| "step": 7830 | |
| }, | |
| { | |
| "epoch": 5.01, | |
| "learning_rate": 0.0005009584664536741, | |
| "loss": 0.2186, | |
| "step": 7840 | |
| }, | |
| { | |
| "epoch": 5.02, | |
| "learning_rate": 0.0005015974440894568, | |
| "loss": 0.2285, | |
| "step": 7850 | |
| }, | |
| { | |
| "epoch": 5.02, | |
| "learning_rate": 0.0005022364217252397, | |
| "loss": 0.2198, | |
| "step": 7860 | |
| }, | |
| { | |
| "epoch": 5.03, | |
| "learning_rate": 0.0005028753993610223, | |
| "loss": 0.1782, | |
| "step": 7870 | |
| }, | |
| { | |
| "epoch": 5.04, | |
| "learning_rate": 0.0005035143769968051, | |
| "loss": 0.2177, | |
| "step": 7880 | |
| }, | |
| { | |
| "epoch": 5.04, | |
| "learning_rate": 0.0005041533546325879, | |
| "loss": 0.2345, | |
| "step": 7890 | |
| }, | |
| { | |
| "epoch": 5.05, | |
| "learning_rate": 0.0005047923322683706, | |
| "loss": 0.2268, | |
| "step": 7900 | |
| }, | |
| { | |
| "epoch": 5.05, | |
| "learning_rate": 0.0005054313099041533, | |
| "loss": 0.2024, | |
| "step": 7910 | |
| }, | |
| { | |
| "epoch": 5.06, | |
| "learning_rate": 0.0005060702875399362, | |
| "loss": 0.2183, | |
| "step": 7920 | |
| }, | |
| { | |
| "epoch": 5.07, | |
| "learning_rate": 0.0005067092651757189, | |
| "loss": 0.2126, | |
| "step": 7930 | |
| }, | |
| { | |
| "epoch": 5.07, | |
| "learning_rate": 0.0005073482428115016, | |
| "loss": 0.241, | |
| "step": 7940 | |
| }, | |
| { | |
| "epoch": 5.08, | |
| "learning_rate": 0.0005079872204472845, | |
| "loss": 0.2137, | |
| "step": 7950 | |
| }, | |
| { | |
| "epoch": 5.09, | |
| "learning_rate": 0.0005086261980830671, | |
| "loss": 0.2156, | |
| "step": 7960 | |
| }, | |
| { | |
| "epoch": 5.09, | |
| "learning_rate": 0.0005092651757188499, | |
| "loss": 0.2081, | |
| "step": 7970 | |
| }, | |
| { | |
| "epoch": 5.1, | |
| "learning_rate": 0.0005099041533546325, | |
| "loss": 0.2235, | |
| "step": 7980 | |
| }, | |
| { | |
| "epoch": 5.11, | |
| "learning_rate": 0.0005105431309904154, | |
| "loss": 0.2023, | |
| "step": 7990 | |
| }, | |
| { | |
| "epoch": 5.11, | |
| "learning_rate": 0.0005111821086261981, | |
| "loss": 0.2001, | |
| "step": 8000 | |
| }, | |
| { | |
| "epoch": 5.12, | |
| "learning_rate": 0.0005118210862619808, | |
| "loss": 0.1899, | |
| "step": 8010 | |
| }, | |
| { | |
| "epoch": 5.12, | |
| "learning_rate": 0.0005124600638977636, | |
| "loss": 0.2328, | |
| "step": 8020 | |
| }, | |
| { | |
| "epoch": 5.13, | |
| "learning_rate": 0.0005130990415335464, | |
| "loss": 0.222, | |
| "step": 8030 | |
| }, | |
| { | |
| "epoch": 5.14, | |
| "learning_rate": 0.000513738019169329, | |
| "loss": 0.2191, | |
| "step": 8040 | |
| }, | |
| { | |
| "epoch": 5.14, | |
| "learning_rate": 0.0005143769968051119, | |
| "loss": 0.2012, | |
| "step": 8050 | |
| }, | |
| { | |
| "epoch": 5.15, | |
| "learning_rate": 0.0005150159744408946, | |
| "loss": 0.2093, | |
| "step": 8060 | |
| }, | |
| { | |
| "epoch": 5.16, | |
| "learning_rate": 0.0005156549520766773, | |
| "loss": 0.192, | |
| "step": 8070 | |
| }, | |
| { | |
| "epoch": 5.16, | |
| "learning_rate": 0.00051629392971246, | |
| "loss": 0.2442, | |
| "step": 8080 | |
| }, | |
| { | |
| "epoch": 5.17, | |
| "learning_rate": 0.0005169329073482429, | |
| "loss": 0.2149, | |
| "step": 8090 | |
| }, | |
| { | |
| "epoch": 5.18, | |
| "learning_rate": 0.0005175718849840255, | |
| "loss": 0.2278, | |
| "step": 8100 | |
| }, | |
| { | |
| "epoch": 5.18, | |
| "learning_rate": 0.0005182108626198083, | |
| "loss": 0.2626, | |
| "step": 8110 | |
| }, | |
| { | |
| "epoch": 5.19, | |
| "learning_rate": 0.0005188498402555911, | |
| "loss": 0.2234, | |
| "step": 8120 | |
| }, | |
| { | |
| "epoch": 5.19, | |
| "learning_rate": 0.0005194888178913738, | |
| "loss": 0.2177, | |
| "step": 8130 | |
| }, | |
| { | |
| "epoch": 5.2, | |
| "learning_rate": 0.0005201277955271566, | |
| "loss": 0.264, | |
| "step": 8140 | |
| }, | |
| { | |
| "epoch": 5.21, | |
| "learning_rate": 0.0005207667731629393, | |
| "loss": 0.2129, | |
| "step": 8150 | |
| }, | |
| { | |
| "epoch": 5.21, | |
| "learning_rate": 0.0005214057507987221, | |
| "loss": 0.2431, | |
| "step": 8160 | |
| }, | |
| { | |
| "epoch": 5.22, | |
| "learning_rate": 0.0005220447284345048, | |
| "loss": 0.2204, | |
| "step": 8170 | |
| }, | |
| { | |
| "epoch": 5.23, | |
| "learning_rate": 0.0005226837060702875, | |
| "loss": 0.2081, | |
| "step": 8180 | |
| }, | |
| { | |
| "epoch": 5.23, | |
| "learning_rate": 0.0005233226837060703, | |
| "loss": 0.207, | |
| "step": 8190 | |
| }, | |
| { | |
| "epoch": 5.24, | |
| "learning_rate": 0.0005239616613418531, | |
| "loss": 0.2233, | |
| "step": 8200 | |
| }, | |
| { | |
| "epoch": 5.25, | |
| "learning_rate": 0.0005246006389776357, | |
| "loss": 0.2488, | |
| "step": 8210 | |
| }, | |
| { | |
| "epoch": 5.25, | |
| "learning_rate": 0.0005252396166134186, | |
| "loss": 0.207, | |
| "step": 8220 | |
| }, | |
| { | |
| "epoch": 5.26, | |
| "learning_rate": 0.0005258785942492013, | |
| "loss": 0.2447, | |
| "step": 8230 | |
| }, | |
| { | |
| "epoch": 5.27, | |
| "learning_rate": 0.000526517571884984, | |
| "loss": 0.2295, | |
| "step": 8240 | |
| }, | |
| { | |
| "epoch": 5.27, | |
| "learning_rate": 0.0005271565495207668, | |
| "loss": 0.2539, | |
| "step": 8250 | |
| }, | |
| { | |
| "epoch": 5.28, | |
| "learning_rate": 0.0005277955271565496, | |
| "loss": 0.243, | |
| "step": 8260 | |
| }, | |
| { | |
| "epoch": 5.28, | |
| "learning_rate": 0.0005284345047923322, | |
| "loss": 0.2116, | |
| "step": 8270 | |
| }, | |
| { | |
| "epoch": 5.29, | |
| "learning_rate": 0.0005290734824281151, | |
| "loss": 0.2204, | |
| "step": 8280 | |
| }, | |
| { | |
| "epoch": 5.3, | |
| "learning_rate": 0.0005297124600638977, | |
| "loss": 0.2041, | |
| "step": 8290 | |
| }, | |
| { | |
| "epoch": 5.3, | |
| "learning_rate": 0.0005303514376996805, | |
| "loss": 0.2402, | |
| "step": 8300 | |
| }, | |
| { | |
| "epoch": 5.31, | |
| "learning_rate": 0.0005309904153354632, | |
| "loss": 0.2276, | |
| "step": 8310 | |
| }, | |
| { | |
| "epoch": 5.32, | |
| "learning_rate": 0.000531629392971246, | |
| "loss": 0.2305, | |
| "step": 8320 | |
| }, | |
| { | |
| "epoch": 5.32, | |
| "learning_rate": 0.0005322683706070288, | |
| "loss": 0.2257, | |
| "step": 8330 | |
| }, | |
| { | |
| "epoch": 5.33, | |
| "learning_rate": 0.0005329073482428115, | |
| "loss": 0.2062, | |
| "step": 8340 | |
| }, | |
| { | |
| "epoch": 5.34, | |
| "learning_rate": 0.0005335463258785943, | |
| "loss": 0.2013, | |
| "step": 8350 | |
| }, | |
| { | |
| "epoch": 5.34, | |
| "learning_rate": 0.000534185303514377, | |
| "loss": 0.2429, | |
| "step": 8360 | |
| }, | |
| { | |
| "epoch": 5.35, | |
| "learning_rate": 0.0005348242811501598, | |
| "loss": 0.1853, | |
| "step": 8370 | |
| }, | |
| { | |
| "epoch": 5.35, | |
| "learning_rate": 0.0005354632587859425, | |
| "loss": 0.2314, | |
| "step": 8380 | |
| }, | |
| { | |
| "epoch": 5.36, | |
| "learning_rate": 0.0005361022364217253, | |
| "loss": 0.2033, | |
| "step": 8390 | |
| }, | |
| { | |
| "epoch": 5.37, | |
| "learning_rate": 0.000536741214057508, | |
| "loss": 0.2227, | |
| "step": 8400 | |
| }, | |
| { | |
| "epoch": 5.37, | |
| "learning_rate": 0.0005373801916932908, | |
| "loss": 0.2243, | |
| "step": 8410 | |
| }, | |
| { | |
| "epoch": 5.38, | |
| "learning_rate": 0.0005380191693290735, | |
| "loss": 0.2322, | |
| "step": 8420 | |
| }, | |
| { | |
| "epoch": 5.39, | |
| "learning_rate": 0.0005386581469648563, | |
| "loss": 0.2103, | |
| "step": 8430 | |
| }, | |
| { | |
| "epoch": 5.39, | |
| "learning_rate": 0.0005392971246006389, | |
| "loss": 0.2361, | |
| "step": 8440 | |
| }, | |
| { | |
| "epoch": 5.4, | |
| "learning_rate": 0.0005399361022364218, | |
| "loss": 0.2518, | |
| "step": 8450 | |
| }, | |
| { | |
| "epoch": 5.41, | |
| "learning_rate": 0.0005405750798722044, | |
| "loss": 0.2079, | |
| "step": 8460 | |
| }, | |
| { | |
| "epoch": 5.41, | |
| "learning_rate": 0.0005412140575079872, | |
| "loss": 0.2353, | |
| "step": 8470 | |
| }, | |
| { | |
| "epoch": 5.42, | |
| "learning_rate": 0.00054185303514377, | |
| "loss": 0.2471, | |
| "step": 8480 | |
| }, | |
| { | |
| "epoch": 5.42, | |
| "learning_rate": 0.0005424920127795527, | |
| "loss": 0.2506, | |
| "step": 8490 | |
| }, | |
| { | |
| "epoch": 5.43, | |
| "learning_rate": 0.0005431309904153354, | |
| "loss": 0.2277, | |
| "step": 8500 | |
| }, | |
| { | |
| "epoch": 5.44, | |
| "learning_rate": 0.0005437699680511183, | |
| "loss": 0.2754, | |
| "step": 8510 | |
| }, | |
| { | |
| "epoch": 5.44, | |
| "learning_rate": 0.000544408945686901, | |
| "loss": 0.2325, | |
| "step": 8520 | |
| }, | |
| { | |
| "epoch": 5.45, | |
| "learning_rate": 0.0005450479233226837, | |
| "loss": 0.2329, | |
| "step": 8530 | |
| }, | |
| { | |
| "epoch": 5.46, | |
| "learning_rate": 0.0005456869009584666, | |
| "loss": 0.2542, | |
| "step": 8540 | |
| }, | |
| { | |
| "epoch": 5.46, | |
| "learning_rate": 0.0005463258785942492, | |
| "loss": 0.2054, | |
| "step": 8550 | |
| }, | |
| { | |
| "epoch": 5.47, | |
| "learning_rate": 0.000546964856230032, | |
| "loss": 0.2109, | |
| "step": 8560 | |
| }, | |
| { | |
| "epoch": 5.48, | |
| "learning_rate": 0.0005476038338658147, | |
| "loss": 0.2119, | |
| "step": 8570 | |
| }, | |
| { | |
| "epoch": 5.48, | |
| "learning_rate": 0.0005482428115015975, | |
| "loss": 0.2293, | |
| "step": 8580 | |
| }, | |
| { | |
| "epoch": 5.49, | |
| "learning_rate": 0.0005488817891373802, | |
| "loss": 0.2151, | |
| "step": 8590 | |
| }, | |
| { | |
| "epoch": 5.5, | |
| "learning_rate": 0.0005495207667731629, | |
| "loss": 0.2247, | |
| "step": 8600 | |
| }, | |
| { | |
| "epoch": 5.5, | |
| "learning_rate": 0.0005501597444089457, | |
| "loss": 0.2787, | |
| "step": 8610 | |
| }, | |
| { | |
| "epoch": 5.51, | |
| "learning_rate": 0.0005507987220447285, | |
| "loss": 0.2135, | |
| "step": 8620 | |
| }, | |
| { | |
| "epoch": 5.51, | |
| "learning_rate": 0.0005514376996805111, | |
| "loss": 0.2429, | |
| "step": 8630 | |
| }, | |
| { | |
| "epoch": 5.52, | |
| "learning_rate": 0.000552076677316294, | |
| "loss": 0.224, | |
| "step": 8640 | |
| }, | |
| { | |
| "epoch": 5.53, | |
| "learning_rate": 0.0005527156549520767, | |
| "loss": 0.2559, | |
| "step": 8650 | |
| }, | |
| { | |
| "epoch": 5.53, | |
| "learning_rate": 0.0005533546325878594, | |
| "loss": 0.2006, | |
| "step": 8660 | |
| }, | |
| { | |
| "epoch": 5.54, | |
| "learning_rate": 0.0005539936102236421, | |
| "loss": 0.2098, | |
| "step": 8670 | |
| }, | |
| { | |
| "epoch": 5.55, | |
| "learning_rate": 0.000554632587859425, | |
| "loss": 0.2211, | |
| "step": 8680 | |
| }, | |
| { | |
| "epoch": 5.55, | |
| "learning_rate": 0.0005552715654952076, | |
| "loss": 0.2151, | |
| "step": 8690 | |
| }, | |
| { | |
| "epoch": 5.56, | |
| "learning_rate": 0.0005559105431309904, | |
| "loss": 0.2487, | |
| "step": 8700 | |
| }, | |
| { | |
| "epoch": 5.57, | |
| "learning_rate": 0.0005565495207667732, | |
| "loss": 0.1934, | |
| "step": 8710 | |
| }, | |
| { | |
| "epoch": 5.57, | |
| "learning_rate": 0.0005571884984025559, | |
| "loss": 0.237, | |
| "step": 8720 | |
| }, | |
| { | |
| "epoch": 5.58, | |
| "learning_rate": 0.0005578274760383387, | |
| "loss": 0.2356, | |
| "step": 8730 | |
| }, | |
| { | |
| "epoch": 5.58, | |
| "learning_rate": 0.0005584664536741214, | |
| "loss": 0.242, | |
| "step": 8740 | |
| }, | |
| { | |
| "epoch": 5.59, | |
| "learning_rate": 0.0005591054313099042, | |
| "loss": 0.2187, | |
| "step": 8750 | |
| }, | |
| { | |
| "epoch": 5.6, | |
| "learning_rate": 0.0005597444089456869, | |
| "loss": 0.2434, | |
| "step": 8760 | |
| }, | |
| { | |
| "epoch": 5.6, | |
| "learning_rate": 0.0005603833865814697, | |
| "loss": 0.2641, | |
| "step": 8770 | |
| }, | |
| { | |
| "epoch": 5.61, | |
| "learning_rate": 0.0005610223642172524, | |
| "loss": 0.2223, | |
| "step": 8780 | |
| }, | |
| { | |
| "epoch": 5.62, | |
| "learning_rate": 0.0005616613418530352, | |
| "loss": 0.2159, | |
| "step": 8790 | |
| }, | |
| { | |
| "epoch": 5.62, | |
| "learning_rate": 0.0005623003194888178, | |
| "loss": 0.233, | |
| "step": 8800 | |
| }, | |
| { | |
| "epoch": 5.63, | |
| "learning_rate": 0.0005629392971246007, | |
| "loss": 0.2623, | |
| "step": 8810 | |
| }, | |
| { | |
| "epoch": 5.64, | |
| "learning_rate": 0.0005635782747603834, | |
| "loss": 0.2424, | |
| "step": 8820 | |
| }, | |
| { | |
| "epoch": 5.64, | |
| "learning_rate": 0.0005642172523961661, | |
| "loss": 0.236, | |
| "step": 8830 | |
| }, | |
| { | |
| "epoch": 5.65, | |
| "learning_rate": 0.0005648562300319489, | |
| "loss": 0.2372, | |
| "step": 8840 | |
| }, | |
| { | |
| "epoch": 5.65, | |
| "learning_rate": 0.0005654952076677317, | |
| "loss": 0.2165, | |
| "step": 8850 | |
| }, | |
| { | |
| "epoch": 5.66, | |
| "learning_rate": 0.0005661341853035143, | |
| "loss": 0.2702, | |
| "step": 8860 | |
| }, | |
| { | |
| "epoch": 5.67, | |
| "learning_rate": 0.0005667731629392972, | |
| "loss": 0.2253, | |
| "step": 8870 | |
| }, | |
| { | |
| "epoch": 5.67, | |
| "learning_rate": 0.0005674121405750799, | |
| "loss": 0.2361, | |
| "step": 8880 | |
| }, | |
| { | |
| "epoch": 5.68, | |
| "learning_rate": 0.0005680511182108626, | |
| "loss": 0.2314, | |
| "step": 8890 | |
| }, | |
| { | |
| "epoch": 5.69, | |
| "learning_rate": 0.0005686900958466453, | |
| "loss": 0.2188, | |
| "step": 8900 | |
| }, | |
| { | |
| "epoch": 5.69, | |
| "learning_rate": 0.0005693290734824281, | |
| "loss": 0.2121, | |
| "step": 8910 | |
| }, | |
| { | |
| "epoch": 5.7, | |
| "learning_rate": 0.0005699680511182109, | |
| "loss": 0.208, | |
| "step": 8920 | |
| }, | |
| { | |
| "epoch": 5.71, | |
| "learning_rate": 0.0005706070287539936, | |
| "loss": 0.2587, | |
| "step": 8930 | |
| }, | |
| { | |
| "epoch": 5.71, | |
| "learning_rate": 0.0005712460063897764, | |
| "loss": 0.248, | |
| "step": 8940 | |
| }, | |
| { | |
| "epoch": 5.72, | |
| "learning_rate": 0.0005718849840255591, | |
| "loss": 0.2321, | |
| "step": 8950 | |
| }, | |
| { | |
| "epoch": 5.73, | |
| "learning_rate": 0.0005725239616613419, | |
| "loss": 0.2464, | |
| "step": 8960 | |
| }, | |
| { | |
| "epoch": 5.73, | |
| "learning_rate": 0.0005731629392971246, | |
| "loss": 0.2344, | |
| "step": 8970 | |
| }, | |
| { | |
| "epoch": 5.74, | |
| "learning_rate": 0.0005738019169329074, | |
| "loss": 0.2346, | |
| "step": 8980 | |
| }, | |
| { | |
| "epoch": 5.74, | |
| "learning_rate": 0.0005744408945686901, | |
| "loss": 0.2296, | |
| "step": 8990 | |
| }, | |
| { | |
| "epoch": 5.75, | |
| "learning_rate": 0.0005750798722044729, | |
| "loss": 0.2556, | |
| "step": 9000 | |
| }, | |
| { | |
| "epoch": 5.76, | |
| "learning_rate": 0.0005757188498402556, | |
| "loss": 0.2424, | |
| "step": 9010 | |
| }, | |
| { | |
| "epoch": 5.76, | |
| "learning_rate": 0.0005763578274760384, | |
| "loss": 0.2561, | |
| "step": 9020 | |
| }, | |
| { | |
| "epoch": 5.77, | |
| "learning_rate": 0.000576996805111821, | |
| "loss": 0.2339, | |
| "step": 9030 | |
| }, | |
| { | |
| "epoch": 5.78, | |
| "learning_rate": 0.0005776357827476039, | |
| "loss": 0.2646, | |
| "step": 9040 | |
| }, | |
| { | |
| "epoch": 5.78, | |
| "learning_rate": 0.0005782747603833865, | |
| "loss": 0.2297, | |
| "step": 9050 | |
| }, | |
| { | |
| "epoch": 5.79, | |
| "learning_rate": 0.0005789137380191693, | |
| "loss": 0.1751, | |
| "step": 9060 | |
| }, | |
| { | |
| "epoch": 5.8, | |
| "learning_rate": 0.0005795527156549521, | |
| "loss": 0.2185, | |
| "step": 9070 | |
| }, | |
| { | |
| "epoch": 5.8, | |
| "learning_rate": 0.0005801916932907348, | |
| "loss": 0.2366, | |
| "step": 9080 | |
| }, | |
| { | |
| "epoch": 5.81, | |
| "learning_rate": 0.0005808306709265175, | |
| "loss": 0.2377, | |
| "step": 9090 | |
| }, | |
| { | |
| "epoch": 5.81, | |
| "learning_rate": 0.0005814696485623004, | |
| "loss": 0.2242, | |
| "step": 9100 | |
| }, | |
| { | |
| "epoch": 5.82, | |
| "learning_rate": 0.000582108626198083, | |
| "loss": 0.2487, | |
| "step": 9110 | |
| }, | |
| { | |
| "epoch": 5.83, | |
| "learning_rate": 0.0005827476038338658, | |
| "loss": 0.2498, | |
| "step": 9120 | |
| }, | |
| { | |
| "epoch": 5.83, | |
| "learning_rate": 0.0005833865814696487, | |
| "loss": 0.21, | |
| "step": 9130 | |
| }, | |
| { | |
| "epoch": 5.84, | |
| "learning_rate": 0.0005840255591054313, | |
| "loss": 0.2414, | |
| "step": 9140 | |
| }, | |
| { | |
| "epoch": 5.85, | |
| "learning_rate": 0.0005846645367412141, | |
| "loss": 0.2372, | |
| "step": 9150 | |
| }, | |
| { | |
| "epoch": 5.85, | |
| "learning_rate": 0.0005853035143769969, | |
| "loss": 0.2066, | |
| "step": 9160 | |
| }, | |
| { | |
| "epoch": 5.86, | |
| "learning_rate": 0.0005859424920127796, | |
| "loss": 0.2338, | |
| "step": 9170 | |
| }, | |
| { | |
| "epoch": 5.87, | |
| "learning_rate": 0.0005865814696485623, | |
| "loss": 0.2372, | |
| "step": 9180 | |
| }, | |
| { | |
| "epoch": 5.87, | |
| "learning_rate": 0.0005872204472843451, | |
| "loss": 0.2528, | |
| "step": 9190 | |
| }, | |
| { | |
| "epoch": 5.88, | |
| "learning_rate": 0.0005878594249201278, | |
| "loss": 0.2418, | |
| "step": 9200 | |
| }, | |
| { | |
| "epoch": 5.88, | |
| "learning_rate": 0.0005884984025559106, | |
| "loss": 0.2089, | |
| "step": 9210 | |
| }, | |
| { | |
| "epoch": 5.89, | |
| "learning_rate": 0.0005891373801916932, | |
| "loss": 0.2637, | |
| "step": 9220 | |
| }, | |
| { | |
| "epoch": 5.9, | |
| "learning_rate": 0.0005897763578274761, | |
| "loss": 0.262, | |
| "step": 9230 | |
| }, | |
| { | |
| "epoch": 5.9, | |
| "learning_rate": 0.0005904153354632588, | |
| "loss": 0.2451, | |
| "step": 9240 | |
| }, | |
| { | |
| "epoch": 5.91, | |
| "learning_rate": 0.0005910543130990415, | |
| "loss": 0.2283, | |
| "step": 9250 | |
| }, | |
| { | |
| "epoch": 5.92, | |
| "learning_rate": 0.0005916932907348243, | |
| "loss": 0.227, | |
| "step": 9260 | |
| }, | |
| { | |
| "epoch": 5.92, | |
| "learning_rate": 0.0005923322683706071, | |
| "loss": 0.2483, | |
| "step": 9270 | |
| }, | |
| { | |
| "epoch": 5.93, | |
| "learning_rate": 0.0005929712460063897, | |
| "loss": 0.2338, | |
| "step": 9280 | |
| }, | |
| { | |
| "epoch": 5.94, | |
| "learning_rate": 0.0005936102236421725, | |
| "loss": 0.2519, | |
| "step": 9290 | |
| }, | |
| { | |
| "epoch": 5.94, | |
| "learning_rate": 0.0005942492012779553, | |
| "loss": 0.2135, | |
| "step": 9300 | |
| }, | |
| { | |
| "epoch": 5.95, | |
| "learning_rate": 0.000594888178913738, | |
| "loss": 0.2144, | |
| "step": 9310 | |
| }, | |
| { | |
| "epoch": 5.95, | |
| "learning_rate": 0.0005955271565495208, | |
| "loss": 0.2324, | |
| "step": 9320 | |
| }, | |
| { | |
| "epoch": 5.96, | |
| "learning_rate": 0.0005961661341853036, | |
| "loss": 0.2121, | |
| "step": 9330 | |
| }, | |
| { | |
| "epoch": 5.97, | |
| "learning_rate": 0.0005968051118210863, | |
| "loss": 0.2149, | |
| "step": 9340 | |
| }, | |
| { | |
| "epoch": 5.97, | |
| "learning_rate": 0.000597444089456869, | |
| "loss": 0.2414, | |
| "step": 9350 | |
| }, | |
| { | |
| "epoch": 5.98, | |
| "learning_rate": 0.0005980830670926518, | |
| "loss": 0.2348, | |
| "step": 9360 | |
| }, | |
| { | |
| "epoch": 5.99, | |
| "learning_rate": 0.0005987220447284345, | |
| "loss": 0.2711, | |
| "step": 9370 | |
| }, | |
| { | |
| "epoch": 5.99, | |
| "learning_rate": 0.0005993610223642173, | |
| "loss": 0.2151, | |
| "step": 9380 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "learning_rate": 0.0006, | |
| "loss": 0.2554, | |
| "step": 9390 | |
| }, | |
| { | |
| "epoch": 6.01, | |
| "learning_rate": 0.0006006389776357828, | |
| "loss": 0.1843, | |
| "step": 9400 | |
| }, | |
| { | |
| "epoch": 6.01, | |
| "learning_rate": 0.0006012779552715655, | |
| "loss": 0.2518, | |
| "step": 9410 | |
| }, | |
| { | |
| "epoch": 6.02, | |
| "learning_rate": 0.0006019169329073482, | |
| "loss": 0.2017, | |
| "step": 9420 | |
| }, | |
| { | |
| "epoch": 6.03, | |
| "learning_rate": 0.000602555910543131, | |
| "loss": 0.2016, | |
| "step": 9430 | |
| }, | |
| { | |
| "epoch": 6.03, | |
| "learning_rate": 0.0006031948881789138, | |
| "loss": 0.1955, | |
| "step": 9440 | |
| }, | |
| { | |
| "epoch": 6.04, | |
| "learning_rate": 0.0006038338658146964, | |
| "loss": 0.2106, | |
| "step": 9450 | |
| }, | |
| { | |
| "epoch": 6.04, | |
| "learning_rate": 0.0006044728434504793, | |
| "loss": 0.2085, | |
| "step": 9460 | |
| }, | |
| { | |
| "epoch": 6.05, | |
| "learning_rate": 0.000605111821086262, | |
| "loss": 0.2208, | |
| "step": 9470 | |
| }, | |
| { | |
| "epoch": 6.06, | |
| "learning_rate": 0.0006057507987220447, | |
| "loss": 0.2107, | |
| "step": 9480 | |
| }, | |
| { | |
| "epoch": 6.06, | |
| "learning_rate": 0.0006063897763578275, | |
| "loss": 0.2016, | |
| "step": 9490 | |
| }, | |
| { | |
| "epoch": 6.07, | |
| "learning_rate": 0.0006070287539936102, | |
| "loss": 0.2203, | |
| "step": 9500 | |
| }, | |
| { | |
| "epoch": 6.08, | |
| "learning_rate": 0.000607667731629393, | |
| "loss": 0.1773, | |
| "step": 9510 | |
| }, | |
| { | |
| "epoch": 6.08, | |
| "learning_rate": 0.0006083067092651758, | |
| "loss": 0.2162, | |
| "step": 9520 | |
| }, | |
| { | |
| "epoch": 6.09, | |
| "learning_rate": 0.0006089456869009585, | |
| "loss": 0.1805, | |
| "step": 9530 | |
| }, | |
| { | |
| "epoch": 6.1, | |
| "learning_rate": 0.0006095846645367412, | |
| "loss": 0.275, | |
| "step": 9540 | |
| }, | |
| { | |
| "epoch": 6.1, | |
| "learning_rate": 0.000610223642172524, | |
| "loss": 0.2398, | |
| "step": 9550 | |
| }, | |
| { | |
| "epoch": 6.11, | |
| "learning_rate": 0.0006108626198083067, | |
| "loss": 0.1857, | |
| "step": 9560 | |
| }, | |
| { | |
| "epoch": 6.11, | |
| "learning_rate": 0.0006115015974440895, | |
| "loss": 0.2261, | |
| "step": 9570 | |
| }, | |
| { | |
| "epoch": 6.12, | |
| "learning_rate": 0.0006121405750798722, | |
| "loss": 0.1816, | |
| "step": 9580 | |
| }, | |
| { | |
| "epoch": 6.13, | |
| "learning_rate": 0.000612779552715655, | |
| "loss": 0.212, | |
| "step": 9590 | |
| }, | |
| { | |
| "epoch": 6.13, | |
| "learning_rate": 0.0006134185303514377, | |
| "loss": 0.2027, | |
| "step": 9600 | |
| }, | |
| { | |
| "epoch": 6.14, | |
| "learning_rate": 0.0006140575079872205, | |
| "loss": 0.2054, | |
| "step": 9610 | |
| }, | |
| { | |
| "epoch": 6.15, | |
| "learning_rate": 0.0006146964856230032, | |
| "loss": 0.2073, | |
| "step": 9620 | |
| }, | |
| { | |
| "epoch": 6.15, | |
| "learning_rate": 0.000615335463258786, | |
| "loss": 0.199, | |
| "step": 9630 | |
| }, | |
| { | |
| "epoch": 6.16, | |
| "learning_rate": 0.0006159744408945687, | |
| "loss": 0.2037, | |
| "step": 9640 | |
| }, | |
| { | |
| "epoch": 6.17, | |
| "learning_rate": 0.0006166134185303514, | |
| "loss": 0.1966, | |
| "step": 9650 | |
| }, | |
| { | |
| "epoch": 6.17, | |
| "learning_rate": 0.0006172523961661342, | |
| "loss": 0.2098, | |
| "step": 9660 | |
| }, | |
| { | |
| "epoch": 6.18, | |
| "learning_rate": 0.0006178913738019169, | |
| "loss": 0.2208, | |
| "step": 9670 | |
| }, | |
| { | |
| "epoch": 6.19, | |
| "learning_rate": 0.0006185303514376996, | |
| "loss": 0.1932, | |
| "step": 9680 | |
| }, | |
| { | |
| "epoch": 6.19, | |
| "learning_rate": 0.0006191693290734825, | |
| "loss": 0.2283, | |
| "step": 9690 | |
| }, | |
| { | |
| "epoch": 6.2, | |
| "learning_rate": 0.0006198083067092651, | |
| "loss": 0.2247, | |
| "step": 9700 | |
| }, | |
| { | |
| "epoch": 6.2, | |
| "learning_rate": 0.0006204472843450479, | |
| "loss": 0.2131, | |
| "step": 9710 | |
| }, | |
| { | |
| "epoch": 6.21, | |
| "learning_rate": 0.0006210862619808308, | |
| "loss": 0.1977, | |
| "step": 9720 | |
| }, | |
| { | |
| "epoch": 6.22, | |
| "learning_rate": 0.0006217252396166134, | |
| "loss": 0.2284, | |
| "step": 9730 | |
| }, | |
| { | |
| "epoch": 6.22, | |
| "learning_rate": 0.0006223642172523962, | |
| "loss": 0.2088, | |
| "step": 9740 | |
| }, | |
| { | |
| "epoch": 6.23, | |
| "learning_rate": 0.000623003194888179, | |
| "loss": 0.238, | |
| "step": 9750 | |
| }, | |
| { | |
| "epoch": 6.24, | |
| "learning_rate": 0.0006236421725239617, | |
| "loss": 0.198, | |
| "step": 9760 | |
| }, | |
| { | |
| "epoch": 6.24, | |
| "learning_rate": 0.0006242811501597444, | |
| "loss": 0.2132, | |
| "step": 9770 | |
| }, | |
| { | |
| "epoch": 6.25, | |
| "learning_rate": 0.0006249201277955273, | |
| "loss": 0.2107, | |
| "step": 9780 | |
| }, | |
| { | |
| "epoch": 6.26, | |
| "learning_rate": 0.0006255591054313099, | |
| "loss": 0.1984, | |
| "step": 9790 | |
| }, | |
| { | |
| "epoch": 6.26, | |
| "learning_rate": 0.0006261980830670927, | |
| "loss": 0.2316, | |
| "step": 9800 | |
| }, | |
| { | |
| "epoch": 6.27, | |
| "learning_rate": 0.0006268370607028753, | |
| "loss": 0.2404, | |
| "step": 9810 | |
| }, | |
| { | |
| "epoch": 6.27, | |
| "learning_rate": 0.0006274760383386582, | |
| "loss": 0.227, | |
| "step": 9820 | |
| }, | |
| { | |
| "epoch": 6.28, | |
| "learning_rate": 0.0006281150159744409, | |
| "loss": 0.1707, | |
| "step": 9830 | |
| }, | |
| { | |
| "epoch": 6.29, | |
| "learning_rate": 0.0006287539936102236, | |
| "loss": 0.2225, | |
| "step": 9840 | |
| }, | |
| { | |
| "epoch": 6.29, | |
| "learning_rate": 0.0006293929712460064, | |
| "loss": 0.2663, | |
| "step": 9850 | |
| }, | |
| { | |
| "epoch": 6.3, | |
| "learning_rate": 0.0006300319488817892, | |
| "loss": 0.2101, | |
| "step": 9860 | |
| }, | |
| { | |
| "epoch": 6.31, | |
| "learning_rate": 0.0006306709265175718, | |
| "loss": 0.2007, | |
| "step": 9870 | |
| }, | |
| { | |
| "epoch": 6.31, | |
| "learning_rate": 0.0006313099041533547, | |
| "loss": 0.2094, | |
| "step": 9880 | |
| }, | |
| { | |
| "epoch": 6.32, | |
| "learning_rate": 0.0006319488817891374, | |
| "loss": 0.2393, | |
| "step": 9890 | |
| }, | |
| { | |
| "epoch": 6.33, | |
| "learning_rate": 0.0006325878594249201, | |
| "loss": 0.2459, | |
| "step": 9900 | |
| }, | |
| { | |
| "epoch": 6.33, | |
| "learning_rate": 0.000633226837060703, | |
| "loss": 0.195, | |
| "step": 9910 | |
| }, | |
| { | |
| "epoch": 6.34, | |
| "learning_rate": 0.0006338658146964857, | |
| "loss": 0.1721, | |
| "step": 9920 | |
| }, | |
| { | |
| "epoch": 6.34, | |
| "learning_rate": 0.0006345047923322684, | |
| "loss": 0.2254, | |
| "step": 9930 | |
| }, | |
| { | |
| "epoch": 6.35, | |
| "learning_rate": 0.0006351437699680511, | |
| "loss": 0.2252, | |
| "step": 9940 | |
| }, | |
| { | |
| "epoch": 6.36, | |
| "learning_rate": 0.000635782747603834, | |
| "loss": 0.1812, | |
| "step": 9950 | |
| }, | |
| { | |
| "epoch": 6.36, | |
| "learning_rate": 0.0006364217252396166, | |
| "loss": 0.2133, | |
| "step": 9960 | |
| }, | |
| { | |
| "epoch": 6.37, | |
| "learning_rate": 0.0006370607028753994, | |
| "loss": 0.2453, | |
| "step": 9970 | |
| }, | |
| { | |
| "epoch": 6.38, | |
| "learning_rate": 0.000637699680511182, | |
| "loss": 0.2257, | |
| "step": 9980 | |
| }, | |
| { | |
| "epoch": 6.38, | |
| "learning_rate": 0.0006383386581469649, | |
| "loss": 0.2017, | |
| "step": 9990 | |
| }, | |
| { | |
| "epoch": 6.39, | |
| "learning_rate": 0.0006389776357827476, | |
| "loss": 0.2141, | |
| "step": 10000 | |
| }, | |
| { | |
| "epoch": 6.4, | |
| "learning_rate": 0.0006396166134185303, | |
| "loss": 0.221, | |
| "step": 10010 | |
| }, | |
| { | |
| "epoch": 6.4, | |
| "learning_rate": 0.0006402555910543131, | |
| "loss": 0.2082, | |
| "step": 10020 | |
| }, | |
| { | |
| "epoch": 6.41, | |
| "learning_rate": 0.0006408945686900959, | |
| "loss": 0.2305, | |
| "step": 10030 | |
| }, | |
| { | |
| "epoch": 6.42, | |
| "learning_rate": 0.0006415335463258785, | |
| "loss": 0.1989, | |
| "step": 10040 | |
| }, | |
| { | |
| "epoch": 6.42, | |
| "learning_rate": 0.0006421725239616614, | |
| "loss": 0.2114, | |
| "step": 10050 | |
| }, | |
| { | |
| "epoch": 6.43, | |
| "learning_rate": 0.0006428115015974441, | |
| "loss": 0.244, | |
| "step": 10060 | |
| }, | |
| { | |
| "epoch": 6.43, | |
| "learning_rate": 0.0006434504792332268, | |
| "loss": 0.2128, | |
| "step": 10070 | |
| }, | |
| { | |
| "epoch": 6.44, | |
| "learning_rate": 0.0006440894568690096, | |
| "loss": 0.2411, | |
| "step": 10080 | |
| }, | |
| { | |
| "epoch": 6.45, | |
| "learning_rate": 0.0006447284345047924, | |
| "loss": 0.2089, | |
| "step": 10090 | |
| }, | |
| { | |
| "epoch": 6.45, | |
| "learning_rate": 0.000645367412140575, | |
| "loss": 0.2048, | |
| "step": 10100 | |
| }, | |
| { | |
| "epoch": 6.46, | |
| "learning_rate": 0.0006460063897763579, | |
| "loss": 0.2081, | |
| "step": 10110 | |
| }, | |
| { | |
| "epoch": 6.47, | |
| "learning_rate": 0.0006466453674121406, | |
| "loss": 0.2285, | |
| "step": 10120 | |
| }, | |
| { | |
| "epoch": 6.47, | |
| "learning_rate": 0.0006472843450479233, | |
| "loss": 0.217, | |
| "step": 10130 | |
| }, | |
| { | |
| "epoch": 6.48, | |
| "learning_rate": 0.0006479233226837062, | |
| "loss": 0.2066, | |
| "step": 10140 | |
| }, | |
| { | |
| "epoch": 6.49, | |
| "learning_rate": 0.0006485623003194888, | |
| "loss": 0.2274, | |
| "step": 10150 | |
| }, | |
| { | |
| "epoch": 6.49, | |
| "learning_rate": 0.0006492012779552716, | |
| "loss": 0.2116, | |
| "step": 10160 | |
| }, | |
| { | |
| "epoch": 6.5, | |
| "learning_rate": 0.0006498402555910543, | |
| "loss": 0.2406, | |
| "step": 10170 | |
| }, | |
| { | |
| "epoch": 6.5, | |
| "learning_rate": 0.0006504792332268371, | |
| "loss": 0.2094, | |
| "step": 10180 | |
| }, | |
| { | |
| "epoch": 6.51, | |
| "learning_rate": 0.0006511182108626198, | |
| "loss": 0.2406, | |
| "step": 10190 | |
| }, | |
| { | |
| "epoch": 6.52, | |
| "learning_rate": 0.0006517571884984026, | |
| "loss": 0.2134, | |
| "step": 10200 | |
| }, | |
| { | |
| "epoch": 6.52, | |
| "learning_rate": 0.0006523961661341853, | |
| "loss": 0.2337, | |
| "step": 10210 | |
| }, | |
| { | |
| "epoch": 6.53, | |
| "learning_rate": 0.0006530351437699681, | |
| "loss": 0.2169, | |
| "step": 10220 | |
| }, | |
| { | |
| "epoch": 6.54, | |
| "learning_rate": 0.0006536741214057508, | |
| "loss": 0.1976, | |
| "step": 10230 | |
| }, | |
| { | |
| "epoch": 6.54, | |
| "learning_rate": 0.0006543130990415336, | |
| "loss": 0.2305, | |
| "step": 10240 | |
| }, | |
| { | |
| "epoch": 6.55, | |
| "learning_rate": 0.0006549520766773163, | |
| "loss": 0.2315, | |
| "step": 10250 | |
| }, | |
| { | |
| "epoch": 6.56, | |
| "learning_rate": 0.000655591054313099, | |
| "loss": 0.2116, | |
| "step": 10260 | |
| }, | |
| { | |
| "epoch": 6.56, | |
| "learning_rate": 0.0006562300319488817, | |
| "loss": 0.2238, | |
| "step": 10270 | |
| }, | |
| { | |
| "epoch": 6.57, | |
| "learning_rate": 0.0006568690095846646, | |
| "loss": 0.1958, | |
| "step": 10280 | |
| }, | |
| { | |
| "epoch": 6.57, | |
| "learning_rate": 0.0006575079872204472, | |
| "loss": 0.2142, | |
| "step": 10290 | |
| }, | |
| { | |
| "epoch": 6.58, | |
| "learning_rate": 0.00065814696485623, | |
| "loss": 0.2262, | |
| "step": 10300 | |
| }, | |
| { | |
| "epoch": 6.59, | |
| "learning_rate": 0.0006587859424920129, | |
| "loss": 0.2009, | |
| "step": 10310 | |
| }, | |
| { | |
| "epoch": 6.59, | |
| "learning_rate": 0.0006594249201277955, | |
| "loss": 0.2405, | |
| "step": 10320 | |
| }, | |
| { | |
| "epoch": 6.6, | |
| "learning_rate": 0.0006600638977635783, | |
| "loss": 0.239, | |
| "step": 10330 | |
| }, | |
| { | |
| "epoch": 6.61, | |
| "learning_rate": 0.0006607028753993611, | |
| "loss": 0.2234, | |
| "step": 10340 | |
| }, | |
| { | |
| "epoch": 6.61, | |
| "learning_rate": 0.0006613418530351438, | |
| "loss": 0.2276, | |
| "step": 10350 | |
| }, | |
| { | |
| "epoch": 6.62, | |
| "learning_rate": 0.0006619808306709265, | |
| "loss": 0.2201, | |
| "step": 10360 | |
| }, | |
| { | |
| "epoch": 6.63, | |
| "learning_rate": 0.0006626198083067094, | |
| "loss": 0.2277, | |
| "step": 10370 | |
| }, | |
| { | |
| "epoch": 6.63, | |
| "learning_rate": 0.000663258785942492, | |
| "loss": 0.2399, | |
| "step": 10380 | |
| }, | |
| { | |
| "epoch": 6.64, | |
| "learning_rate": 0.0006638977635782748, | |
| "loss": 0.2097, | |
| "step": 10390 | |
| }, | |
| { | |
| "epoch": 6.65, | |
| "learning_rate": 0.0006645367412140575, | |
| "loss": 0.2211, | |
| "step": 10400 | |
| }, | |
| { | |
| "epoch": 6.65, | |
| "learning_rate": 0.0006651757188498403, | |
| "loss": 0.2249, | |
| "step": 10410 | |
| }, | |
| { | |
| "epoch": 6.66, | |
| "learning_rate": 0.000665814696485623, | |
| "loss": 0.223, | |
| "step": 10420 | |
| }, | |
| { | |
| "epoch": 6.66, | |
| "learning_rate": 0.0006664536741214057, | |
| "loss": 0.2492, | |
| "step": 10430 | |
| }, | |
| { | |
| "epoch": 6.67, | |
| "learning_rate": 0.0006670926517571885, | |
| "loss": 0.1998, | |
| "step": 10440 | |
| }, | |
| { | |
| "epoch": 6.68, | |
| "learning_rate": 0.0006677316293929713, | |
| "loss": 0.2508, | |
| "step": 10450 | |
| }, | |
| { | |
| "epoch": 6.68, | |
| "learning_rate": 0.0006683706070287539, | |
| "loss": 0.2545, | |
| "step": 10460 | |
| }, | |
| { | |
| "epoch": 6.69, | |
| "learning_rate": 0.0006690095846645368, | |
| "loss": 0.2027, | |
| "step": 10470 | |
| }, | |
| { | |
| "epoch": 6.7, | |
| "learning_rate": 0.0006696485623003195, | |
| "loss": 0.2344, | |
| "step": 10480 | |
| }, | |
| { | |
| "epoch": 6.7, | |
| "learning_rate": 0.0006702875399361022, | |
| "loss": 0.2268, | |
| "step": 10490 | |
| }, | |
| { | |
| "epoch": 6.71, | |
| "learning_rate": 0.0006709265175718851, | |
| "loss": 0.2414, | |
| "step": 10500 | |
| }, | |
| { | |
| "epoch": 6.72, | |
| "learning_rate": 0.0006715654952076678, | |
| "loss": 0.2263, | |
| "step": 10510 | |
| }, | |
| { | |
| "epoch": 6.72, | |
| "learning_rate": 0.0006722044728434505, | |
| "loss": 0.1974, | |
| "step": 10520 | |
| }, | |
| { | |
| "epoch": 6.73, | |
| "learning_rate": 0.0006728434504792332, | |
| "loss": 0.2196, | |
| "step": 10530 | |
| }, | |
| { | |
| "epoch": 6.73, | |
| "learning_rate": 0.0006734824281150161, | |
| "loss": 0.1958, | |
| "step": 10540 | |
| }, | |
| { | |
| "epoch": 6.74, | |
| "learning_rate": 0.0006741214057507987, | |
| "loss": 0.2002, | |
| "step": 10550 | |
| }, | |
| { | |
| "epoch": 6.75, | |
| "learning_rate": 0.0006747603833865815, | |
| "loss": 0.2186, | |
| "step": 10560 | |
| }, | |
| { | |
| "epoch": 6.75, | |
| "learning_rate": 0.0006753993610223642, | |
| "loss": 0.2254, | |
| "step": 10570 | |
| }, | |
| { | |
| "epoch": 6.76, | |
| "learning_rate": 0.000676038338658147, | |
| "loss": 0.1954, | |
| "step": 10580 | |
| }, | |
| { | |
| "epoch": 6.77, | |
| "learning_rate": 0.0006766773162939297, | |
| "loss": 0.2413, | |
| "step": 10590 | |
| }, | |
| { | |
| "epoch": 6.77, | |
| "learning_rate": 0.0006773162939297125, | |
| "loss": 0.2373, | |
| "step": 10600 | |
| }, | |
| { | |
| "epoch": 6.78, | |
| "learning_rate": 0.0006779552715654952, | |
| "loss": 0.2389, | |
| "step": 10610 | |
| }, | |
| { | |
| "epoch": 6.79, | |
| "learning_rate": 0.000678594249201278, | |
| "loss": 0.203, | |
| "step": 10620 | |
| }, | |
| { | |
| "epoch": 6.79, | |
| "learning_rate": 0.0006792332268370606, | |
| "loss": 0.2357, | |
| "step": 10630 | |
| }, | |
| { | |
| "epoch": 6.8, | |
| "learning_rate": 0.0006798722044728435, | |
| "loss": 0.2449, | |
| "step": 10640 | |
| }, | |
| { | |
| "epoch": 6.8, | |
| "learning_rate": 0.0006805111821086262, | |
| "loss": 0.2056, | |
| "step": 10650 | |
| }, | |
| { | |
| "epoch": 6.81, | |
| "learning_rate": 0.0006811501597444089, | |
| "loss": 0.2524, | |
| "step": 10660 | |
| }, | |
| { | |
| "epoch": 6.82, | |
| "learning_rate": 0.0006817891373801917, | |
| "loss": 0.2157, | |
| "step": 10670 | |
| }, | |
| { | |
| "epoch": 6.82, | |
| "learning_rate": 0.0006824281150159745, | |
| "loss": 0.1798, | |
| "step": 10680 | |
| }, | |
| { | |
| "epoch": 6.83, | |
| "learning_rate": 0.0006830670926517571, | |
| "loss": 0.1969, | |
| "step": 10690 | |
| }, | |
| { | |
| "epoch": 6.84, | |
| "learning_rate": 0.00068370607028754, | |
| "loss": 0.2223, | |
| "step": 10700 | |
| }, | |
| { | |
| "epoch": 6.84, | |
| "learning_rate": 0.0006843450479233228, | |
| "loss": 0.2193, | |
| "step": 10710 | |
| }, | |
| { | |
| "epoch": 6.85, | |
| "learning_rate": 0.0006849840255591054, | |
| "loss": 0.2223, | |
| "step": 10720 | |
| }, | |
| { | |
| "epoch": 6.86, | |
| "learning_rate": 0.0006856230031948883, | |
| "loss": 0.2113, | |
| "step": 10730 | |
| }, | |
| { | |
| "epoch": 6.86, | |
| "learning_rate": 0.0006862619808306709, | |
| "loss": 0.2488, | |
| "step": 10740 | |
| }, | |
| { | |
| "epoch": 6.87, | |
| "learning_rate": 0.0006869009584664537, | |
| "loss": 0.2308, | |
| "step": 10750 | |
| }, | |
| { | |
| "epoch": 6.88, | |
| "learning_rate": 0.0006875399361022364, | |
| "loss": 0.2283, | |
| "step": 10760 | |
| }, | |
| { | |
| "epoch": 6.88, | |
| "learning_rate": 0.0006881789137380192, | |
| "loss": 0.2672, | |
| "step": 10770 | |
| }, | |
| { | |
| "epoch": 6.89, | |
| "learning_rate": 0.0006888178913738019, | |
| "loss": 0.2538, | |
| "step": 10780 | |
| }, | |
| { | |
| "epoch": 6.89, | |
| "learning_rate": 0.0006894568690095847, | |
| "loss": 0.2907, | |
| "step": 10790 | |
| }, | |
| { | |
| "epoch": 6.9, | |
| "learning_rate": 0.0006900958466453674, | |
| "loss": 0.1976, | |
| "step": 10800 | |
| }, | |
| { | |
| "epoch": 6.91, | |
| "learning_rate": 0.0006907348242811502, | |
| "loss": 0.2619, | |
| "step": 10810 | |
| }, | |
| { | |
| "epoch": 6.91, | |
| "learning_rate": 0.0006913738019169329, | |
| "loss": 0.1975, | |
| "step": 10820 | |
| }, | |
| { | |
| "epoch": 6.92, | |
| "learning_rate": 0.0006920127795527157, | |
| "loss": 0.1838, | |
| "step": 10830 | |
| }, | |
| { | |
| "epoch": 6.93, | |
| "learning_rate": 0.0006926517571884984, | |
| "loss": 0.2242, | |
| "step": 10840 | |
| }, | |
| { | |
| "epoch": 6.93, | |
| "learning_rate": 0.0006932907348242812, | |
| "loss": 0.2057, | |
| "step": 10850 | |
| }, | |
| { | |
| "epoch": 6.94, | |
| "learning_rate": 0.0006939297124600638, | |
| "loss": 0.2116, | |
| "step": 10860 | |
| }, | |
| { | |
| "epoch": 6.95, | |
| "learning_rate": 0.0006945686900958467, | |
| "loss": 0.2289, | |
| "step": 10870 | |
| }, | |
| { | |
| "epoch": 6.95, | |
| "learning_rate": 0.0006952076677316293, | |
| "loss": 0.202, | |
| "step": 10880 | |
| }, | |
| { | |
| "epoch": 6.96, | |
| "learning_rate": 0.0006958466453674121, | |
| "loss": 0.2221, | |
| "step": 10890 | |
| }, | |
| { | |
| "epoch": 6.96, | |
| "learning_rate": 0.000696485623003195, | |
| "loss": 0.237, | |
| "step": 10900 | |
| }, | |
| { | |
| "epoch": 6.97, | |
| "learning_rate": 0.0006971246006389776, | |
| "loss": 0.3199, | |
| "step": 10910 | |
| }, | |
| { | |
| "epoch": 6.98, | |
| "learning_rate": 0.0006977635782747604, | |
| "loss": 0.2029, | |
| "step": 10920 | |
| }, | |
| { | |
| "epoch": 6.98, | |
| "learning_rate": 0.0006984025559105432, | |
| "loss": 0.223, | |
| "step": 10930 | |
| }, | |
| { | |
| "epoch": 6.99, | |
| "learning_rate": 0.0006990415335463259, | |
| "loss": 0.216, | |
| "step": 10940 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "learning_rate": 0.0006996805111821086, | |
| "loss": 0.1952, | |
| "step": 10950 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "learning_rate": 0.0007003194888178915, | |
| "loss": 0.2173, | |
| "step": 10960 | |
| }, | |
| { | |
| "epoch": 7.01, | |
| "learning_rate": 0.0007009584664536741, | |
| "loss": 0.1895, | |
| "step": 10970 | |
| }, | |
| { | |
| "epoch": 7.02, | |
| "learning_rate": 0.0007015974440894569, | |
| "loss": 0.1721, | |
| "step": 10980 | |
| }, | |
| { | |
| "epoch": 7.02, | |
| "learning_rate": 0.0007022364217252397, | |
| "loss": 0.1872, | |
| "step": 10990 | |
| }, | |
| { | |
| "epoch": 7.03, | |
| "learning_rate": 0.0007028753993610224, | |
| "loss": 0.1846, | |
| "step": 11000 | |
| }, | |
| { | |
| "epoch": 7.04, | |
| "learning_rate": 0.0007035143769968051, | |
| "loss": 0.207, | |
| "step": 11010 | |
| }, | |
| { | |
| "epoch": 7.04, | |
| "learning_rate": 0.0007041533546325878, | |
| "loss": 0.2032, | |
| "step": 11020 | |
| }, | |
| { | |
| "epoch": 7.05, | |
| "learning_rate": 0.0007047923322683706, | |
| "loss": 0.1662, | |
| "step": 11030 | |
| }, | |
| { | |
| "epoch": 7.05, | |
| "learning_rate": 0.0007054313099041534, | |
| "loss": 0.167, | |
| "step": 11040 | |
| }, | |
| { | |
| "epoch": 7.06, | |
| "learning_rate": 0.000706070287539936, | |
| "loss": 0.2351, | |
| "step": 11050 | |
| }, | |
| { | |
| "epoch": 7.07, | |
| "learning_rate": 0.0007067092651757189, | |
| "loss": 0.1653, | |
| "step": 11060 | |
| }, | |
| { | |
| "epoch": 7.07, | |
| "learning_rate": 0.0007073482428115016, | |
| "loss": 0.1826, | |
| "step": 11070 | |
| }, | |
| { | |
| "epoch": 7.08, | |
| "learning_rate": 0.0007079872204472843, | |
| "loss": 0.2162, | |
| "step": 11080 | |
| }, | |
| { | |
| "epoch": 7.09, | |
| "learning_rate": 0.000708626198083067, | |
| "loss": 0.1853, | |
| "step": 11090 | |
| }, | |
| { | |
| "epoch": 7.09, | |
| "learning_rate": 0.0007092651757188499, | |
| "loss": 0.1865, | |
| "step": 11100 | |
| }, | |
| { | |
| "epoch": 7.1, | |
| "learning_rate": 0.0007099041533546326, | |
| "loss": 0.1868, | |
| "step": 11110 | |
| }, | |
| { | |
| "epoch": 7.11, | |
| "learning_rate": 0.0007105431309904153, | |
| "loss": 0.1628, | |
| "step": 11120 | |
| }, | |
| { | |
| "epoch": 7.11, | |
| "learning_rate": 0.0007111821086261982, | |
| "loss": 0.1975, | |
| "step": 11130 | |
| }, | |
| { | |
| "epoch": 7.12, | |
| "learning_rate": 0.0007118210862619808, | |
| "loss": 0.1853, | |
| "step": 11140 | |
| }, | |
| { | |
| "epoch": 7.12, | |
| "learning_rate": 0.0007124600638977636, | |
| "loss": 0.2046, | |
| "step": 11150 | |
| }, | |
| { | |
| "epoch": 7.13, | |
| "learning_rate": 0.0007130990415335464, | |
| "loss": 0.1966, | |
| "step": 11160 | |
| }, | |
| { | |
| "epoch": 7.14, | |
| "learning_rate": 0.0007137380191693291, | |
| "loss": 0.2022, | |
| "step": 11170 | |
| }, | |
| { | |
| "epoch": 7.14, | |
| "learning_rate": 0.0007143769968051118, | |
| "loss": 0.1635, | |
| "step": 11180 | |
| }, | |
| { | |
| "epoch": 7.15, | |
| "learning_rate": 0.0007150159744408946, | |
| "loss": 0.2223, | |
| "step": 11190 | |
| }, | |
| { | |
| "epoch": 7.16, | |
| "learning_rate": 0.0007156549520766773, | |
| "loss": 0.2094, | |
| "step": 11200 | |
| }, | |
| { | |
| "epoch": 7.16, | |
| "learning_rate": 0.0007162939297124601, | |
| "loss": 0.1938, | |
| "step": 11210 | |
| }, | |
| { | |
| "epoch": 7.17, | |
| "learning_rate": 0.0007169329073482428, | |
| "loss": 0.2053, | |
| "step": 11220 | |
| }, | |
| { | |
| "epoch": 7.18, | |
| "learning_rate": 0.0007175718849840256, | |
| "loss": 0.1981, | |
| "step": 11230 | |
| }, | |
| { | |
| "epoch": 7.18, | |
| "learning_rate": 0.0007182108626198083, | |
| "loss": 0.1969, | |
| "step": 11240 | |
| }, | |
| { | |
| "epoch": 7.19, | |
| "learning_rate": 0.000718849840255591, | |
| "loss": 0.1912, | |
| "step": 11250 | |
| }, | |
| { | |
| "epoch": 7.19, | |
| "learning_rate": 0.0007194888178913738, | |
| "loss": 0.1875, | |
| "step": 11260 | |
| }, | |
| { | |
| "epoch": 7.2, | |
| "learning_rate": 0.0007201277955271566, | |
| "loss": 0.1944, | |
| "step": 11270 | |
| }, | |
| { | |
| "epoch": 7.21, | |
| "learning_rate": 0.0007207667731629392, | |
| "loss": 0.2254, | |
| "step": 11280 | |
| }, | |
| { | |
| "epoch": 7.21, | |
| "learning_rate": 0.0007214057507987221, | |
| "loss": 0.2204, | |
| "step": 11290 | |
| }, | |
| { | |
| "epoch": 7.22, | |
| "learning_rate": 0.0007220447284345049, | |
| "loss": 0.2089, | |
| "step": 11300 | |
| }, | |
| { | |
| "epoch": 7.23, | |
| "learning_rate": 0.0007226837060702875, | |
| "loss": 0.2098, | |
| "step": 11310 | |
| }, | |
| { | |
| "epoch": 7.23, | |
| "learning_rate": 0.0007233226837060704, | |
| "loss": 0.2107, | |
| "step": 11320 | |
| }, | |
| { | |
| "epoch": 7.24, | |
| "learning_rate": 0.000723961661341853, | |
| "loss": 0.2035, | |
| "step": 11330 | |
| }, | |
| { | |
| "epoch": 7.25, | |
| "learning_rate": 0.0007246006389776358, | |
| "loss": 0.2098, | |
| "step": 11340 | |
| }, | |
| { | |
| "epoch": 7.25, | |
| "learning_rate": 0.0007252396166134186, | |
| "loss": 0.2332, | |
| "step": 11350 | |
| }, | |
| { | |
| "epoch": 7.26, | |
| "learning_rate": 0.0007258785942492013, | |
| "loss": 0.1978, | |
| "step": 11360 | |
| }, | |
| { | |
| "epoch": 7.27, | |
| "learning_rate": 0.000726517571884984, | |
| "loss": 0.1873, | |
| "step": 11370 | |
| }, | |
| { | |
| "epoch": 7.27, | |
| "learning_rate": 0.0007271565495207669, | |
| "loss": 0.1933, | |
| "step": 11380 | |
| }, | |
| { | |
| "epoch": 7.28, | |
| "learning_rate": 0.0007277955271565495, | |
| "loss": 0.2329, | |
| "step": 11390 | |
| }, | |
| { | |
| "epoch": 7.28, | |
| "learning_rate": 0.0007284345047923323, | |
| "loss": 0.1914, | |
| "step": 11400 | |
| }, | |
| { | |
| "epoch": 7.29, | |
| "learning_rate": 0.000729073482428115, | |
| "loss": 0.1788, | |
| "step": 11410 | |
| }, | |
| { | |
| "epoch": 7.3, | |
| "learning_rate": 0.0007297124600638978, | |
| "loss": 0.2233, | |
| "step": 11420 | |
| }, | |
| { | |
| "epoch": 7.3, | |
| "learning_rate": 0.0007303514376996805, | |
| "loss": 0.2045, | |
| "step": 11430 | |
| }, | |
| { | |
| "epoch": 7.31, | |
| "learning_rate": 0.0007309904153354633, | |
| "loss": 0.1945, | |
| "step": 11440 | |
| }, | |
| { | |
| "epoch": 7.32, | |
| "learning_rate": 0.000731629392971246, | |
| "loss": 0.2035, | |
| "step": 11450 | |
| }, | |
| { | |
| "epoch": 7.32, | |
| "learning_rate": 0.0007322683706070288, | |
| "loss": 0.1888, | |
| "step": 11460 | |
| }, | |
| { | |
| "epoch": 7.33, | |
| "learning_rate": 0.0007329073482428114, | |
| "loss": 0.2102, | |
| "step": 11470 | |
| }, | |
| { | |
| "epoch": 7.34, | |
| "learning_rate": 0.0007335463258785943, | |
| "loss": 0.2422, | |
| "step": 11480 | |
| }, | |
| { | |
| "epoch": 7.34, | |
| "learning_rate": 0.0007341853035143771, | |
| "loss": 0.2067, | |
| "step": 11490 | |
| }, | |
| { | |
| "epoch": 7.35, | |
| "learning_rate": 0.0007348242811501597, | |
| "loss": 0.2258, | |
| "step": 11500 | |
| }, | |
| { | |
| "epoch": 7.35, | |
| "learning_rate": 0.0007354632587859425, | |
| "loss": 0.1953, | |
| "step": 11510 | |
| }, | |
| { | |
| "epoch": 7.36, | |
| "learning_rate": 0.0007361022364217253, | |
| "loss": 0.2008, | |
| "step": 11520 | |
| }, | |
| { | |
| "epoch": 7.37, | |
| "learning_rate": 0.000736741214057508, | |
| "loss": 0.1799, | |
| "step": 11530 | |
| }, | |
| { | |
| "epoch": 7.37, | |
| "learning_rate": 0.0007373801916932907, | |
| "loss": 0.1961, | |
| "step": 11540 | |
| }, | |
| { | |
| "epoch": 7.38, | |
| "learning_rate": 0.0007380191693290736, | |
| "loss": 0.2147, | |
| "step": 11550 | |
| }, | |
| { | |
| "epoch": 7.39, | |
| "learning_rate": 0.0007386581469648562, | |
| "loss": 0.2173, | |
| "step": 11560 | |
| }, | |
| { | |
| "epoch": 7.39, | |
| "learning_rate": 0.000739297124600639, | |
| "loss": 0.2015, | |
| "step": 11570 | |
| }, | |
| { | |
| "epoch": 7.4, | |
| "learning_rate": 0.0007399361022364218, | |
| "loss": 0.2245, | |
| "step": 11580 | |
| }, | |
| { | |
| "epoch": 7.41, | |
| "learning_rate": 0.0007405750798722045, | |
| "loss": 0.2001, | |
| "step": 11590 | |
| }, | |
| { | |
| "epoch": 7.41, | |
| "learning_rate": 0.0007412140575079872, | |
| "loss": 0.2022, | |
| "step": 11600 | |
| }, | |
| { | |
| "epoch": 7.42, | |
| "learning_rate": 0.0007418530351437701, | |
| "loss": 0.2094, | |
| "step": 11610 | |
| }, | |
| { | |
| "epoch": 7.42, | |
| "learning_rate": 0.0007424920127795527, | |
| "loss": 0.2429, | |
| "step": 11620 | |
| }, | |
| { | |
| "epoch": 7.43, | |
| "learning_rate": 0.0007431309904153355, | |
| "loss": 0.174, | |
| "step": 11630 | |
| }, | |
| { | |
| "epoch": 7.44, | |
| "learning_rate": 0.0007437699680511181, | |
| "loss": 0.2271, | |
| "step": 11640 | |
| }, | |
| { | |
| "epoch": 7.44, | |
| "learning_rate": 0.000744408945686901, | |
| "loss": 0.1932, | |
| "step": 11650 | |
| }, | |
| { | |
| "epoch": 7.45, | |
| "learning_rate": 0.0007450479233226837, | |
| "loss": 0.1983, | |
| "step": 11660 | |
| }, | |
| { | |
| "epoch": 7.46, | |
| "learning_rate": 0.0007456869009584664, | |
| "loss": 0.1996, | |
| "step": 11670 | |
| }, | |
| { | |
| "epoch": 7.46, | |
| "learning_rate": 0.0007463258785942492, | |
| "loss": 0.2084, | |
| "step": 11680 | |
| }, | |
| { | |
| "epoch": 7.47, | |
| "learning_rate": 0.000746964856230032, | |
| "loss": 0.2157, | |
| "step": 11690 | |
| }, | |
| { | |
| "epoch": 7.48, | |
| "learning_rate": 0.0007476038338658147, | |
| "loss": 0.2366, | |
| "step": 11700 | |
| }, | |
| { | |
| "epoch": 7.48, | |
| "learning_rate": 0.0007482428115015975, | |
| "loss": 0.2104, | |
| "step": 11710 | |
| }, | |
| { | |
| "epoch": 7.49, | |
| "learning_rate": 0.0007488817891373803, | |
| "loss": 0.2164, | |
| "step": 11720 | |
| }, | |
| { | |
| "epoch": 7.5, | |
| "learning_rate": 0.0007495207667731629, | |
| "loss": 0.1951, | |
| "step": 11730 | |
| }, | |
| { | |
| "epoch": 7.5, | |
| "learning_rate": 0.0007501597444089458, | |
| "loss": 0.2207, | |
| "step": 11740 | |
| }, | |
| { | |
| "epoch": 7.51, | |
| "learning_rate": 0.0007507987220447285, | |
| "loss": 0.1786, | |
| "step": 11750 | |
| }, | |
| { | |
| "epoch": 7.51, | |
| "learning_rate": 0.0007514376996805112, | |
| "loss": 0.2087, | |
| "step": 11760 | |
| }, | |
| { | |
| "epoch": 7.52, | |
| "learning_rate": 0.0007520766773162939, | |
| "loss": 0.2059, | |
| "step": 11770 | |
| }, | |
| { | |
| "epoch": 7.53, | |
| "learning_rate": 0.0007527156549520767, | |
| "loss": 0.2304, | |
| "step": 11780 | |
| }, | |
| { | |
| "epoch": 7.53, | |
| "learning_rate": 0.0007533546325878594, | |
| "loss": 0.2173, | |
| "step": 11790 | |
| }, | |
| { | |
| "epoch": 7.54, | |
| "learning_rate": 0.0007539936102236422, | |
| "loss": 0.2221, | |
| "step": 11800 | |
| }, | |
| { | |
| "epoch": 7.55, | |
| "learning_rate": 0.0007546325878594249, | |
| "loss": 0.203, | |
| "step": 11810 | |
| }, | |
| { | |
| "epoch": 7.55, | |
| "learning_rate": 0.0007552715654952077, | |
| "loss": 0.2087, | |
| "step": 11820 | |
| }, | |
| { | |
| "epoch": 7.56, | |
| "learning_rate": 0.0007559105431309904, | |
| "loss": 0.2292, | |
| "step": 11830 | |
| }, | |
| { | |
| "epoch": 7.57, | |
| "learning_rate": 0.0007565495207667732, | |
| "loss": 0.2116, | |
| "step": 11840 | |
| }, | |
| { | |
| "epoch": 7.57, | |
| "learning_rate": 0.0007571884984025559, | |
| "loss": 0.2227, | |
| "step": 11850 | |
| }, | |
| { | |
| "epoch": 7.58, | |
| "learning_rate": 0.0007578274760383387, | |
| "loss": 0.207, | |
| "step": 11860 | |
| }, | |
| { | |
| "epoch": 7.58, | |
| "learning_rate": 0.0007584664536741213, | |
| "loss": 0.2051, | |
| "step": 11870 | |
| }, | |
| { | |
| "epoch": 7.59, | |
| "learning_rate": 0.0007591054313099042, | |
| "loss": 0.2409, | |
| "step": 11880 | |
| }, | |
| { | |
| "epoch": 7.6, | |
| "learning_rate": 0.000759744408945687, | |
| "loss": 0.1849, | |
| "step": 11890 | |
| }, | |
| { | |
| "epoch": 7.6, | |
| "learning_rate": 0.0007603833865814696, | |
| "loss": 0.2098, | |
| "step": 11900 | |
| }, | |
| { | |
| "epoch": 7.61, | |
| "learning_rate": 0.0007610223642172525, | |
| "loss": 0.2225, | |
| "step": 11910 | |
| }, | |
| { | |
| "epoch": 7.62, | |
| "learning_rate": 0.0007616613418530352, | |
| "loss": 0.1973, | |
| "step": 11920 | |
| }, | |
| { | |
| "epoch": 7.62, | |
| "learning_rate": 0.0007623003194888179, | |
| "loss": 0.239, | |
| "step": 11930 | |
| }, | |
| { | |
| "epoch": 7.63, | |
| "learning_rate": 0.0007629392971246007, | |
| "loss": 0.2186, | |
| "step": 11940 | |
| }, | |
| { | |
| "epoch": 7.64, | |
| "learning_rate": 0.0007635782747603834, | |
| "loss": 0.1849, | |
| "step": 11950 | |
| }, | |
| { | |
| "epoch": 7.64, | |
| "learning_rate": 0.0007642172523961661, | |
| "loss": 0.2316, | |
| "step": 11960 | |
| }, | |
| { | |
| "epoch": 7.65, | |
| "learning_rate": 0.000764856230031949, | |
| "loss": 0.2223, | |
| "step": 11970 | |
| }, | |
| { | |
| "epoch": 7.65, | |
| "learning_rate": 0.0007654952076677316, | |
| "loss": 0.2457, | |
| "step": 11980 | |
| }, | |
| { | |
| "epoch": 7.66, | |
| "learning_rate": 0.0007661341853035144, | |
| "loss": 0.2006, | |
| "step": 11990 | |
| }, | |
| { | |
| "epoch": 7.67, | |
| "learning_rate": 0.0007667731629392971, | |
| "loss": 0.2142, | |
| "step": 12000 | |
| }, | |
| { | |
| "epoch": 7.67, | |
| "learning_rate": 0.0007674121405750799, | |
| "loss": 0.1964, | |
| "step": 12010 | |
| }, | |
| { | |
| "epoch": 7.68, | |
| "learning_rate": 0.0007680511182108626, | |
| "loss": 0.2215, | |
| "step": 12020 | |
| }, | |
| { | |
| "epoch": 7.69, | |
| "learning_rate": 0.0007686900958466454, | |
| "loss": 0.2158, | |
| "step": 12030 | |
| }, | |
| { | |
| "epoch": 7.69, | |
| "learning_rate": 0.0007693290734824281, | |
| "loss": 0.2071, | |
| "step": 12040 | |
| }, | |
| { | |
| "epoch": 7.7, | |
| "learning_rate": 0.0007699680511182109, | |
| "loss": 0.221, | |
| "step": 12050 | |
| }, | |
| { | |
| "epoch": 7.71, | |
| "learning_rate": 0.0007706070287539936, | |
| "loss": 0.2322, | |
| "step": 12060 | |
| }, | |
| { | |
| "epoch": 7.71, | |
| "learning_rate": 0.0007712460063897764, | |
| "loss": 0.2176, | |
| "step": 12070 | |
| }, | |
| { | |
| "epoch": 7.72, | |
| "learning_rate": 0.0007718849840255591, | |
| "loss": 0.1703, | |
| "step": 12080 | |
| }, | |
| { | |
| "epoch": 7.73, | |
| "learning_rate": 0.0007725239616613418, | |
| "loss": 0.2264, | |
| "step": 12090 | |
| }, | |
| { | |
| "epoch": 7.73, | |
| "learning_rate": 0.0007731629392971247, | |
| "loss": 0.2123, | |
| "step": 12100 | |
| }, | |
| { | |
| "epoch": 7.74, | |
| "learning_rate": 0.0007738019169329074, | |
| "loss": 0.2096, | |
| "step": 12110 | |
| }, | |
| { | |
| "epoch": 7.74, | |
| "learning_rate": 0.0007744408945686901, | |
| "loss": 0.228, | |
| "step": 12120 | |
| }, | |
| { | |
| "epoch": 7.75, | |
| "learning_rate": 0.0007750798722044728, | |
| "loss": 0.2193, | |
| "step": 12130 | |
| }, | |
| { | |
| "epoch": 7.76, | |
| "learning_rate": 0.0007757188498402557, | |
| "loss": 0.2062, | |
| "step": 12140 | |
| }, | |
| { | |
| "epoch": 7.76, | |
| "learning_rate": 0.0007763578274760383, | |
| "loss": 0.1992, | |
| "step": 12150 | |
| }, | |
| { | |
| "epoch": 7.77, | |
| "learning_rate": 0.0007769968051118211, | |
| "loss": 0.1922, | |
| "step": 12160 | |
| }, | |
| { | |
| "epoch": 7.78, | |
| "learning_rate": 0.0007776357827476039, | |
| "loss": 0.1991, | |
| "step": 12170 | |
| }, | |
| { | |
| "epoch": 7.78, | |
| "learning_rate": 0.0007782747603833866, | |
| "loss": 0.2427, | |
| "step": 12180 | |
| }, | |
| { | |
| "epoch": 7.79, | |
| "learning_rate": 0.0007789137380191693, | |
| "loss": 0.2242, | |
| "step": 12190 | |
| }, | |
| { | |
| "epoch": 7.8, | |
| "learning_rate": 0.0007795527156549522, | |
| "loss": 0.2559, | |
| "step": 12200 | |
| }, | |
| { | |
| "epoch": 7.8, | |
| "learning_rate": 0.0007801916932907348, | |
| "loss": 0.2238, | |
| "step": 12210 | |
| }, | |
| { | |
| "epoch": 7.81, | |
| "learning_rate": 0.0007808306709265176, | |
| "loss": 0.2055, | |
| "step": 12220 | |
| }, | |
| { | |
| "epoch": 7.81, | |
| "learning_rate": 0.0007814696485623002, | |
| "loss": 0.2139, | |
| "step": 12230 | |
| }, | |
| { | |
| "epoch": 7.82, | |
| "learning_rate": 0.0007821086261980831, | |
| "loss": 0.2198, | |
| "step": 12240 | |
| }, | |
| { | |
| "epoch": 7.83, | |
| "learning_rate": 0.0007827476038338658, | |
| "loss": 0.2401, | |
| "step": 12250 | |
| }, | |
| { | |
| "epoch": 7.83, | |
| "learning_rate": 0.0007833865814696485, | |
| "loss": 0.2253, | |
| "step": 12260 | |
| }, | |
| { | |
| "epoch": 7.84, | |
| "learning_rate": 0.0007840255591054313, | |
| "loss": 0.2157, | |
| "step": 12270 | |
| }, | |
| { | |
| "epoch": 7.85, | |
| "learning_rate": 0.0007846645367412141, | |
| "loss": 0.2274, | |
| "step": 12280 | |
| }, | |
| { | |
| "epoch": 7.85, | |
| "learning_rate": 0.0007853035143769968, | |
| "loss": 0.2281, | |
| "step": 12290 | |
| }, | |
| { | |
| "epoch": 7.86, | |
| "learning_rate": 0.0007859424920127796, | |
| "loss": 0.1965, | |
| "step": 12300 | |
| }, | |
| { | |
| "epoch": 7.87, | |
| "learning_rate": 0.0007865814696485624, | |
| "loss": 0.2179, | |
| "step": 12310 | |
| }, | |
| { | |
| "epoch": 7.87, | |
| "learning_rate": 0.000787220447284345, | |
| "loss": 0.1826, | |
| "step": 12320 | |
| }, | |
| { | |
| "epoch": 7.88, | |
| "learning_rate": 0.0007878594249201279, | |
| "loss": 0.172, | |
| "step": 12330 | |
| }, | |
| { | |
| "epoch": 7.88, | |
| "learning_rate": 0.0007884984025559106, | |
| "loss": 0.2562, | |
| "step": 12340 | |
| }, | |
| { | |
| "epoch": 7.89, | |
| "learning_rate": 0.0007891373801916933, | |
| "loss": 0.2094, | |
| "step": 12350 | |
| }, | |
| { | |
| "epoch": 7.9, | |
| "learning_rate": 0.000789776357827476, | |
| "loss": 0.1897, | |
| "step": 12360 | |
| }, | |
| { | |
| "epoch": 7.9, | |
| "learning_rate": 0.0007904153354632589, | |
| "loss": 0.2108, | |
| "step": 12370 | |
| }, | |
| { | |
| "epoch": 7.91, | |
| "learning_rate": 0.0007910543130990415, | |
| "loss": 0.21, | |
| "step": 12380 | |
| }, | |
| { | |
| "epoch": 7.92, | |
| "learning_rate": 0.0007916932907348243, | |
| "loss": 0.2316, | |
| "step": 12390 | |
| }, | |
| { | |
| "epoch": 7.92, | |
| "learning_rate": 0.000792332268370607, | |
| "loss": 0.1809, | |
| "step": 12400 | |
| }, | |
| { | |
| "epoch": 7.93, | |
| "learning_rate": 0.0007929712460063898, | |
| "loss": 0.2491, | |
| "step": 12410 | |
| }, | |
| { | |
| "epoch": 7.94, | |
| "learning_rate": 0.0007936102236421725, | |
| "loss": 0.1887, | |
| "step": 12420 | |
| }, | |
| { | |
| "epoch": 7.94, | |
| "learning_rate": 0.0007942492012779553, | |
| "loss": 0.2278, | |
| "step": 12430 | |
| }, | |
| { | |
| "epoch": 7.95, | |
| "learning_rate": 0.000794888178913738, | |
| "loss": 0.2504, | |
| "step": 12440 | |
| }, | |
| { | |
| "epoch": 7.95, | |
| "learning_rate": 0.0007955271565495208, | |
| "loss": 0.2111, | |
| "step": 12450 | |
| }, | |
| { | |
| "epoch": 7.96, | |
| "learning_rate": 0.0007961661341853034, | |
| "loss": 0.2649, | |
| "step": 12460 | |
| }, | |
| { | |
| "epoch": 7.97, | |
| "learning_rate": 0.0007968051118210863, | |
| "loss": 0.2035, | |
| "step": 12470 | |
| }, | |
| { | |
| "epoch": 7.97, | |
| "learning_rate": 0.000797444089456869, | |
| "loss": 0.2132, | |
| "step": 12480 | |
| }, | |
| { | |
| "epoch": 7.98, | |
| "learning_rate": 0.0007980830670926517, | |
| "loss": 0.2869, | |
| "step": 12490 | |
| }, | |
| { | |
| "epoch": 7.99, | |
| "learning_rate": 0.0007987220447284346, | |
| "loss": 0.261, | |
| "step": 12500 | |
| }, | |
| { | |
| "epoch": 7.99, | |
| "learning_rate": 0.0007993610223642173, | |
| "loss": 0.1863, | |
| "step": 12510 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "learning_rate": 0.0008, | |
| "loss": 0.2178, | |
| "step": 12520 | |
| }, | |
| { | |
| "epoch": 8.01, | |
| "learning_rate": 0.0008006389776357828, | |
| "loss": 0.1807, | |
| "step": 12530 | |
| }, | |
| { | |
| "epoch": 8.01, | |
| "learning_rate": 0.0008012779552715655, | |
| "loss": 0.1813, | |
| "step": 12540 | |
| }, | |
| { | |
| "epoch": 8.02, | |
| "learning_rate": 0.0008019169329073482, | |
| "loss": 0.1791, | |
| "step": 12550 | |
| }, | |
| { | |
| "epoch": 8.03, | |
| "learning_rate": 0.0008025559105431311, | |
| "loss": 0.1472, | |
| "step": 12560 | |
| }, | |
| { | |
| "epoch": 8.03, | |
| "learning_rate": 0.0008031948881789137, | |
| "loss": 0.18, | |
| "step": 12570 | |
| }, | |
| { | |
| "epoch": 8.04, | |
| "learning_rate": 0.0008038338658146965, | |
| "loss": 0.1829, | |
| "step": 12580 | |
| }, | |
| { | |
| "epoch": 8.04, | |
| "learning_rate": 0.0008044728434504793, | |
| "loss": 0.1877, | |
| "step": 12590 | |
| }, | |
| { | |
| "epoch": 8.05, | |
| "learning_rate": 0.000805111821086262, | |
| "loss": 0.2126, | |
| "step": 12600 | |
| }, | |
| { | |
| "epoch": 8.06, | |
| "learning_rate": 0.0008057507987220447, | |
| "loss": 0.1921, | |
| "step": 12610 | |
| }, | |
| { | |
| "epoch": 8.06, | |
| "learning_rate": 0.0008063897763578275, | |
| "loss": 0.1952, | |
| "step": 12620 | |
| }, | |
| { | |
| "epoch": 8.07, | |
| "learning_rate": 0.0008070287539936102, | |
| "loss": 0.1775, | |
| "step": 12630 | |
| }, | |
| { | |
| "epoch": 8.08, | |
| "learning_rate": 0.000807667731629393, | |
| "loss": 0.2038, | |
| "step": 12640 | |
| }, | |
| { | |
| "epoch": 8.08, | |
| "learning_rate": 0.0008083067092651757, | |
| "loss": 0.2054, | |
| "step": 12650 | |
| }, | |
| { | |
| "epoch": 8.09, | |
| "learning_rate": 0.0008089456869009585, | |
| "loss": 0.2258, | |
| "step": 12660 | |
| }, | |
| { | |
| "epoch": 8.1, | |
| "learning_rate": 0.0008095846645367412, | |
| "loss": 0.2226, | |
| "step": 12670 | |
| }, | |
| { | |
| "epoch": 8.1, | |
| "learning_rate": 0.000810223642172524, | |
| "loss": 0.1902, | |
| "step": 12680 | |
| }, | |
| { | |
| "epoch": 8.11, | |
| "learning_rate": 0.0008108626198083068, | |
| "loss": 0.1996, | |
| "step": 12690 | |
| }, | |
| { | |
| "epoch": 8.11, | |
| "learning_rate": 0.0008115015974440895, | |
| "loss": 0.1904, | |
| "step": 12700 | |
| }, | |
| { | |
| "epoch": 8.12, | |
| "learning_rate": 0.0008121405750798722, | |
| "loss": 0.1486, | |
| "step": 12710 | |
| }, | |
| { | |
| "epoch": 8.13, | |
| "learning_rate": 0.000812779552715655, | |
| "loss": 0.1905, | |
| "step": 12720 | |
| }, | |
| { | |
| "epoch": 8.13, | |
| "learning_rate": 0.0008134185303514378, | |
| "loss": 0.1883, | |
| "step": 12730 | |
| }, | |
| { | |
| "epoch": 8.14, | |
| "learning_rate": 0.0008140575079872204, | |
| "loss": 0.1863, | |
| "step": 12740 | |
| }, | |
| { | |
| "epoch": 8.15, | |
| "learning_rate": 0.0008146964856230032, | |
| "loss": 0.1934, | |
| "step": 12750 | |
| }, | |
| { | |
| "epoch": 8.15, | |
| "learning_rate": 0.000815335463258786, | |
| "loss": 0.1778, | |
| "step": 12760 | |
| }, | |
| { | |
| "epoch": 8.16, | |
| "learning_rate": 0.0008159744408945687, | |
| "loss": 0.1796, | |
| "step": 12770 | |
| }, | |
| { | |
| "epoch": 8.17, | |
| "learning_rate": 0.0008166134185303514, | |
| "loss": 0.1902, | |
| "step": 12780 | |
| }, | |
| { | |
| "epoch": 8.17, | |
| "learning_rate": 0.0008172523961661343, | |
| "loss": 0.1913, | |
| "step": 12790 | |
| }, | |
| { | |
| "epoch": 8.18, | |
| "learning_rate": 0.0008178913738019169, | |
| "loss": 0.1887, | |
| "step": 12800 | |
| }, | |
| { | |
| "epoch": 8.19, | |
| "learning_rate": 0.0008185303514376997, | |
| "loss": 0.1658, | |
| "step": 12810 | |
| }, | |
| { | |
| "epoch": 8.19, | |
| "learning_rate": 0.0008191693290734825, | |
| "loss": 0.169, | |
| "step": 12820 | |
| }, | |
| { | |
| "epoch": 8.2, | |
| "learning_rate": 0.0008198083067092652, | |
| "loss": 0.1946, | |
| "step": 12830 | |
| }, | |
| { | |
| "epoch": 8.2, | |
| "learning_rate": 0.0008204472843450479, | |
| "loss": 0.1913, | |
| "step": 12840 | |
| }, | |
| { | |
| "epoch": 8.21, | |
| "learning_rate": 0.0008210862619808306, | |
| "loss": 0.2135, | |
| "step": 12850 | |
| }, | |
| { | |
| "epoch": 8.22, | |
| "learning_rate": 0.0008217252396166134, | |
| "loss": 0.1913, | |
| "step": 12860 | |
| }, | |
| { | |
| "epoch": 8.22, | |
| "learning_rate": 0.0008223642172523962, | |
| "loss": 0.1958, | |
| "step": 12870 | |
| }, | |
| { | |
| "epoch": 8.23, | |
| "learning_rate": 0.0008230031948881789, | |
| "loss": 0.2013, | |
| "step": 12880 | |
| }, | |
| { | |
| "epoch": 8.24, | |
| "learning_rate": 0.0008236421725239617, | |
| "loss": 0.2246, | |
| "step": 12890 | |
| }, | |
| { | |
| "epoch": 8.24, | |
| "learning_rate": 0.0008242811501597445, | |
| "loss": 0.2016, | |
| "step": 12900 | |
| }, | |
| { | |
| "epoch": 8.25, | |
| "learning_rate": 0.0008249201277955271, | |
| "loss": 0.1932, | |
| "step": 12910 | |
| }, | |
| { | |
| "epoch": 8.26, | |
| "learning_rate": 0.00082555910543131, | |
| "loss": 0.1766, | |
| "step": 12920 | |
| }, | |
| { | |
| "epoch": 8.26, | |
| "learning_rate": 0.0008261980830670927, | |
| "loss": 0.1959, | |
| "step": 12930 | |
| }, | |
| { | |
| "epoch": 8.27, | |
| "learning_rate": 0.0008268370607028754, | |
| "loss": 0.1978, | |
| "step": 12940 | |
| }, | |
| { | |
| "epoch": 8.27, | |
| "learning_rate": 0.0008274760383386582, | |
| "loss": 0.2187, | |
| "step": 12950 | |
| }, | |
| { | |
| "epoch": 8.28, | |
| "learning_rate": 0.000828115015974441, | |
| "loss": 0.1971, | |
| "step": 12960 | |
| }, | |
| { | |
| "epoch": 8.29, | |
| "learning_rate": 0.0008287539936102236, | |
| "loss": 0.1839, | |
| "step": 12970 | |
| }, | |
| { | |
| "epoch": 8.29, | |
| "learning_rate": 0.0008293929712460064, | |
| "loss": 0.2237, | |
| "step": 12980 | |
| }, | |
| { | |
| "epoch": 8.3, | |
| "learning_rate": 0.0008300319488817891, | |
| "loss": 0.1553, | |
| "step": 12990 | |
| }, | |
| { | |
| "epoch": 8.31, | |
| "learning_rate": 0.0008306709265175719, | |
| "loss": 0.193, | |
| "step": 13000 | |
| }, | |
| { | |
| "epoch": 8.31, | |
| "learning_rate": 0.0008313099041533546, | |
| "loss": 0.2027, | |
| "step": 13010 | |
| }, | |
| { | |
| "epoch": 8.32, | |
| "learning_rate": 0.0008319488817891374, | |
| "loss": 0.1927, | |
| "step": 13020 | |
| }, | |
| { | |
| "epoch": 8.33, | |
| "learning_rate": 0.0008325878594249201, | |
| "loss": 0.2067, | |
| "step": 13030 | |
| }, | |
| { | |
| "epoch": 8.33, | |
| "learning_rate": 0.0008332268370607029, | |
| "loss": 0.2119, | |
| "step": 13040 | |
| }, | |
| { | |
| "epoch": 8.34, | |
| "learning_rate": 0.0008338658146964856, | |
| "loss": 0.2125, | |
| "step": 13050 | |
| }, | |
| { | |
| "epoch": 8.34, | |
| "learning_rate": 0.0008345047923322684, | |
| "loss": 0.2148, | |
| "step": 13060 | |
| }, | |
| { | |
| "epoch": 8.35, | |
| "learning_rate": 0.0008351437699680511, | |
| "loss": 0.1722, | |
| "step": 13070 | |
| }, | |
| { | |
| "epoch": 8.36, | |
| "learning_rate": 0.0008357827476038338, | |
| "loss": 0.212, | |
| "step": 13080 | |
| }, | |
| { | |
| "epoch": 8.36, | |
| "learning_rate": 0.0008364217252396167, | |
| "loss": 0.2077, | |
| "step": 13090 | |
| }, | |
| { | |
| "epoch": 8.37, | |
| "learning_rate": 0.0008370607028753994, | |
| "loss": 0.2223, | |
| "step": 13100 | |
| }, | |
| { | |
| "epoch": 8.38, | |
| "learning_rate": 0.0008376996805111821, | |
| "loss": 0.2055, | |
| "step": 13110 | |
| }, | |
| { | |
| "epoch": 8.38, | |
| "learning_rate": 0.0008383386581469649, | |
| "loss": 0.1995, | |
| "step": 13120 | |
| }, | |
| { | |
| "epoch": 8.39, | |
| "learning_rate": 0.0008389776357827477, | |
| "loss": 0.176, | |
| "step": 13130 | |
| }, | |
| { | |
| "epoch": 8.4, | |
| "learning_rate": 0.0008396166134185303, | |
| "loss": 0.2049, | |
| "step": 13140 | |
| }, | |
| { | |
| "epoch": 8.4, | |
| "learning_rate": 0.0008402555910543132, | |
| "loss": 0.2177, | |
| "step": 13150 | |
| }, | |
| { | |
| "epoch": 8.41, | |
| "learning_rate": 0.0008408945686900958, | |
| "loss": 0.1961, | |
| "step": 13160 | |
| }, | |
| { | |
| "epoch": 8.42, | |
| "learning_rate": 0.0008415335463258786, | |
| "loss": 0.2094, | |
| "step": 13170 | |
| }, | |
| { | |
| "epoch": 8.42, | |
| "learning_rate": 0.0008421725239616614, | |
| "loss": 0.2121, | |
| "step": 13180 | |
| }, | |
| { | |
| "epoch": 8.43, | |
| "learning_rate": 0.0008428115015974441, | |
| "loss": 0.1996, | |
| "step": 13190 | |
| }, | |
| { | |
| "epoch": 8.43, | |
| "learning_rate": 0.0008434504792332268, | |
| "loss": 0.1836, | |
| "step": 13200 | |
| }, | |
| { | |
| "epoch": 8.44, | |
| "learning_rate": 0.0008440894568690097, | |
| "loss": 0.1804, | |
| "step": 13210 | |
| }, | |
| { | |
| "epoch": 8.45, | |
| "learning_rate": 0.0008447284345047923, | |
| "loss": 0.2604, | |
| "step": 13220 | |
| }, | |
| { | |
| "epoch": 8.45, | |
| "learning_rate": 0.0008453674121405751, | |
| "loss": 0.2071, | |
| "step": 13230 | |
| }, | |
| { | |
| "epoch": 8.46, | |
| "learning_rate": 0.0008460063897763578, | |
| "loss": 0.2113, | |
| "step": 13240 | |
| }, | |
| { | |
| "epoch": 8.47, | |
| "learning_rate": 0.0008466453674121406, | |
| "loss": 0.1961, | |
| "step": 13250 | |
| }, | |
| { | |
| "epoch": 8.47, | |
| "learning_rate": 0.0008472843450479233, | |
| "loss": 0.2149, | |
| "step": 13260 | |
| }, | |
| { | |
| "epoch": 8.48, | |
| "learning_rate": 0.0008479233226837061, | |
| "loss": 0.2112, | |
| "step": 13270 | |
| }, | |
| { | |
| "epoch": 8.49, | |
| "learning_rate": 0.0008485623003194889, | |
| "loss": 0.2003, | |
| "step": 13280 | |
| }, | |
| { | |
| "epoch": 8.49, | |
| "learning_rate": 0.0008492012779552716, | |
| "loss": 0.2098, | |
| "step": 13290 | |
| }, | |
| { | |
| "epoch": 8.5, | |
| "learning_rate": 0.0008498402555910543, | |
| "loss": 0.1986, | |
| "step": 13300 | |
| }, | |
| { | |
| "epoch": 8.5, | |
| "learning_rate": 0.000850479233226837, | |
| "loss": 0.2055, | |
| "step": 13310 | |
| }, | |
| { | |
| "epoch": 8.51, | |
| "learning_rate": 0.0008511182108626199, | |
| "loss": 0.169, | |
| "step": 13320 | |
| }, | |
| { | |
| "epoch": 8.52, | |
| "learning_rate": 0.0008517571884984025, | |
| "loss": 0.2417, | |
| "step": 13330 | |
| }, | |
| { | |
| "epoch": 8.52, | |
| "learning_rate": 0.0008523961661341853, | |
| "loss": 0.2163, | |
| "step": 13340 | |
| }, | |
| { | |
| "epoch": 8.53, | |
| "learning_rate": 0.0008530351437699681, | |
| "loss": 0.1996, | |
| "step": 13350 | |
| }, | |
| { | |
| "epoch": 8.54, | |
| "learning_rate": 0.0008536741214057508, | |
| "loss": 0.1736, | |
| "step": 13360 | |
| }, | |
| { | |
| "epoch": 8.54, | |
| "learning_rate": 0.0008543130990415335, | |
| "loss": 0.204, | |
| "step": 13370 | |
| }, | |
| { | |
| "epoch": 8.55, | |
| "learning_rate": 0.0008549520766773164, | |
| "loss": 0.2189, | |
| "step": 13380 | |
| }, | |
| { | |
| "epoch": 8.56, | |
| "learning_rate": 0.000855591054313099, | |
| "loss": 0.1797, | |
| "step": 13390 | |
| }, | |
| { | |
| "epoch": 8.56, | |
| "learning_rate": 0.0008562300319488818, | |
| "loss": 0.1723, | |
| "step": 13400 | |
| }, | |
| { | |
| "epoch": 8.57, | |
| "learning_rate": 0.0008568690095846646, | |
| "loss": 0.2189, | |
| "step": 13410 | |
| }, | |
| { | |
| "epoch": 8.57, | |
| "learning_rate": 0.0008575079872204473, | |
| "loss": 0.2004, | |
| "step": 13420 | |
| }, | |
| { | |
| "epoch": 8.58, | |
| "learning_rate": 0.00085814696485623, | |
| "loss": 0.2102, | |
| "step": 13430 | |
| }, | |
| { | |
| "epoch": 8.59, | |
| "learning_rate": 0.0008587859424920129, | |
| "loss": 0.173, | |
| "step": 13440 | |
| }, | |
| { | |
| "epoch": 8.59, | |
| "learning_rate": 0.0008594249201277955, | |
| "loss": 0.2067, | |
| "step": 13450 | |
| }, | |
| { | |
| "epoch": 8.6, | |
| "learning_rate": 0.0008600638977635783, | |
| "loss": 0.2229, | |
| "step": 13460 | |
| }, | |
| { | |
| "epoch": 8.61, | |
| "learning_rate": 0.0008607028753993609, | |
| "loss": 0.2101, | |
| "step": 13470 | |
| }, | |
| { | |
| "epoch": 8.61, | |
| "learning_rate": 0.0008613418530351438, | |
| "loss": 0.1975, | |
| "step": 13480 | |
| }, | |
| { | |
| "epoch": 8.62, | |
| "learning_rate": 0.0008619808306709266, | |
| "loss": 0.1821, | |
| "step": 13490 | |
| }, | |
| { | |
| "epoch": 8.63, | |
| "learning_rate": 0.0008626198083067092, | |
| "loss": 0.244, | |
| "step": 13500 | |
| }, | |
| { | |
| "epoch": 8.63, | |
| "learning_rate": 0.0008632587859424921, | |
| "loss": 0.1859, | |
| "step": 13510 | |
| }, | |
| { | |
| "epoch": 8.64, | |
| "learning_rate": 0.0008638977635782748, | |
| "loss": 0.178, | |
| "step": 13520 | |
| }, | |
| { | |
| "epoch": 8.65, | |
| "learning_rate": 0.0008645367412140575, | |
| "loss": 0.2166, | |
| "step": 13530 | |
| }, | |
| { | |
| "epoch": 8.65, | |
| "learning_rate": 0.0008651757188498403, | |
| "loss": 0.166, | |
| "step": 13540 | |
| }, | |
| { | |
| "epoch": 8.66, | |
| "learning_rate": 0.0008658146964856231, | |
| "loss": 0.1821, | |
| "step": 13550 | |
| }, | |
| { | |
| "epoch": 8.66, | |
| "learning_rate": 0.0008664536741214057, | |
| "loss": 0.1787, | |
| "step": 13560 | |
| }, | |
| { | |
| "epoch": 8.67, | |
| "learning_rate": 0.0008670926517571886, | |
| "loss": 0.1851, | |
| "step": 13570 | |
| }, | |
| { | |
| "epoch": 8.68, | |
| "learning_rate": 0.0008677316293929713, | |
| "loss": 0.181, | |
| "step": 13580 | |
| }, | |
| { | |
| "epoch": 8.68, | |
| "learning_rate": 0.000868370607028754, | |
| "loss": 0.1952, | |
| "step": 13590 | |
| }, | |
| { | |
| "epoch": 8.69, | |
| "learning_rate": 0.0008690095846645367, | |
| "loss": 0.1873, | |
| "step": 13600 | |
| }, | |
| { | |
| "epoch": 8.7, | |
| "learning_rate": 0.0008696485623003195, | |
| "loss": 0.212, | |
| "step": 13610 | |
| }, | |
| { | |
| "epoch": 8.7, | |
| "learning_rate": 0.0008702875399361022, | |
| "loss": 0.2072, | |
| "step": 13620 | |
| }, | |
| { | |
| "epoch": 8.71, | |
| "learning_rate": 0.000870926517571885, | |
| "loss": 0.2092, | |
| "step": 13630 | |
| }, | |
| { | |
| "epoch": 8.72, | |
| "learning_rate": 0.0008715654952076677, | |
| "loss": 0.2119, | |
| "step": 13640 | |
| }, | |
| { | |
| "epoch": 8.72, | |
| "learning_rate": 0.0008722044728434505, | |
| "loss": 0.2139, | |
| "step": 13650 | |
| }, | |
| { | |
| "epoch": 8.73, | |
| "learning_rate": 0.0008728434504792332, | |
| "loss": 0.1895, | |
| "step": 13660 | |
| }, | |
| { | |
| "epoch": 8.73, | |
| "learning_rate": 0.000873482428115016, | |
| "loss": 0.2178, | |
| "step": 13670 | |
| }, | |
| { | |
| "epoch": 8.74, | |
| "learning_rate": 0.0008741214057507988, | |
| "loss": 0.229, | |
| "step": 13680 | |
| }, | |
| { | |
| "epoch": 8.75, | |
| "learning_rate": 0.0008747603833865815, | |
| "loss": 0.2104, | |
| "step": 13690 | |
| }, | |
| { | |
| "epoch": 8.75, | |
| "learning_rate": 0.0008753993610223643, | |
| "loss": 0.2215, | |
| "step": 13700 | |
| }, | |
| { | |
| "epoch": 8.76, | |
| "learning_rate": 0.000876038338658147, | |
| "loss": 0.1943, | |
| "step": 13710 | |
| }, | |
| { | |
| "epoch": 8.77, | |
| "learning_rate": 0.0008766773162939298, | |
| "loss": 0.2193, | |
| "step": 13720 | |
| }, | |
| { | |
| "epoch": 8.77, | |
| "learning_rate": 0.0008773162939297124, | |
| "loss": 0.2294, | |
| "step": 13730 | |
| }, | |
| { | |
| "epoch": 8.78, | |
| "learning_rate": 0.0008779552715654953, | |
| "loss": 0.1998, | |
| "step": 13740 | |
| }, | |
| { | |
| "epoch": 8.79, | |
| "learning_rate": 0.0008785942492012779, | |
| "loss": 0.2152, | |
| "step": 13750 | |
| }, | |
| { | |
| "epoch": 8.79, | |
| "learning_rate": 0.0008792332268370607, | |
| "loss": 0.1832, | |
| "step": 13760 | |
| }, | |
| { | |
| "epoch": 8.8, | |
| "learning_rate": 0.0008798722044728435, | |
| "loss": 0.2159, | |
| "step": 13770 | |
| }, | |
| { | |
| "epoch": 8.8, | |
| "learning_rate": 0.0008805111821086262, | |
| "loss": 0.2204, | |
| "step": 13780 | |
| }, | |
| { | |
| "epoch": 8.81, | |
| "learning_rate": 0.0008811501597444089, | |
| "loss": 0.224, | |
| "step": 13790 | |
| }, | |
| { | |
| "epoch": 8.82, | |
| "learning_rate": 0.0008817891373801918, | |
| "loss": 0.2238, | |
| "step": 13800 | |
| }, | |
| { | |
| "epoch": 8.82, | |
| "learning_rate": 0.0008824281150159744, | |
| "loss": 0.2188, | |
| "step": 13810 | |
| }, | |
| { | |
| "epoch": 8.83, | |
| "learning_rate": 0.0008830670926517572, | |
| "loss": 0.2244, | |
| "step": 13820 | |
| }, | |
| { | |
| "epoch": 8.84, | |
| "learning_rate": 0.00088370607028754, | |
| "loss": 0.193, | |
| "step": 13830 | |
| }, | |
| { | |
| "epoch": 8.84, | |
| "learning_rate": 0.0008843450479233227, | |
| "loss": 0.2003, | |
| "step": 13840 | |
| }, | |
| { | |
| "epoch": 8.85, | |
| "learning_rate": 0.0008849840255591054, | |
| "loss": 0.2043, | |
| "step": 13850 | |
| }, | |
| { | |
| "epoch": 8.86, | |
| "learning_rate": 0.0008856230031948882, | |
| "loss": 0.2051, | |
| "step": 13860 | |
| }, | |
| { | |
| "epoch": 8.86, | |
| "learning_rate": 0.000886261980830671, | |
| "loss": 0.183, | |
| "step": 13870 | |
| }, | |
| { | |
| "epoch": 8.87, | |
| "learning_rate": 0.0008869009584664537, | |
| "loss": 0.2322, | |
| "step": 13880 | |
| }, | |
| { | |
| "epoch": 8.88, | |
| "learning_rate": 0.0008875399361022365, | |
| "loss": 0.2282, | |
| "step": 13890 | |
| }, | |
| { | |
| "epoch": 8.88, | |
| "learning_rate": 0.0008881789137380192, | |
| "loss": 0.196, | |
| "step": 13900 | |
| }, | |
| { | |
| "epoch": 8.89, | |
| "learning_rate": 0.000888817891373802, | |
| "loss": 0.1948, | |
| "step": 13910 | |
| }, | |
| { | |
| "epoch": 8.89, | |
| "learning_rate": 0.0008894568690095846, | |
| "loss": 0.2252, | |
| "step": 13920 | |
| }, | |
| { | |
| "epoch": 8.9, | |
| "learning_rate": 0.0008900958466453675, | |
| "loss": 0.2003, | |
| "step": 13930 | |
| }, | |
| { | |
| "epoch": 8.91, | |
| "learning_rate": 0.0008907348242811502, | |
| "loss": 0.2181, | |
| "step": 13940 | |
| }, | |
| { | |
| "epoch": 8.91, | |
| "learning_rate": 0.0008913738019169329, | |
| "loss": 0.2073, | |
| "step": 13950 | |
| }, | |
| { | |
| "epoch": 8.92, | |
| "learning_rate": 0.0008920127795527156, | |
| "loss": 0.2436, | |
| "step": 13960 | |
| }, | |
| { | |
| "epoch": 8.93, | |
| "learning_rate": 0.0008926517571884985, | |
| "loss": 0.1896, | |
| "step": 13970 | |
| }, | |
| { | |
| "epoch": 8.93, | |
| "learning_rate": 0.0008932907348242811, | |
| "loss": 0.201, | |
| "step": 13980 | |
| }, | |
| { | |
| "epoch": 8.94, | |
| "learning_rate": 0.0008939297124600639, | |
| "loss": 0.2023, | |
| "step": 13990 | |
| }, | |
| { | |
| "epoch": 8.95, | |
| "learning_rate": 0.0008945686900958467, | |
| "loss": 0.2138, | |
| "step": 14000 | |
| }, | |
| { | |
| "epoch": 8.95, | |
| "learning_rate": 0.0008952076677316294, | |
| "loss": 0.2247, | |
| "step": 14010 | |
| }, | |
| { | |
| "epoch": 8.96, | |
| "learning_rate": 0.0008958466453674121, | |
| "loss": 0.2329, | |
| "step": 14020 | |
| }, | |
| { | |
| "epoch": 8.96, | |
| "learning_rate": 0.000896485623003195, | |
| "loss": 0.1843, | |
| "step": 14030 | |
| }, | |
| { | |
| "epoch": 8.97, | |
| "learning_rate": 0.0008971246006389776, | |
| "loss": 0.1895, | |
| "step": 14040 | |
| }, | |
| { | |
| "epoch": 8.98, | |
| "learning_rate": 0.0008977635782747604, | |
| "loss": 0.1814, | |
| "step": 14050 | |
| }, | |
| { | |
| "epoch": 8.98, | |
| "learning_rate": 0.000898402555910543, | |
| "loss": 0.2078, | |
| "step": 14060 | |
| }, | |
| { | |
| "epoch": 8.99, | |
| "learning_rate": 0.0008990415335463259, | |
| "loss": 0.2324, | |
| "step": 14070 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "learning_rate": 0.0008996805111821087, | |
| "loss": 0.2346, | |
| "step": 14080 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "learning_rate": 0.0009003194888178913, | |
| "loss": 0.2024, | |
| "step": 14090 | |
| }, | |
| { | |
| "epoch": 9.01, | |
| "learning_rate": 0.0009009584664536742, | |
| "loss": 0.174, | |
| "step": 14100 | |
| }, | |
| { | |
| "epoch": 9.02, | |
| "learning_rate": 0.0009015974440894569, | |
| "loss": 0.1736, | |
| "step": 14110 | |
| }, | |
| { | |
| "epoch": 9.02, | |
| "learning_rate": 0.0009022364217252396, | |
| "loss": 0.2153, | |
| "step": 14120 | |
| }, | |
| { | |
| "epoch": 9.03, | |
| "learning_rate": 0.0009028753993610224, | |
| "loss": 0.1848, | |
| "step": 14130 | |
| }, | |
| { | |
| "epoch": 9.04, | |
| "learning_rate": 0.0009035143769968052, | |
| "loss": 0.1719, | |
| "step": 14140 | |
| }, | |
| { | |
| "epoch": 9.04, | |
| "learning_rate": 0.0009041533546325878, | |
| "loss": 0.1904, | |
| "step": 14150 | |
| }, | |
| { | |
| "epoch": 9.05, | |
| "learning_rate": 0.0009047923322683707, | |
| "loss": 0.1692, | |
| "step": 14160 | |
| }, | |
| { | |
| "epoch": 9.05, | |
| "learning_rate": 0.0009054313099041534, | |
| "loss": 0.1367, | |
| "step": 14170 | |
| }, | |
| { | |
| "epoch": 9.06, | |
| "learning_rate": 0.0009060702875399361, | |
| "loss": 0.1853, | |
| "step": 14180 | |
| }, | |
| { | |
| "epoch": 9.07, | |
| "learning_rate": 0.0009067092651757188, | |
| "loss": 0.1945, | |
| "step": 14190 | |
| }, | |
| { | |
| "epoch": 9.07, | |
| "learning_rate": 0.0009073482428115017, | |
| "loss": 0.1827, | |
| "step": 14200 | |
| }, | |
| { | |
| "epoch": 9.08, | |
| "learning_rate": 0.0009079872204472843, | |
| "loss": 0.1927, | |
| "step": 14210 | |
| }, | |
| { | |
| "epoch": 9.09, | |
| "learning_rate": 0.0009086261980830671, | |
| "loss": 0.1513, | |
| "step": 14220 | |
| }, | |
| { | |
| "epoch": 9.09, | |
| "learning_rate": 0.0009092651757188498, | |
| "loss": 0.2149, | |
| "step": 14230 | |
| }, | |
| { | |
| "epoch": 9.1, | |
| "learning_rate": 0.0009099041533546326, | |
| "loss": 0.1609, | |
| "step": 14240 | |
| }, | |
| { | |
| "epoch": 9.11, | |
| "learning_rate": 0.0009105431309904153, | |
| "loss": 0.1814, | |
| "step": 14250 | |
| }, | |
| { | |
| "epoch": 9.11, | |
| "learning_rate": 0.0009111821086261981, | |
| "loss": 0.192, | |
| "step": 14260 | |
| }, | |
| { | |
| "epoch": 9.12, | |
| "learning_rate": 0.0009118210862619809, | |
| "loss": 0.2028, | |
| "step": 14270 | |
| }, | |
| { | |
| "epoch": 9.12, | |
| "learning_rate": 0.0009124600638977636, | |
| "loss": 0.1814, | |
| "step": 14280 | |
| }, | |
| { | |
| "epoch": 9.13, | |
| "learning_rate": 0.0009130990415335464, | |
| "loss": 0.1721, | |
| "step": 14290 | |
| }, | |
| { | |
| "epoch": 9.14, | |
| "learning_rate": 0.0009137380191693291, | |
| "loss": 0.1894, | |
| "step": 14300 | |
| }, | |
| { | |
| "epoch": 9.14, | |
| "learning_rate": 0.0009143769968051119, | |
| "loss": 0.1716, | |
| "step": 14310 | |
| }, | |
| { | |
| "epoch": 9.15, | |
| "learning_rate": 0.0009150159744408945, | |
| "loss": 0.1957, | |
| "step": 14320 | |
| }, | |
| { | |
| "epoch": 9.16, | |
| "learning_rate": 0.0009156549520766774, | |
| "loss": 0.1671, | |
| "step": 14330 | |
| }, | |
| { | |
| "epoch": 9.16, | |
| "learning_rate": 0.0009162939297124601, | |
| "loss": 0.1852, | |
| "step": 14340 | |
| }, | |
| { | |
| "epoch": 9.17, | |
| "learning_rate": 0.0009169329073482428, | |
| "loss": 0.2002, | |
| "step": 14350 | |
| }, | |
| { | |
| "epoch": 9.18, | |
| "learning_rate": 0.0009175718849840256, | |
| "loss": 0.1912, | |
| "step": 14360 | |
| }, | |
| { | |
| "epoch": 9.18, | |
| "learning_rate": 0.0009182108626198083, | |
| "loss": 0.1929, | |
| "step": 14370 | |
| }, | |
| { | |
| "epoch": 9.19, | |
| "learning_rate": 0.000918849840255591, | |
| "loss": 0.1772, | |
| "step": 14380 | |
| }, | |
| { | |
| "epoch": 9.19, | |
| "learning_rate": 0.0009194888178913739, | |
| "loss": 0.1767, | |
| "step": 14390 | |
| }, | |
| { | |
| "epoch": 9.2, | |
| "learning_rate": 0.0009201277955271565, | |
| "loss": 0.1999, | |
| "step": 14400 | |
| }, | |
| { | |
| "epoch": 9.21, | |
| "learning_rate": 0.0009207667731629393, | |
| "loss": 0.2022, | |
| "step": 14410 | |
| }, | |
| { | |
| "epoch": 9.21, | |
| "learning_rate": 0.000921405750798722, | |
| "loss": 0.2222, | |
| "step": 14420 | |
| }, | |
| { | |
| "epoch": 9.22, | |
| "learning_rate": 0.0009220447284345048, | |
| "loss": 0.1796, | |
| "step": 14430 | |
| }, | |
| { | |
| "epoch": 9.23, | |
| "learning_rate": 0.0009226837060702875, | |
| "loss": 0.197, | |
| "step": 14440 | |
| }, | |
| { | |
| "epoch": 9.23, | |
| "learning_rate": 0.0009233226837060703, | |
| "loss": 0.1699, | |
| "step": 14450 | |
| }, | |
| { | |
| "epoch": 9.24, | |
| "learning_rate": 0.000923961661341853, | |
| "loss": 0.1662, | |
| "step": 14460 | |
| }, | |
| { | |
| "epoch": 9.25, | |
| "learning_rate": 0.0009246006389776358, | |
| "loss": 0.1596, | |
| "step": 14470 | |
| }, | |
| { | |
| "epoch": 9.25, | |
| "learning_rate": 0.0009252396166134186, | |
| "loss": 0.1826, | |
| "step": 14480 | |
| }, | |
| { | |
| "epoch": 9.26, | |
| "learning_rate": 0.0009258785942492013, | |
| "loss": 0.1801, | |
| "step": 14490 | |
| }, | |
| { | |
| "epoch": 9.27, | |
| "learning_rate": 0.0009265175718849841, | |
| "loss": 0.217, | |
| "step": 14500 | |
| }, | |
| { | |
| "epoch": 9.27, | |
| "learning_rate": 0.0009271565495207667, | |
| "loss": 0.1575, | |
| "step": 14510 | |
| }, | |
| { | |
| "epoch": 9.28, | |
| "learning_rate": 0.0009277955271565496, | |
| "loss": 0.2204, | |
| "step": 14520 | |
| }, | |
| { | |
| "epoch": 9.28, | |
| "learning_rate": 0.0009284345047923323, | |
| "loss": 0.1904, | |
| "step": 14530 | |
| }, | |
| { | |
| "epoch": 9.29, | |
| "learning_rate": 0.000929073482428115, | |
| "loss": 0.1612, | |
| "step": 14540 | |
| }, | |
| { | |
| "epoch": 9.3, | |
| "learning_rate": 0.0009297124600638978, | |
| "loss": 0.2108, | |
| "step": 14550 | |
| }, | |
| { | |
| "epoch": 9.3, | |
| "learning_rate": 0.0009303514376996806, | |
| "loss": 0.2171, | |
| "step": 14560 | |
| }, | |
| { | |
| "epoch": 9.31, | |
| "learning_rate": 0.0009309904153354632, | |
| "loss": 0.1911, | |
| "step": 14570 | |
| }, | |
| { | |
| "epoch": 9.32, | |
| "learning_rate": 0.000931629392971246, | |
| "loss": 0.2062, | |
| "step": 14580 | |
| }, | |
| { | |
| "epoch": 9.32, | |
| "learning_rate": 0.0009322683706070288, | |
| "loss": 0.2073, | |
| "step": 14590 | |
| }, | |
| { | |
| "epoch": 9.33, | |
| "learning_rate": 0.0009329073482428115, | |
| "loss": 0.2118, | |
| "step": 14600 | |
| }, | |
| { | |
| "epoch": 9.34, | |
| "learning_rate": 0.0009335463258785942, | |
| "loss": 0.1814, | |
| "step": 14610 | |
| }, | |
| { | |
| "epoch": 9.34, | |
| "learning_rate": 0.0009341853035143771, | |
| "loss": 0.1654, | |
| "step": 14620 | |
| }, | |
| { | |
| "epoch": 9.35, | |
| "learning_rate": 0.0009348242811501597, | |
| "loss": 0.1794, | |
| "step": 14630 | |
| }, | |
| { | |
| "epoch": 9.35, | |
| "learning_rate": 0.0009354632587859425, | |
| "loss": 0.199, | |
| "step": 14640 | |
| }, | |
| { | |
| "epoch": 9.36, | |
| "learning_rate": 0.0009361022364217253, | |
| "loss": 0.1785, | |
| "step": 14650 | |
| }, | |
| { | |
| "epoch": 9.37, | |
| "learning_rate": 0.000936741214057508, | |
| "loss": 0.222, | |
| "step": 14660 | |
| }, | |
| { | |
| "epoch": 9.37, | |
| "learning_rate": 0.0009373801916932908, | |
| "loss": 0.2213, | |
| "step": 14670 | |
| }, | |
| { | |
| "epoch": 9.38, | |
| "learning_rate": 0.0009380191693290734, | |
| "loss": 0.1864, | |
| "step": 14680 | |
| }, | |
| { | |
| "epoch": 9.39, | |
| "learning_rate": 0.0009386581469648563, | |
| "loss": 0.1973, | |
| "step": 14690 | |
| }, | |
| { | |
| "epoch": 9.39, | |
| "learning_rate": 0.000939297124600639, | |
| "loss": 0.2027, | |
| "step": 14700 | |
| }, | |
| { | |
| "epoch": 9.4, | |
| "learning_rate": 0.0009399361022364217, | |
| "loss": 0.2115, | |
| "step": 14710 | |
| }, | |
| { | |
| "epoch": 9.41, | |
| "learning_rate": 0.0009405750798722045, | |
| "loss": 0.207, | |
| "step": 14720 | |
| }, | |
| { | |
| "epoch": 9.41, | |
| "learning_rate": 0.0009412140575079873, | |
| "loss": 0.1878, | |
| "step": 14730 | |
| }, | |
| { | |
| "epoch": 9.42, | |
| "learning_rate": 0.0009418530351437699, | |
| "loss": 0.1794, | |
| "step": 14740 | |
| }, | |
| { | |
| "epoch": 9.42, | |
| "learning_rate": 0.0009424920127795528, | |
| "loss": 0.2063, | |
| "step": 14750 | |
| }, | |
| { | |
| "epoch": 9.43, | |
| "learning_rate": 0.0009431309904153355, | |
| "loss": 0.2194, | |
| "step": 14760 | |
| }, | |
| { | |
| "epoch": 9.44, | |
| "learning_rate": 0.0009437699680511182, | |
| "loss": 0.1841, | |
| "step": 14770 | |
| }, | |
| { | |
| "epoch": 9.44, | |
| "learning_rate": 0.000944408945686901, | |
| "loss": 0.2375, | |
| "step": 14780 | |
| }, | |
| { | |
| "epoch": 9.45, | |
| "learning_rate": 0.0009450479233226838, | |
| "loss": 0.1869, | |
| "step": 14790 | |
| }, | |
| { | |
| "epoch": 9.46, | |
| "learning_rate": 0.0009456869009584664, | |
| "loss": 0.1953, | |
| "step": 14800 | |
| }, | |
| { | |
| "epoch": 9.46, | |
| "learning_rate": 0.0009463258785942493, | |
| "loss": 0.202, | |
| "step": 14810 | |
| }, | |
| { | |
| "epoch": 9.47, | |
| "learning_rate": 0.0009469648562300319, | |
| "loss": 0.2095, | |
| "step": 14820 | |
| }, | |
| { | |
| "epoch": 9.48, | |
| "learning_rate": 0.0009476038338658147, | |
| "loss": 0.1894, | |
| "step": 14830 | |
| }, | |
| { | |
| "epoch": 9.48, | |
| "learning_rate": 0.0009482428115015974, | |
| "loss": 0.2249, | |
| "step": 14840 | |
| }, | |
| { | |
| "epoch": 9.49, | |
| "learning_rate": 0.0009488817891373802, | |
| "loss": 0.1649, | |
| "step": 14850 | |
| }, | |
| { | |
| "epoch": 9.5, | |
| "learning_rate": 0.000949520766773163, | |
| "loss": 0.1917, | |
| "step": 14860 | |
| }, | |
| { | |
| "epoch": 9.5, | |
| "learning_rate": 0.0009501597444089457, | |
| "loss": 0.1856, | |
| "step": 14870 | |
| }, | |
| { | |
| "epoch": 9.51, | |
| "learning_rate": 0.0009507987220447285, | |
| "loss": 0.2134, | |
| "step": 14880 | |
| }, | |
| { | |
| "epoch": 9.51, | |
| "learning_rate": 0.0009514376996805112, | |
| "loss": 0.2183, | |
| "step": 14890 | |
| }, | |
| { | |
| "epoch": 9.52, | |
| "learning_rate": 0.000952076677316294, | |
| "loss": 0.2113, | |
| "step": 14900 | |
| }, | |
| { | |
| "epoch": 9.53, | |
| "learning_rate": 0.0009527156549520767, | |
| "loss": 0.1836, | |
| "step": 14910 | |
| }, | |
| { | |
| "epoch": 9.53, | |
| "learning_rate": 0.0009533546325878595, | |
| "loss": 0.1806, | |
| "step": 14920 | |
| }, | |
| { | |
| "epoch": 9.54, | |
| "learning_rate": 0.0009539936102236422, | |
| "loss": 0.2051, | |
| "step": 14930 | |
| }, | |
| { | |
| "epoch": 9.55, | |
| "learning_rate": 0.000954632587859425, | |
| "loss": 0.1987, | |
| "step": 14940 | |
| }, | |
| { | |
| "epoch": 9.55, | |
| "learning_rate": 0.0009552715654952077, | |
| "loss": 0.2183, | |
| "step": 14950 | |
| }, | |
| { | |
| "epoch": 9.56, | |
| "learning_rate": 0.0009559105431309905, | |
| "loss": 0.188, | |
| "step": 14960 | |
| }, | |
| { | |
| "epoch": 9.57, | |
| "learning_rate": 0.0009565495207667731, | |
| "loss": 0.2088, | |
| "step": 14970 | |
| }, | |
| { | |
| "epoch": 9.57, | |
| "learning_rate": 0.000957188498402556, | |
| "loss": 0.2153, | |
| "step": 14980 | |
| }, | |
| { | |
| "epoch": 9.58, | |
| "learning_rate": 0.0009578274760383386, | |
| "loss": 0.2069, | |
| "step": 14990 | |
| }, | |
| { | |
| "epoch": 9.58, | |
| "learning_rate": 0.0009584664536741214, | |
| "loss": 0.1698, | |
| "step": 15000 | |
| }, | |
| { | |
| "epoch": 9.59, | |
| "learning_rate": 0.0009591054313099042, | |
| "loss": 0.205, | |
| "step": 15010 | |
| }, | |
| { | |
| "epoch": 9.6, | |
| "learning_rate": 0.0009597444089456869, | |
| "loss": 0.1753, | |
| "step": 15020 | |
| }, | |
| { | |
| "epoch": 9.6, | |
| "learning_rate": 0.0009603833865814696, | |
| "loss": 0.1908, | |
| "step": 15030 | |
| }, | |
| { | |
| "epoch": 9.61, | |
| "learning_rate": 0.0009610223642172525, | |
| "loss": 0.1935, | |
| "step": 15040 | |
| }, | |
| { | |
| "epoch": 9.62, | |
| "learning_rate": 0.0009616613418530351, | |
| "loss": 0.2243, | |
| "step": 15050 | |
| }, | |
| { | |
| "epoch": 9.62, | |
| "learning_rate": 0.0009623003194888179, | |
| "loss": 0.2018, | |
| "step": 15060 | |
| }, | |
| { | |
| "epoch": 9.63, | |
| "learning_rate": 0.0009629392971246008, | |
| "loss": 0.2062, | |
| "step": 15070 | |
| }, | |
| { | |
| "epoch": 9.64, | |
| "learning_rate": 0.0009635782747603834, | |
| "loss": 0.2033, | |
| "step": 15080 | |
| }, | |
| { | |
| "epoch": 9.64, | |
| "learning_rate": 0.0009642172523961662, | |
| "loss": 0.1993, | |
| "step": 15090 | |
| }, | |
| { | |
| "epoch": 9.65, | |
| "learning_rate": 0.0009648562300319489, | |
| "loss": 0.1946, | |
| "step": 15100 | |
| }, | |
| { | |
| "epoch": 9.65, | |
| "learning_rate": 0.0009654952076677317, | |
| "loss": 0.2113, | |
| "step": 15110 | |
| }, | |
| { | |
| "epoch": 9.66, | |
| "learning_rate": 0.0009661341853035144, | |
| "loss": 0.2004, | |
| "step": 15120 | |
| }, | |
| { | |
| "epoch": 9.67, | |
| "learning_rate": 0.0009667731629392971, | |
| "loss": 0.21, | |
| "step": 15130 | |
| }, | |
| { | |
| "epoch": 9.67, | |
| "learning_rate": 0.0009674121405750799, | |
| "loss": 0.1794, | |
| "step": 15140 | |
| }, | |
| { | |
| "epoch": 9.68, | |
| "learning_rate": 0.0009680511182108627, | |
| "loss": 0.2395, | |
| "step": 15150 | |
| }, | |
| { | |
| "epoch": 9.69, | |
| "learning_rate": 0.0009686900958466453, | |
| "loss": 0.2506, | |
| "step": 15160 | |
| }, | |
| { | |
| "epoch": 9.69, | |
| "learning_rate": 0.0009693290734824282, | |
| "loss": 0.1916, | |
| "step": 15170 | |
| }, | |
| { | |
| "epoch": 9.7, | |
| "learning_rate": 0.0009699680511182109, | |
| "loss": 0.1933, | |
| "step": 15180 | |
| }, | |
| { | |
| "epoch": 9.71, | |
| "learning_rate": 0.0009706070287539936, | |
| "loss": 0.2162, | |
| "step": 15190 | |
| }, | |
| { | |
| "epoch": 9.71, | |
| "learning_rate": 0.0009712460063897763, | |
| "loss": 0.221, | |
| "step": 15200 | |
| }, | |
| { | |
| "epoch": 9.72, | |
| "learning_rate": 0.0009718849840255592, | |
| "loss": 0.1934, | |
| "step": 15210 | |
| }, | |
| { | |
| "epoch": 9.73, | |
| "learning_rate": 0.0009725239616613418, | |
| "loss": 0.1856, | |
| "step": 15220 | |
| }, | |
| { | |
| "epoch": 9.73, | |
| "learning_rate": 0.0009731629392971246, | |
| "loss": 0.1951, | |
| "step": 15230 | |
| }, | |
| { | |
| "epoch": 9.74, | |
| "learning_rate": 0.0009738019169329074, | |
| "loss": 0.1962, | |
| "step": 15240 | |
| }, | |
| { | |
| "epoch": 9.74, | |
| "learning_rate": 0.0009744408945686901, | |
| "loss": 0.1947, | |
| "step": 15250 | |
| }, | |
| { | |
| "epoch": 9.75, | |
| "learning_rate": 0.0009750798722044729, | |
| "loss": 0.217, | |
| "step": 15260 | |
| }, | |
| { | |
| "epoch": 9.76, | |
| "learning_rate": 0.0009757188498402556, | |
| "loss": 0.2092, | |
| "step": 15270 | |
| }, | |
| { | |
| "epoch": 9.76, | |
| "learning_rate": 0.0009763578274760384, | |
| "loss": 0.1695, | |
| "step": 15280 | |
| }, | |
| { | |
| "epoch": 9.77, | |
| "learning_rate": 0.0009769968051118211, | |
| "loss": 0.1863, | |
| "step": 15290 | |
| }, | |
| { | |
| "epoch": 9.78, | |
| "learning_rate": 0.0009776357827476038, | |
| "loss": 0.1947, | |
| "step": 15300 | |
| }, | |
| { | |
| "epoch": 9.78, | |
| "learning_rate": 0.0009782747603833866, | |
| "loss": 0.1878, | |
| "step": 15310 | |
| }, | |
| { | |
| "epoch": 9.79, | |
| "learning_rate": 0.0009789137380191693, | |
| "loss": 0.2087, | |
| "step": 15320 | |
| }, | |
| { | |
| "epoch": 9.8, | |
| "learning_rate": 0.000979552715654952, | |
| "loss": 0.183, | |
| "step": 15330 | |
| }, | |
| { | |
| "epoch": 9.8, | |
| "learning_rate": 0.000980191693290735, | |
| "loss": 0.1836, | |
| "step": 15340 | |
| }, | |
| { | |
| "epoch": 9.81, | |
| "learning_rate": 0.0009808306709265175, | |
| "loss": 0.2152, | |
| "step": 15350 | |
| }, | |
| { | |
| "epoch": 9.81, | |
| "learning_rate": 0.0009814696485623004, | |
| "loss": 0.2007, | |
| "step": 15360 | |
| }, | |
| { | |
| "epoch": 9.82, | |
| "learning_rate": 0.000982108626198083, | |
| "loss": 0.2202, | |
| "step": 15370 | |
| }, | |
| { | |
| "epoch": 9.83, | |
| "learning_rate": 0.000982747603833866, | |
| "loss": 0.2071, | |
| "step": 15380 | |
| }, | |
| { | |
| "epoch": 9.83, | |
| "learning_rate": 0.0009833865814696486, | |
| "loss": 0.212, | |
| "step": 15390 | |
| }, | |
| { | |
| "epoch": 9.84, | |
| "learning_rate": 0.0009840255591054314, | |
| "loss": 0.217, | |
| "step": 15400 | |
| }, | |
| { | |
| "epoch": 9.85, | |
| "learning_rate": 0.000984664536741214, | |
| "loss": 0.1713, | |
| "step": 15410 | |
| }, | |
| { | |
| "epoch": 9.85, | |
| "learning_rate": 0.0009853035143769968, | |
| "loss": 0.1993, | |
| "step": 15420 | |
| }, | |
| { | |
| "epoch": 9.86, | |
| "learning_rate": 0.0009859424920127795, | |
| "loss": 0.1823, | |
| "step": 15430 | |
| }, | |
| { | |
| "epoch": 9.87, | |
| "learning_rate": 0.0009865814696485623, | |
| "loss": 0.179, | |
| "step": 15440 | |
| }, | |
| { | |
| "epoch": 9.87, | |
| "learning_rate": 0.000987220447284345, | |
| "loss": 0.1938, | |
| "step": 15450 | |
| }, | |
| { | |
| "epoch": 9.88, | |
| "learning_rate": 0.0009878594249201277, | |
| "loss": 0.2068, | |
| "step": 15460 | |
| }, | |
| { | |
| "epoch": 9.88, | |
| "learning_rate": 0.0009884984025559107, | |
| "loss": 0.1709, | |
| "step": 15470 | |
| }, | |
| { | |
| "epoch": 9.89, | |
| "learning_rate": 0.0009891373801916934, | |
| "loss": 0.2332, | |
| "step": 15480 | |
| }, | |
| { | |
| "epoch": 9.9, | |
| "learning_rate": 0.0009897763578274761, | |
| "loss": 0.193, | |
| "step": 15490 | |
| }, | |
| { | |
| "epoch": 9.9, | |
| "learning_rate": 0.0009904153354632589, | |
| "loss": 0.212, | |
| "step": 15500 | |
| }, | |
| { | |
| "epoch": 9.91, | |
| "learning_rate": 0.0009910543130990416, | |
| "loss": 0.2095, | |
| "step": 15510 | |
| }, | |
| { | |
| "epoch": 9.92, | |
| "learning_rate": 0.0009916932907348243, | |
| "loss": 0.1849, | |
| "step": 15520 | |
| }, | |
| { | |
| "epoch": 9.92, | |
| "learning_rate": 0.000992332268370607, | |
| "loss": 0.212, | |
| "step": 15530 | |
| }, | |
| { | |
| "epoch": 9.93, | |
| "learning_rate": 0.0009929712460063898, | |
| "loss": 0.1945, | |
| "step": 15540 | |
| }, | |
| { | |
| "epoch": 9.94, | |
| "learning_rate": 0.0009936102236421725, | |
| "loss": 0.2293, | |
| "step": 15550 | |
| }, | |
| { | |
| "epoch": 9.94, | |
| "learning_rate": 0.0009942492012779552, | |
| "loss": 0.2218, | |
| "step": 15560 | |
| }, | |
| { | |
| "epoch": 9.95, | |
| "learning_rate": 0.000994888178913738, | |
| "loss": 0.2198, | |
| "step": 15570 | |
| }, | |
| { | |
| "epoch": 9.95, | |
| "learning_rate": 0.0009955271565495207, | |
| "loss": 0.2099, | |
| "step": 15580 | |
| }, | |
| { | |
| "epoch": 9.96, | |
| "learning_rate": 0.0009961661341853036, | |
| "loss": 0.2159, | |
| "step": 15590 | |
| }, | |
| { | |
| "epoch": 9.97, | |
| "learning_rate": 0.0009968051118210862, | |
| "loss": 0.2077, | |
| "step": 15600 | |
| }, | |
| { | |
| "epoch": 9.97, | |
| "learning_rate": 0.000997444089456869, | |
| "loss": 0.2324, | |
| "step": 15610 | |
| }, | |
| { | |
| "epoch": 9.98, | |
| "learning_rate": 0.0009980830670926518, | |
| "loss": 0.2459, | |
| "step": 15620 | |
| }, | |
| { | |
| "epoch": 9.99, | |
| "learning_rate": 0.0009987220447284346, | |
| "loss": 0.2167, | |
| "step": 15630 | |
| }, | |
| { | |
| "epoch": 9.99, | |
| "learning_rate": 0.0009993610223642173, | |
| "loss": 0.1978, | |
| "step": 15640 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "learning_rate": 0.001, | |
| "loss": 0.1983, | |
| "step": 15650 | |
| }, | |
| { | |
| "epoch": 10.01, | |
| "learning_rate": 0.000999929002484913, | |
| "loss": 0.1927, | |
| "step": 15660 | |
| }, | |
| { | |
| "epoch": 10.01, | |
| "learning_rate": 0.000999858004969826, | |
| "loss": 0.1822, | |
| "step": 15670 | |
| }, | |
| { | |
| "epoch": 10.02, | |
| "learning_rate": 0.0009997870074547391, | |
| "loss": 0.1596, | |
| "step": 15680 | |
| }, | |
| { | |
| "epoch": 10.03, | |
| "learning_rate": 0.000999716009939652, | |
| "loss": 0.163, | |
| "step": 15690 | |
| }, | |
| { | |
| "epoch": 10.03, | |
| "learning_rate": 0.0009996450124245652, | |
| "loss": 0.1961, | |
| "step": 15700 | |
| }, | |
| { | |
| "epoch": 10.04, | |
| "learning_rate": 0.0009995740149094782, | |
| "loss": 0.1907, | |
| "step": 15710 | |
| }, | |
| { | |
| "epoch": 10.04, | |
| "learning_rate": 0.0009995030173943912, | |
| "loss": 0.1704, | |
| "step": 15720 | |
| }, | |
| { | |
| "epoch": 10.05, | |
| "learning_rate": 0.0009994320198793041, | |
| "loss": 0.1994, | |
| "step": 15730 | |
| }, | |
| { | |
| "epoch": 10.06, | |
| "learning_rate": 0.0009993610223642173, | |
| "loss": 0.1503, | |
| "step": 15740 | |
| }, | |
| { | |
| "epoch": 10.06, | |
| "learning_rate": 0.0009992900248491302, | |
| "loss": 0.151, | |
| "step": 15750 | |
| }, | |
| { | |
| "epoch": 10.07, | |
| "learning_rate": 0.0009992190273340434, | |
| "loss": 0.1875, | |
| "step": 15760 | |
| }, | |
| { | |
| "epoch": 10.08, | |
| "learning_rate": 0.0009991480298189564, | |
| "loss": 0.1754, | |
| "step": 15770 | |
| }, | |
| { | |
| "epoch": 10.08, | |
| "learning_rate": 0.0009990770323038693, | |
| "loss": 0.1899, | |
| "step": 15780 | |
| }, | |
| { | |
| "epoch": 10.09, | |
| "learning_rate": 0.0009990060347887823, | |
| "loss": 0.1809, | |
| "step": 15790 | |
| }, | |
| { | |
| "epoch": 10.1, | |
| "learning_rate": 0.0009989350372736955, | |
| "loss": 0.1691, | |
| "step": 15800 | |
| }, | |
| { | |
| "epoch": 10.1, | |
| "learning_rate": 0.0009988640397586084, | |
| "loss": 0.1784, | |
| "step": 15810 | |
| }, | |
| { | |
| "epoch": 10.11, | |
| "learning_rate": 0.0009987930422435216, | |
| "loss": 0.1872, | |
| "step": 15820 | |
| }, | |
| { | |
| "epoch": 10.11, | |
| "learning_rate": 0.0009987220447284346, | |
| "loss": 0.1759, | |
| "step": 15830 | |
| }, | |
| { | |
| "epoch": 10.12, | |
| "learning_rate": 0.0009986510472133475, | |
| "loss": 0.1688, | |
| "step": 15840 | |
| }, | |
| { | |
| "epoch": 10.13, | |
| "learning_rate": 0.0009985800496982605, | |
| "loss": 0.2019, | |
| "step": 15850 | |
| }, | |
| { | |
| "epoch": 10.13, | |
| "learning_rate": 0.0009985090521831737, | |
| "loss": 0.1546, | |
| "step": 15860 | |
| }, | |
| { | |
| "epoch": 10.14, | |
| "learning_rate": 0.0009984380546680866, | |
| "loss": 0.207, | |
| "step": 15870 | |
| }, | |
| { | |
| "epoch": 10.15, | |
| "learning_rate": 0.0009983670571529998, | |
| "loss": 0.1832, | |
| "step": 15880 | |
| }, | |
| { | |
| "epoch": 10.15, | |
| "learning_rate": 0.0009982960596379127, | |
| "loss": 0.1724, | |
| "step": 15890 | |
| }, | |
| { | |
| "epoch": 10.16, | |
| "learning_rate": 0.0009982250621228257, | |
| "loss": 0.1905, | |
| "step": 15900 | |
| }, | |
| { | |
| "epoch": 10.17, | |
| "learning_rate": 0.0009981540646077387, | |
| "loss": 0.1705, | |
| "step": 15910 | |
| }, | |
| { | |
| "epoch": 10.17, | |
| "learning_rate": 0.0009980830670926518, | |
| "loss": 0.1848, | |
| "step": 15920 | |
| }, | |
| { | |
| "epoch": 10.18, | |
| "learning_rate": 0.0009980120695775648, | |
| "loss": 0.1958, | |
| "step": 15930 | |
| }, | |
| { | |
| "epoch": 10.19, | |
| "learning_rate": 0.000997941072062478, | |
| "loss": 0.1769, | |
| "step": 15940 | |
| }, | |
| { | |
| "epoch": 10.19, | |
| "learning_rate": 0.000997870074547391, | |
| "loss": 0.1765, | |
| "step": 15950 | |
| }, | |
| { | |
| "epoch": 10.2, | |
| "learning_rate": 0.0009977990770323039, | |
| "loss": 0.2068, | |
| "step": 15960 | |
| }, | |
| { | |
| "epoch": 10.2, | |
| "learning_rate": 0.0009977280795172168, | |
| "loss": 0.146, | |
| "step": 15970 | |
| }, | |
| { | |
| "epoch": 10.21, | |
| "learning_rate": 0.0009976570820021298, | |
| "loss": 0.1541, | |
| "step": 15980 | |
| }, | |
| { | |
| "epoch": 10.22, | |
| "learning_rate": 0.000997586084487043, | |
| "loss": 0.188, | |
| "step": 15990 | |
| }, | |
| { | |
| "epoch": 10.22, | |
| "learning_rate": 0.000997515086971956, | |
| "loss": 0.1822, | |
| "step": 16000 | |
| }, | |
| { | |
| "epoch": 10.23, | |
| "learning_rate": 0.000997444089456869, | |
| "loss": 0.1641, | |
| "step": 16010 | |
| }, | |
| { | |
| "epoch": 10.24, | |
| "learning_rate": 0.000997373091941782, | |
| "loss": 0.1893, | |
| "step": 16020 | |
| }, | |
| { | |
| "epoch": 10.24, | |
| "learning_rate": 0.000997302094426695, | |
| "loss": 0.191, | |
| "step": 16030 | |
| }, | |
| { | |
| "epoch": 10.25, | |
| "learning_rate": 0.000997231096911608, | |
| "loss": 0.2111, | |
| "step": 16040 | |
| }, | |
| { | |
| "epoch": 10.26, | |
| "learning_rate": 0.0009971600993965212, | |
| "loss": 0.186, | |
| "step": 16050 | |
| }, | |
| { | |
| "epoch": 10.26, | |
| "learning_rate": 0.0009970891018814341, | |
| "loss": 0.1952, | |
| "step": 16060 | |
| }, | |
| { | |
| "epoch": 10.27, | |
| "learning_rate": 0.0009970181043663473, | |
| "loss": 0.1963, | |
| "step": 16070 | |
| }, | |
| { | |
| "epoch": 10.27, | |
| "learning_rate": 0.0009969471068512602, | |
| "loss": 0.183, | |
| "step": 16080 | |
| }, | |
| { | |
| "epoch": 10.28, | |
| "learning_rate": 0.0009968761093361732, | |
| "loss": 0.1845, | |
| "step": 16090 | |
| }, | |
| { | |
| "epoch": 10.29, | |
| "learning_rate": 0.0009968051118210862, | |
| "loss": 0.2002, | |
| "step": 16100 | |
| }, | |
| { | |
| "epoch": 10.29, | |
| "learning_rate": 0.0009967341143059993, | |
| "loss": 0.1953, | |
| "step": 16110 | |
| }, | |
| { | |
| "epoch": 10.3, | |
| "learning_rate": 0.0009966631167909123, | |
| "loss": 0.1778, | |
| "step": 16120 | |
| }, | |
| { | |
| "epoch": 10.31, | |
| "learning_rate": 0.0009965921192758255, | |
| "loss": 0.2073, | |
| "step": 16130 | |
| }, | |
| { | |
| "epoch": 10.31, | |
| "learning_rate": 0.0009965211217607384, | |
| "loss": 0.1755, | |
| "step": 16140 | |
| }, | |
| { | |
| "epoch": 10.32, | |
| "learning_rate": 0.0009964501242456514, | |
| "loss": 0.2085, | |
| "step": 16150 | |
| }, | |
| { | |
| "epoch": 10.33, | |
| "learning_rate": 0.0009963791267305643, | |
| "loss": 0.1978, | |
| "step": 16160 | |
| }, | |
| { | |
| "epoch": 10.33, | |
| "learning_rate": 0.0009963081292154775, | |
| "loss": 0.2101, | |
| "step": 16170 | |
| }, | |
| { | |
| "epoch": 10.34, | |
| "learning_rate": 0.0009962371317003905, | |
| "loss": 0.2027, | |
| "step": 16180 | |
| }, | |
| { | |
| "epoch": 10.34, | |
| "learning_rate": 0.0009961661341853036, | |
| "loss": 0.1905, | |
| "step": 16190 | |
| }, | |
| { | |
| "epoch": 10.35, | |
| "learning_rate": 0.0009960951366702166, | |
| "loss": 0.175, | |
| "step": 16200 | |
| }, | |
| { | |
| "epoch": 10.36, | |
| "learning_rate": 0.0009960241391551296, | |
| "loss": 0.1816, | |
| "step": 16210 | |
| }, | |
| { | |
| "epoch": 10.36, | |
| "learning_rate": 0.0009959531416400425, | |
| "loss": 0.1917, | |
| "step": 16220 | |
| }, | |
| { | |
| "epoch": 10.37, | |
| "learning_rate": 0.0009958821441249557, | |
| "loss": 0.1956, | |
| "step": 16230 | |
| }, | |
| { | |
| "epoch": 10.38, | |
| "learning_rate": 0.0009958111466098687, | |
| "loss": 0.2037, | |
| "step": 16240 | |
| }, | |
| { | |
| "epoch": 10.38, | |
| "learning_rate": 0.0009957401490947818, | |
| "loss": 0.2194, | |
| "step": 16250 | |
| }, | |
| { | |
| "epoch": 10.39, | |
| "learning_rate": 0.0009956691515796948, | |
| "loss": 0.1633, | |
| "step": 16260 | |
| }, | |
| { | |
| "epoch": 10.4, | |
| "learning_rate": 0.0009955981540646077, | |
| "loss": 0.1803, | |
| "step": 16270 | |
| }, | |
| { | |
| "epoch": 10.4, | |
| "learning_rate": 0.0009955271565495207, | |
| "loss": 0.1885, | |
| "step": 16280 | |
| }, | |
| { | |
| "epoch": 10.41, | |
| "learning_rate": 0.0009954561590344337, | |
| "loss": 0.2004, | |
| "step": 16290 | |
| }, | |
| { | |
| "epoch": 10.42, | |
| "learning_rate": 0.0009953851615193468, | |
| "loss": 0.1961, | |
| "step": 16300 | |
| }, | |
| { | |
| "epoch": 10.42, | |
| "learning_rate": 0.0009953141640042598, | |
| "loss": 0.1827, | |
| "step": 16310 | |
| }, | |
| { | |
| "epoch": 10.43, | |
| "learning_rate": 0.000995243166489173, | |
| "loss": 0.1775, | |
| "step": 16320 | |
| }, | |
| { | |
| "epoch": 10.43, | |
| "learning_rate": 0.000995172168974086, | |
| "loss": 0.1905, | |
| "step": 16330 | |
| }, | |
| { | |
| "epoch": 10.44, | |
| "learning_rate": 0.0009951011714589989, | |
| "loss": 0.2072, | |
| "step": 16340 | |
| }, | |
| { | |
| "epoch": 10.45, | |
| "learning_rate": 0.0009950301739439118, | |
| "loss": 0.1725, | |
| "step": 16350 | |
| }, | |
| { | |
| "epoch": 10.45, | |
| "learning_rate": 0.000994959176428825, | |
| "loss": 0.2023, | |
| "step": 16360 | |
| }, | |
| { | |
| "epoch": 10.46, | |
| "learning_rate": 0.000994888178913738, | |
| "loss": 0.1921, | |
| "step": 16370 | |
| }, | |
| { | |
| "epoch": 10.47, | |
| "learning_rate": 0.0009948171813986511, | |
| "loss": 0.1988, | |
| "step": 16380 | |
| }, | |
| { | |
| "epoch": 10.47, | |
| "learning_rate": 0.000994746183883564, | |
| "loss": 0.1888, | |
| "step": 16390 | |
| }, | |
| { | |
| "epoch": 10.48, | |
| "learning_rate": 0.000994675186368477, | |
| "loss": 0.2047, | |
| "step": 16400 | |
| }, | |
| { | |
| "epoch": 10.49, | |
| "learning_rate": 0.00099460418885339, | |
| "loss": 0.179, | |
| "step": 16410 | |
| }, | |
| { | |
| "epoch": 10.49, | |
| "learning_rate": 0.0009945331913383032, | |
| "loss": 0.1867, | |
| "step": 16420 | |
| }, | |
| { | |
| "epoch": 10.5, | |
| "learning_rate": 0.0009944621938232162, | |
| "loss": 0.1868, | |
| "step": 16430 | |
| }, | |
| { | |
| "epoch": 10.5, | |
| "learning_rate": 0.0009943911963081293, | |
| "loss": 0.212, | |
| "step": 16440 | |
| }, | |
| { | |
| "epoch": 10.51, | |
| "learning_rate": 0.0009943201987930423, | |
| "loss": 0.1937, | |
| "step": 16450 | |
| }, | |
| { | |
| "epoch": 10.52, | |
| "learning_rate": 0.0009942492012779552, | |
| "loss": 0.1915, | |
| "step": 16460 | |
| }, | |
| { | |
| "epoch": 10.52, | |
| "learning_rate": 0.0009941782037628682, | |
| "loss": 0.1712, | |
| "step": 16470 | |
| }, | |
| { | |
| "epoch": 10.53, | |
| "learning_rate": 0.0009941072062477814, | |
| "loss": 0.2135, | |
| "step": 16480 | |
| }, | |
| { | |
| "epoch": 10.54, | |
| "learning_rate": 0.0009940362087326943, | |
| "loss": 0.1716, | |
| "step": 16490 | |
| }, | |
| { | |
| "epoch": 10.54, | |
| "learning_rate": 0.0009939652112176075, | |
| "loss": 0.193, | |
| "step": 16500 | |
| }, | |
| { | |
| "epoch": 10.55, | |
| "learning_rate": 0.0009938942137025205, | |
| "loss": 0.2042, | |
| "step": 16510 | |
| }, | |
| { | |
| "epoch": 10.56, | |
| "learning_rate": 0.0009938232161874334, | |
| "loss": 0.2068, | |
| "step": 16520 | |
| }, | |
| { | |
| "epoch": 10.56, | |
| "learning_rate": 0.0009937522186723464, | |
| "loss": 0.1977, | |
| "step": 16530 | |
| }, | |
| { | |
| "epoch": 10.57, | |
| "learning_rate": 0.0009936812211572596, | |
| "loss": 0.1968, | |
| "step": 16540 | |
| }, | |
| { | |
| "epoch": 10.57, | |
| "learning_rate": 0.0009936102236421725, | |
| "loss": 0.2021, | |
| "step": 16550 | |
| }, | |
| { | |
| "epoch": 10.58, | |
| "learning_rate": 0.0009935392261270857, | |
| "loss": 0.2083, | |
| "step": 16560 | |
| }, | |
| { | |
| "epoch": 10.59, | |
| "learning_rate": 0.0009934682286119986, | |
| "loss": 0.1932, | |
| "step": 16570 | |
| }, | |
| { | |
| "epoch": 10.59, | |
| "learning_rate": 0.0009933972310969116, | |
| "loss": 0.2191, | |
| "step": 16580 | |
| }, | |
| { | |
| "epoch": 10.6, | |
| "learning_rate": 0.0009933262335818246, | |
| "loss": 0.2102, | |
| "step": 16590 | |
| }, | |
| { | |
| "epoch": 10.61, | |
| "learning_rate": 0.0009932552360667377, | |
| "loss": 0.1698, | |
| "step": 16600 | |
| }, | |
| { | |
| "epoch": 10.61, | |
| "learning_rate": 0.0009931842385516507, | |
| "loss": 0.2065, | |
| "step": 16610 | |
| }, | |
| { | |
| "epoch": 10.62, | |
| "learning_rate": 0.0009931132410365637, | |
| "loss": 0.1976, | |
| "step": 16620 | |
| }, | |
| { | |
| "epoch": 10.63, | |
| "learning_rate": 0.0009930422435214768, | |
| "loss": 0.2074, | |
| "step": 16630 | |
| }, | |
| { | |
| "epoch": 10.63, | |
| "learning_rate": 0.0009929712460063898, | |
| "loss": 0.22, | |
| "step": 16640 | |
| }, | |
| { | |
| "epoch": 10.64, | |
| "learning_rate": 0.0009929002484913027, | |
| "loss": 0.1612, | |
| "step": 16650 | |
| }, | |
| { | |
| "epoch": 10.65, | |
| "learning_rate": 0.000992829250976216, | |
| "loss": 0.2161, | |
| "step": 16660 | |
| }, | |
| { | |
| "epoch": 10.65, | |
| "learning_rate": 0.0009927582534611289, | |
| "loss": 0.1898, | |
| "step": 16670 | |
| }, | |
| { | |
| "epoch": 10.66, | |
| "learning_rate": 0.0009926872559460418, | |
| "loss": 0.155, | |
| "step": 16680 | |
| }, | |
| { | |
| "epoch": 10.66, | |
| "learning_rate": 0.000992616258430955, | |
| "loss": 0.1943, | |
| "step": 16690 | |
| }, | |
| { | |
| "epoch": 10.67, | |
| "learning_rate": 0.000992545260915868, | |
| "loss": 0.1812, | |
| "step": 16700 | |
| }, | |
| { | |
| "epoch": 10.68, | |
| "learning_rate": 0.000992474263400781, | |
| "loss": 0.19, | |
| "step": 16710 | |
| }, | |
| { | |
| "epoch": 10.68, | |
| "learning_rate": 0.000992403265885694, | |
| "loss": 0.2032, | |
| "step": 16720 | |
| }, | |
| { | |
| "epoch": 10.69, | |
| "learning_rate": 0.000992332268370607, | |
| "loss": 0.1948, | |
| "step": 16730 | |
| }, | |
| { | |
| "epoch": 10.7, | |
| "learning_rate": 0.00099226127085552, | |
| "loss": 0.2, | |
| "step": 16740 | |
| }, | |
| { | |
| "epoch": 10.7, | |
| "learning_rate": 0.0009921902733404332, | |
| "loss": 0.1899, | |
| "step": 16750 | |
| }, | |
| { | |
| "epoch": 10.71, | |
| "learning_rate": 0.0009921192758253461, | |
| "loss": 0.1937, | |
| "step": 16760 | |
| }, | |
| { | |
| "epoch": 10.72, | |
| "learning_rate": 0.000992048278310259, | |
| "loss": 0.1854, | |
| "step": 16770 | |
| }, | |
| { | |
| "epoch": 10.72, | |
| "learning_rate": 0.0009919772807951723, | |
| "loss": 0.2145, | |
| "step": 16780 | |
| }, | |
| { | |
| "epoch": 10.73, | |
| "learning_rate": 0.0009919062832800852, | |
| "loss": 0.2008, | |
| "step": 16790 | |
| }, | |
| { | |
| "epoch": 10.73, | |
| "learning_rate": 0.0009918352857649982, | |
| "loss": 0.1859, | |
| "step": 16800 | |
| }, | |
| { | |
| "epoch": 10.74, | |
| "learning_rate": 0.0009917642882499114, | |
| "loss": 0.1952, | |
| "step": 16810 | |
| }, | |
| { | |
| "epoch": 10.75, | |
| "learning_rate": 0.0009916932907348243, | |
| "loss": 0.1662, | |
| "step": 16820 | |
| }, | |
| { | |
| "epoch": 10.75, | |
| "learning_rate": 0.0009916222932197373, | |
| "loss": 0.1971, | |
| "step": 16830 | |
| }, | |
| { | |
| "epoch": 10.76, | |
| "learning_rate": 0.0009915512957046502, | |
| "loss": 0.176, | |
| "step": 16840 | |
| }, | |
| { | |
| "epoch": 10.77, | |
| "learning_rate": 0.0009914802981895634, | |
| "loss": 0.1621, | |
| "step": 16850 | |
| }, | |
| { | |
| "epoch": 10.77, | |
| "learning_rate": 0.0009914093006744764, | |
| "loss": 0.2204, | |
| "step": 16860 | |
| }, | |
| { | |
| "epoch": 10.78, | |
| "learning_rate": 0.0009913383031593895, | |
| "loss": 0.1798, | |
| "step": 16870 | |
| }, | |
| { | |
| "epoch": 10.79, | |
| "learning_rate": 0.0009912673056443025, | |
| "loss": 0.1984, | |
| "step": 16880 | |
| }, | |
| { | |
| "epoch": 10.79, | |
| "learning_rate": 0.0009911963081292155, | |
| "loss": 0.1789, | |
| "step": 16890 | |
| }, | |
| { | |
| "epoch": 10.8, | |
| "learning_rate": 0.0009911253106141284, | |
| "loss": 0.1897, | |
| "step": 16900 | |
| }, | |
| { | |
| "epoch": 10.8, | |
| "learning_rate": 0.0009910543130990416, | |
| "loss": 0.1888, | |
| "step": 16910 | |
| }, | |
| { | |
| "epoch": 10.81, | |
| "learning_rate": 0.0009909833155839546, | |
| "loss": 0.1828, | |
| "step": 16920 | |
| }, | |
| { | |
| "epoch": 10.82, | |
| "learning_rate": 0.0009909123180688675, | |
| "loss": 0.1798, | |
| "step": 16930 | |
| }, | |
| { | |
| "epoch": 10.82, | |
| "learning_rate": 0.0009908413205537807, | |
| "loss": 0.1729, | |
| "step": 16940 | |
| }, | |
| { | |
| "epoch": 10.83, | |
| "learning_rate": 0.0009907703230386936, | |
| "loss": 0.2113, | |
| "step": 16950 | |
| }, | |
| { | |
| "epoch": 10.84, | |
| "learning_rate": 0.0009906993255236066, | |
| "loss": 0.2041, | |
| "step": 16960 | |
| }, | |
| { | |
| "epoch": 10.84, | |
| "learning_rate": 0.0009906283280085198, | |
| "loss": 0.1625, | |
| "step": 16970 | |
| }, | |
| { | |
| "epoch": 10.85, | |
| "learning_rate": 0.0009905573304934327, | |
| "loss": 0.1726, | |
| "step": 16980 | |
| }, | |
| { | |
| "epoch": 10.86, | |
| "learning_rate": 0.0009904863329783457, | |
| "loss": 0.1875, | |
| "step": 16990 | |
| }, | |
| { | |
| "epoch": 10.86, | |
| "learning_rate": 0.0009904153354632589, | |
| "loss": 0.2126, | |
| "step": 17000 | |
| }, | |
| { | |
| "epoch": 10.87, | |
| "learning_rate": 0.0009903443379481718, | |
| "loss": 0.1882, | |
| "step": 17010 | |
| }, | |
| { | |
| "epoch": 10.88, | |
| "learning_rate": 0.0009902733404330848, | |
| "loss": 0.2062, | |
| "step": 17020 | |
| }, | |
| { | |
| "epoch": 10.88, | |
| "learning_rate": 0.000990202342917998, | |
| "loss": 0.1705, | |
| "step": 17030 | |
| }, | |
| { | |
| "epoch": 10.89, | |
| "learning_rate": 0.000990131345402911, | |
| "loss": 0.2103, | |
| "step": 17040 | |
| }, | |
| { | |
| "epoch": 10.89, | |
| "learning_rate": 0.0009900603478878239, | |
| "loss": 0.1766, | |
| "step": 17050 | |
| }, | |
| { | |
| "epoch": 10.9, | |
| "learning_rate": 0.000989989350372737, | |
| "loss": 0.189, | |
| "step": 17060 | |
| }, | |
| { | |
| "epoch": 10.91, | |
| "learning_rate": 0.00098991835285765, | |
| "loss": 0.1797, | |
| "step": 17070 | |
| }, | |
| { | |
| "epoch": 10.91, | |
| "learning_rate": 0.000989847355342563, | |
| "loss": 0.2013, | |
| "step": 17080 | |
| }, | |
| { | |
| "epoch": 10.92, | |
| "learning_rate": 0.0009897763578274761, | |
| "loss": 0.2034, | |
| "step": 17090 | |
| }, | |
| { | |
| "epoch": 10.93, | |
| "learning_rate": 0.000989705360312389, | |
| "loss": 0.1947, | |
| "step": 17100 | |
| }, | |
| { | |
| "epoch": 10.93, | |
| "learning_rate": 0.000989634362797302, | |
| "loss": 0.2248, | |
| "step": 17110 | |
| }, | |
| { | |
| "epoch": 10.94, | |
| "learning_rate": 0.0009895633652822152, | |
| "loss": 0.2021, | |
| "step": 17120 | |
| }, | |
| { | |
| "epoch": 10.95, | |
| "learning_rate": 0.0009894923677671282, | |
| "loss": 0.1932, | |
| "step": 17130 | |
| }, | |
| { | |
| "epoch": 10.95, | |
| "learning_rate": 0.0009894213702520411, | |
| "loss": 0.1998, | |
| "step": 17140 | |
| }, | |
| { | |
| "epoch": 10.96, | |
| "learning_rate": 0.0009893503727369543, | |
| "loss": 0.2081, | |
| "step": 17150 | |
| }, | |
| { | |
| "epoch": 10.96, | |
| "learning_rate": 0.0009892793752218673, | |
| "loss": 0.2047, | |
| "step": 17160 | |
| }, | |
| { | |
| "epoch": 10.97, | |
| "learning_rate": 0.0009892083777067802, | |
| "loss": 0.1864, | |
| "step": 17170 | |
| }, | |
| { | |
| "epoch": 10.98, | |
| "learning_rate": 0.0009891373801916934, | |
| "loss": 0.2137, | |
| "step": 17180 | |
| }, | |
| { | |
| "epoch": 10.98, | |
| "learning_rate": 0.0009890663826766064, | |
| "loss": 0.1858, | |
| "step": 17190 | |
| }, | |
| { | |
| "epoch": 10.99, | |
| "learning_rate": 0.0009889953851615193, | |
| "loss": 0.2036, | |
| "step": 17200 | |
| }, | |
| { | |
| "epoch": 11.0, | |
| "learning_rate": 0.0009889243876464325, | |
| "loss": 0.1979, | |
| "step": 17210 | |
| }, | |
| { | |
| "epoch": 11.0, | |
| "learning_rate": 0.0009888533901313455, | |
| "loss": 0.1788, | |
| "step": 17220 | |
| }, | |
| { | |
| "epoch": 11.01, | |
| "learning_rate": 0.0009887823926162584, | |
| "loss": 0.1777, | |
| "step": 17230 | |
| }, | |
| { | |
| "epoch": 11.02, | |
| "learning_rate": 0.0009887113951011714, | |
| "loss": 0.1835, | |
| "step": 17240 | |
| }, | |
| { | |
| "epoch": 11.02, | |
| "learning_rate": 0.0009886403975860845, | |
| "loss": 0.1546, | |
| "step": 17250 | |
| }, | |
| { | |
| "epoch": 11.03, | |
| "learning_rate": 0.0009885694000709975, | |
| "loss": 0.1461, | |
| "step": 17260 | |
| }, | |
| { | |
| "epoch": 11.04, | |
| "learning_rate": 0.0009884984025559107, | |
| "loss": 0.1716, | |
| "step": 17270 | |
| }, | |
| { | |
| "epoch": 11.04, | |
| "learning_rate": 0.0009884274050408236, | |
| "loss": 0.1556, | |
| "step": 17280 | |
| }, | |
| { | |
| "epoch": 11.05, | |
| "learning_rate": 0.0009883564075257366, | |
| "loss": 0.1664, | |
| "step": 17290 | |
| }, | |
| { | |
| "epoch": 11.05, | |
| "learning_rate": 0.0009882854100106496, | |
| "loss": 0.1738, | |
| "step": 17300 | |
| }, | |
| { | |
| "epoch": 11.06, | |
| "learning_rate": 0.0009882144124955627, | |
| "loss": 0.1797, | |
| "step": 17310 | |
| }, | |
| { | |
| "epoch": 11.07, | |
| "learning_rate": 0.0009881434149804757, | |
| "loss": 0.2018, | |
| "step": 17320 | |
| }, | |
| { | |
| "epoch": 11.07, | |
| "learning_rate": 0.0009880724174653889, | |
| "loss": 0.1683, | |
| "step": 17330 | |
| }, | |
| { | |
| "epoch": 11.08, | |
| "learning_rate": 0.0009880014199503018, | |
| "loss": 0.1928, | |
| "step": 17340 | |
| }, | |
| { | |
| "epoch": 11.09, | |
| "learning_rate": 0.0009879304224352148, | |
| "loss": 0.1737, | |
| "step": 17350 | |
| }, | |
| { | |
| "epoch": 11.09, | |
| "learning_rate": 0.0009878594249201277, | |
| "loss": 0.1715, | |
| "step": 17360 | |
| }, | |
| { | |
| "epoch": 11.1, | |
| "learning_rate": 0.000987788427405041, | |
| "loss": 0.1691, | |
| "step": 17370 | |
| }, | |
| { | |
| "epoch": 11.11, | |
| "learning_rate": 0.0009877174298899539, | |
| "loss": 0.1462, | |
| "step": 17380 | |
| }, | |
| { | |
| "epoch": 11.11, | |
| "learning_rate": 0.000987646432374867, | |
| "loss": 0.1835, | |
| "step": 17390 | |
| }, | |
| { | |
| "epoch": 11.12, | |
| "learning_rate": 0.00098757543485978, | |
| "loss": 0.1515, | |
| "step": 17400 | |
| }, | |
| { | |
| "epoch": 11.12, | |
| "learning_rate": 0.000987504437344693, | |
| "loss": 0.1819, | |
| "step": 17410 | |
| }, | |
| { | |
| "epoch": 11.13, | |
| "learning_rate": 0.000987433439829606, | |
| "loss": 0.137, | |
| "step": 17420 | |
| }, | |
| { | |
| "epoch": 11.14, | |
| "learning_rate": 0.000987362442314519, | |
| "loss": 0.1742, | |
| "step": 17430 | |
| }, | |
| { | |
| "epoch": 11.14, | |
| "learning_rate": 0.000987291444799432, | |
| "loss": 0.147, | |
| "step": 17440 | |
| }, | |
| { | |
| "epoch": 11.15, | |
| "learning_rate": 0.000987220447284345, | |
| "loss": 0.1645, | |
| "step": 17450 | |
| }, | |
| { | |
| "epoch": 11.16, | |
| "learning_rate": 0.0009871494497692582, | |
| "loss": 0.1775, | |
| "step": 17460 | |
| }, | |
| { | |
| "epoch": 11.16, | |
| "learning_rate": 0.0009870784522541711, | |
| "loss": 0.1766, | |
| "step": 17470 | |
| }, | |
| { | |
| "epoch": 11.17, | |
| "learning_rate": 0.000987007454739084, | |
| "loss": 0.19, | |
| "step": 17480 | |
| }, | |
| { | |
| "epoch": 11.18, | |
| "learning_rate": 0.0009869364572239973, | |
| "loss": 0.1521, | |
| "step": 17490 | |
| }, | |
| { | |
| "epoch": 11.18, | |
| "learning_rate": 0.0009868654597089102, | |
| "loss": 0.1355, | |
| "step": 17500 | |
| }, | |
| { | |
| "epoch": 11.19, | |
| "learning_rate": 0.0009867944621938232, | |
| "loss": 0.169, | |
| "step": 17510 | |
| }, | |
| { | |
| "epoch": 11.19, | |
| "learning_rate": 0.0009867234646787364, | |
| "loss": 0.1842, | |
| "step": 17520 | |
| }, | |
| { | |
| "epoch": 11.2, | |
| "learning_rate": 0.0009866524671636493, | |
| "loss": 0.1588, | |
| "step": 17530 | |
| }, | |
| { | |
| "epoch": 11.21, | |
| "learning_rate": 0.0009865814696485623, | |
| "loss": 0.1587, | |
| "step": 17540 | |
| }, | |
| { | |
| "epoch": 11.21, | |
| "learning_rate": 0.0009865104721334752, | |
| "loss": 0.1792, | |
| "step": 17550 | |
| }, | |
| { | |
| "epoch": 11.22, | |
| "learning_rate": 0.0009864394746183884, | |
| "loss": 0.1832, | |
| "step": 17560 | |
| }, | |
| { | |
| "epoch": 11.23, | |
| "learning_rate": 0.0009863684771033014, | |
| "loss": 0.145, | |
| "step": 17570 | |
| }, | |
| { | |
| "epoch": 11.23, | |
| "learning_rate": 0.0009862974795882145, | |
| "loss": 0.1764, | |
| "step": 17580 | |
| }, | |
| { | |
| "epoch": 11.24, | |
| "learning_rate": 0.0009862264820731275, | |
| "loss": 0.1706, | |
| "step": 17590 | |
| }, | |
| { | |
| "epoch": 11.25, | |
| "learning_rate": 0.0009861554845580405, | |
| "loss": 0.1737, | |
| "step": 17600 | |
| }, | |
| { | |
| "epoch": 11.25, | |
| "learning_rate": 0.0009860844870429534, | |
| "loss": 0.1445, | |
| "step": 17610 | |
| }, | |
| { | |
| "epoch": 11.26, | |
| "learning_rate": 0.0009860134895278666, | |
| "loss": 0.1704, | |
| "step": 17620 | |
| }, | |
| { | |
| "epoch": 11.27, | |
| "learning_rate": 0.0009859424920127795, | |
| "loss": 0.1714, | |
| "step": 17630 | |
| }, | |
| { | |
| "epoch": 11.27, | |
| "learning_rate": 0.0009858714944976927, | |
| "loss": 0.1495, | |
| "step": 17640 | |
| }, | |
| { | |
| "epoch": 11.28, | |
| "learning_rate": 0.0009858004969826057, | |
| "loss": 0.1698, | |
| "step": 17650 | |
| }, | |
| { | |
| "epoch": 11.28, | |
| "learning_rate": 0.0009857294994675186, | |
| "loss": 0.1824, | |
| "step": 17660 | |
| }, | |
| { | |
| "epoch": 11.29, | |
| "learning_rate": 0.0009856585019524316, | |
| "loss": 0.1515, | |
| "step": 17670 | |
| }, | |
| { | |
| "epoch": 11.3, | |
| "learning_rate": 0.0009855875044373448, | |
| "loss": 0.169, | |
| "step": 17680 | |
| }, | |
| { | |
| "epoch": 11.3, | |
| "learning_rate": 0.0009855165069222577, | |
| "loss": 0.1814, | |
| "step": 17690 | |
| }, | |
| { | |
| "epoch": 11.31, | |
| "learning_rate": 0.000985445509407171, | |
| "loss": 0.1548, | |
| "step": 17700 | |
| }, | |
| { | |
| "epoch": 11.32, | |
| "learning_rate": 0.0009853745118920839, | |
| "loss": 0.1615, | |
| "step": 17710 | |
| }, | |
| { | |
| "epoch": 11.32, | |
| "learning_rate": 0.0009853035143769968, | |
| "loss": 0.1975, | |
| "step": 17720 | |
| }, | |
| { | |
| "epoch": 11.33, | |
| "learning_rate": 0.0009852325168619098, | |
| "loss": 0.1402, | |
| "step": 17730 | |
| }, | |
| { | |
| "epoch": 11.34, | |
| "learning_rate": 0.000985161519346823, | |
| "loss": 0.1733, | |
| "step": 17740 | |
| }, | |
| { | |
| "epoch": 11.34, | |
| "learning_rate": 0.000985090521831736, | |
| "loss": 0.1782, | |
| "step": 17750 | |
| }, | |
| { | |
| "epoch": 11.35, | |
| "learning_rate": 0.000985019524316649, | |
| "loss": 0.1664, | |
| "step": 17760 | |
| }, | |
| { | |
| "epoch": 11.35, | |
| "learning_rate": 0.000984948526801562, | |
| "loss": 0.2117, | |
| "step": 17770 | |
| }, | |
| { | |
| "epoch": 11.36, | |
| "learning_rate": 0.000984877529286475, | |
| "loss": 0.1698, | |
| "step": 17780 | |
| }, | |
| { | |
| "epoch": 11.37, | |
| "learning_rate": 0.000984806531771388, | |
| "loss": 0.1607, | |
| "step": 17790 | |
| }, | |
| { | |
| "epoch": 11.37, | |
| "learning_rate": 0.0009847355342563011, | |
| "loss": 0.171, | |
| "step": 17800 | |
| }, | |
| { | |
| "epoch": 11.38, | |
| "learning_rate": 0.000984664536741214, | |
| "loss": 0.1969, | |
| "step": 17810 | |
| }, | |
| { | |
| "epoch": 11.39, | |
| "learning_rate": 0.0009845935392261273, | |
| "loss": 0.1615, | |
| "step": 17820 | |
| }, | |
| { | |
| "epoch": 11.39, | |
| "learning_rate": 0.0009845225417110402, | |
| "loss": 0.1649, | |
| "step": 17830 | |
| }, | |
| { | |
| "epoch": 11.4, | |
| "learning_rate": 0.0009844515441959532, | |
| "loss": 0.1773, | |
| "step": 17840 | |
| }, | |
| { | |
| "epoch": 11.41, | |
| "learning_rate": 0.0009843805466808661, | |
| "loss": 0.19, | |
| "step": 17850 | |
| }, | |
| { | |
| "epoch": 11.41, | |
| "learning_rate": 0.000984309549165779, | |
| "loss": 0.1501, | |
| "step": 17860 | |
| }, | |
| { | |
| "epoch": 11.42, | |
| "learning_rate": 0.0009842385516506923, | |
| "loss": 0.1397, | |
| "step": 17870 | |
| }, | |
| { | |
| "epoch": 11.42, | |
| "learning_rate": 0.0009841675541356052, | |
| "loss": 0.1641, | |
| "step": 17880 | |
| }, | |
| { | |
| "epoch": 11.43, | |
| "learning_rate": 0.0009840965566205184, | |
| "loss": 0.161, | |
| "step": 17890 | |
| }, | |
| { | |
| "epoch": 11.44, | |
| "learning_rate": 0.0009840255591054314, | |
| "loss": 0.1751, | |
| "step": 17900 | |
| }, | |
| { | |
| "epoch": 11.44, | |
| "learning_rate": 0.0009839545615903443, | |
| "loss": 0.1774, | |
| "step": 17910 | |
| }, | |
| { | |
| "epoch": 11.45, | |
| "learning_rate": 0.0009838835640752573, | |
| "loss": 0.2226, | |
| "step": 17920 | |
| }, | |
| { | |
| "epoch": 11.46, | |
| "learning_rate": 0.0009838125665601704, | |
| "loss": 0.1531, | |
| "step": 17930 | |
| }, | |
| { | |
| "epoch": 11.46, | |
| "learning_rate": 0.0009837415690450834, | |
| "loss": 0.1807, | |
| "step": 17940 | |
| }, | |
| { | |
| "epoch": 11.47, | |
| "learning_rate": 0.0009836705715299966, | |
| "loss": 0.1769, | |
| "step": 17950 | |
| }, | |
| { | |
| "epoch": 11.48, | |
| "learning_rate": 0.0009835995740149095, | |
| "loss": 0.1727, | |
| "step": 17960 | |
| }, | |
| { | |
| "epoch": 11.48, | |
| "learning_rate": 0.0009835285764998225, | |
| "loss": 0.1738, | |
| "step": 17970 | |
| }, | |
| { | |
| "epoch": 11.49, | |
| "learning_rate": 0.0009834575789847355, | |
| "loss": 0.1354, | |
| "step": 17980 | |
| }, | |
| { | |
| "epoch": 11.5, | |
| "learning_rate": 0.0009833865814696486, | |
| "loss": 0.1979, | |
| "step": 17990 | |
| }, | |
| { | |
| "epoch": 11.5, | |
| "learning_rate": 0.0009833155839545616, | |
| "loss": 0.1774, | |
| "step": 18000 | |
| }, | |
| { | |
| "epoch": 11.51, | |
| "learning_rate": 0.0009832445864394748, | |
| "loss": 0.1869, | |
| "step": 18010 | |
| }, | |
| { | |
| "epoch": 11.51, | |
| "learning_rate": 0.0009831735889243877, | |
| "loss": 0.1486, | |
| "step": 18020 | |
| }, | |
| { | |
| "epoch": 11.52, | |
| "learning_rate": 0.0009831025914093007, | |
| "loss": 0.2041, | |
| "step": 18030 | |
| }, | |
| { | |
| "epoch": 11.53, | |
| "learning_rate": 0.0009830315938942136, | |
| "loss": 0.188, | |
| "step": 18040 | |
| }, | |
| { | |
| "epoch": 11.53, | |
| "learning_rate": 0.0009829605963791268, | |
| "loss": 0.1349, | |
| "step": 18050 | |
| }, | |
| { | |
| "epoch": 11.54, | |
| "learning_rate": 0.0009828895988640398, | |
| "loss": 0.1786, | |
| "step": 18060 | |
| }, | |
| { | |
| "epoch": 11.55, | |
| "learning_rate": 0.000982818601348953, | |
| "loss": 0.1886, | |
| "step": 18070 | |
| }, | |
| { | |
| "epoch": 11.55, | |
| "learning_rate": 0.000982747603833866, | |
| "loss": 0.1876, | |
| "step": 18080 | |
| }, | |
| { | |
| "epoch": 11.56, | |
| "learning_rate": 0.0009826766063187789, | |
| "loss": 0.189, | |
| "step": 18090 | |
| }, | |
| { | |
| "epoch": 11.57, | |
| "learning_rate": 0.0009826056088036918, | |
| "loss": 0.1677, | |
| "step": 18100 | |
| }, | |
| { | |
| "epoch": 11.57, | |
| "learning_rate": 0.000982534611288605, | |
| "loss": 0.2143, | |
| "step": 18110 | |
| }, | |
| { | |
| "epoch": 11.58, | |
| "learning_rate": 0.000982463613773518, | |
| "loss": 0.1722, | |
| "step": 18120 | |
| }, | |
| { | |
| "epoch": 11.58, | |
| "learning_rate": 0.0009823926162584311, | |
| "loss": 0.1762, | |
| "step": 18130 | |
| }, | |
| { | |
| "epoch": 11.59, | |
| "learning_rate": 0.000982321618743344, | |
| "loss": 0.1833, | |
| "step": 18140 | |
| }, | |
| { | |
| "epoch": 11.6, | |
| "learning_rate": 0.000982250621228257, | |
| "loss": 0.1845, | |
| "step": 18150 | |
| }, | |
| { | |
| "epoch": 11.6, | |
| "learning_rate": 0.00098217962371317, | |
| "loss": 0.1567, | |
| "step": 18160 | |
| }, | |
| { | |
| "epoch": 11.61, | |
| "learning_rate": 0.000982108626198083, | |
| "loss": 0.1642, | |
| "step": 18170 | |
| }, | |
| { | |
| "epoch": 11.62, | |
| "learning_rate": 0.0009820376286829961, | |
| "loss": 0.1576, | |
| "step": 18180 | |
| }, | |
| { | |
| "epoch": 11.62, | |
| "learning_rate": 0.000981966631167909, | |
| "loss": 0.1377, | |
| "step": 18190 | |
| }, | |
| { | |
| "epoch": 11.63, | |
| "learning_rate": 0.0009818956336528223, | |
| "loss": 0.1921, | |
| "step": 18200 | |
| }, | |
| { | |
| "epoch": 11.64, | |
| "learning_rate": 0.0009818246361377352, | |
| "loss": 0.2037, | |
| "step": 18210 | |
| }, | |
| { | |
| "epoch": 11.64, | |
| "learning_rate": 0.0009817536386226482, | |
| "loss": 0.1988, | |
| "step": 18220 | |
| }, | |
| { | |
| "epoch": 11.65, | |
| "learning_rate": 0.0009816826411075611, | |
| "loss": 0.1576, | |
| "step": 18230 | |
| }, | |
| { | |
| "epoch": 11.65, | |
| "learning_rate": 0.0009816116435924743, | |
| "loss": 0.1727, | |
| "step": 18240 | |
| }, | |
| { | |
| "epoch": 11.66, | |
| "learning_rate": 0.0009815406460773873, | |
| "loss": 0.1925, | |
| "step": 18250 | |
| }, | |
| { | |
| "epoch": 11.67, | |
| "learning_rate": 0.0009814696485623004, | |
| "loss": 0.1942, | |
| "step": 18260 | |
| }, | |
| { | |
| "epoch": 11.67, | |
| "learning_rate": 0.0009813986510472134, | |
| "loss": 0.1506, | |
| "step": 18270 | |
| }, | |
| { | |
| "epoch": 11.68, | |
| "learning_rate": 0.0009813276535321264, | |
| "loss": 0.1973, | |
| "step": 18280 | |
| }, | |
| { | |
| "epoch": 11.69, | |
| "learning_rate": 0.0009812566560170393, | |
| "loss": 0.1641, | |
| "step": 18290 | |
| }, | |
| { | |
| "epoch": 11.69, | |
| "learning_rate": 0.0009811856585019525, | |
| "loss": 0.1719, | |
| "step": 18300 | |
| }, | |
| { | |
| "epoch": 11.7, | |
| "learning_rate": 0.0009811146609868654, | |
| "loss": 0.1681, | |
| "step": 18310 | |
| }, | |
| { | |
| "epoch": 11.71, | |
| "learning_rate": 0.0009810436634717786, | |
| "loss": 0.1644, | |
| "step": 18320 | |
| }, | |
| { | |
| "epoch": 11.71, | |
| "learning_rate": 0.0009809726659566916, | |
| "loss": 0.153, | |
| "step": 18330 | |
| }, | |
| { | |
| "epoch": 11.72, | |
| "learning_rate": 0.0009809016684416045, | |
| "loss": 0.1978, | |
| "step": 18340 | |
| }, | |
| { | |
| "epoch": 11.73, | |
| "learning_rate": 0.0009808306709265175, | |
| "loss": 0.1808, | |
| "step": 18350 | |
| }, | |
| { | |
| "epoch": 11.73, | |
| "learning_rate": 0.0009807596734114307, | |
| "loss": 0.1967, | |
| "step": 18360 | |
| }, | |
| { | |
| "epoch": 11.74, | |
| "learning_rate": 0.0009806886758963436, | |
| "loss": 0.1699, | |
| "step": 18370 | |
| }, | |
| { | |
| "epoch": 11.74, | |
| "learning_rate": 0.0009806176783812568, | |
| "loss": 0.1866, | |
| "step": 18380 | |
| }, | |
| { | |
| "epoch": 11.75, | |
| "learning_rate": 0.0009805466808661698, | |
| "loss": 0.1813, | |
| "step": 18390 | |
| }, | |
| { | |
| "epoch": 11.76, | |
| "learning_rate": 0.0009804756833510827, | |
| "loss": 0.1742, | |
| "step": 18400 | |
| }, | |
| { | |
| "epoch": 11.76, | |
| "learning_rate": 0.0009804046858359957, | |
| "loss": 0.2112, | |
| "step": 18410 | |
| }, | |
| { | |
| "epoch": 11.77, | |
| "learning_rate": 0.0009803336883209088, | |
| "loss": 0.1966, | |
| "step": 18420 | |
| }, | |
| { | |
| "epoch": 11.78, | |
| "learning_rate": 0.0009802626908058218, | |
| "loss": 0.1639, | |
| "step": 18430 | |
| }, | |
| { | |
| "epoch": 11.78, | |
| "learning_rate": 0.000980191693290735, | |
| "loss": 0.1614, | |
| "step": 18440 | |
| }, | |
| { | |
| "epoch": 11.79, | |
| "learning_rate": 0.000980120695775648, | |
| "loss": 0.1992, | |
| "step": 18450 | |
| }, | |
| { | |
| "epoch": 11.8, | |
| "learning_rate": 0.000980049698260561, | |
| "loss": 0.1965, | |
| "step": 18460 | |
| }, | |
| { | |
| "epoch": 11.8, | |
| "learning_rate": 0.0009799787007454739, | |
| "loss": 0.1885, | |
| "step": 18470 | |
| }, | |
| { | |
| "epoch": 11.81, | |
| "learning_rate": 0.0009799077032303868, | |
| "loss": 0.1509, | |
| "step": 18480 | |
| }, | |
| { | |
| "epoch": 11.81, | |
| "learning_rate": 0.0009798367057153, | |
| "loss": 0.1952, | |
| "step": 18490 | |
| }, | |
| { | |
| "epoch": 11.82, | |
| "learning_rate": 0.000979765708200213, | |
| "loss": 0.1801, | |
| "step": 18500 | |
| }, | |
| { | |
| "epoch": 11.83, | |
| "learning_rate": 0.0009796947106851261, | |
| "loss": 0.1521, | |
| "step": 18510 | |
| }, | |
| { | |
| "epoch": 11.83, | |
| "learning_rate": 0.000979623713170039, | |
| "loss": 0.1632, | |
| "step": 18520 | |
| }, | |
| { | |
| "epoch": 11.84, | |
| "learning_rate": 0.000979552715654952, | |
| "loss": 0.1945, | |
| "step": 18530 | |
| }, | |
| { | |
| "epoch": 11.85, | |
| "learning_rate": 0.000979481718139865, | |
| "loss": 0.1883, | |
| "step": 18540 | |
| }, | |
| { | |
| "epoch": 11.85, | |
| "learning_rate": 0.0009794107206247782, | |
| "loss": 0.1832, | |
| "step": 18550 | |
| }, | |
| { | |
| "epoch": 11.86, | |
| "learning_rate": 0.0009793397231096911, | |
| "loss": 0.1933, | |
| "step": 18560 | |
| }, | |
| { | |
| "epoch": 11.87, | |
| "learning_rate": 0.0009792687255946043, | |
| "loss": 0.1785, | |
| "step": 18570 | |
| }, | |
| { | |
| "epoch": 11.87, | |
| "learning_rate": 0.0009791977280795173, | |
| "loss": 0.1788, | |
| "step": 18580 | |
| }, | |
| { | |
| "epoch": 11.88, | |
| "learning_rate": 0.0009791267305644302, | |
| "loss": 0.18, | |
| "step": 18590 | |
| }, | |
| { | |
| "epoch": 11.88, | |
| "learning_rate": 0.0009790557330493432, | |
| "loss": 0.1882, | |
| "step": 18600 | |
| }, | |
| { | |
| "epoch": 11.89, | |
| "learning_rate": 0.0009789847355342563, | |
| "loss": 0.1823, | |
| "step": 18610 | |
| }, | |
| { | |
| "epoch": 11.9, | |
| "learning_rate": 0.0009789137380191693, | |
| "loss": 0.1843, | |
| "step": 18620 | |
| }, | |
| { | |
| "epoch": 11.9, | |
| "learning_rate": 0.0009788427405040825, | |
| "loss": 0.1725, | |
| "step": 18630 | |
| }, | |
| { | |
| "epoch": 11.91, | |
| "learning_rate": 0.0009787717429889954, | |
| "loss": 0.1905, | |
| "step": 18640 | |
| }, | |
| { | |
| "epoch": 11.92, | |
| "learning_rate": 0.0009787007454739084, | |
| "loss": 0.1904, | |
| "step": 18650 | |
| }, | |
| { | |
| "epoch": 11.92, | |
| "learning_rate": 0.0009786297479588214, | |
| "loss": 0.1537, | |
| "step": 18660 | |
| }, | |
| { | |
| "epoch": 11.93, | |
| "learning_rate": 0.0009785587504437345, | |
| "loss": 0.1519, | |
| "step": 18670 | |
| }, | |
| { | |
| "epoch": 11.94, | |
| "learning_rate": 0.0009784877529286475, | |
| "loss": 0.1831, | |
| "step": 18680 | |
| }, | |
| { | |
| "epoch": 11.94, | |
| "learning_rate": 0.0009784167554135607, | |
| "loss": 0.1562, | |
| "step": 18690 | |
| }, | |
| { | |
| "epoch": 11.95, | |
| "learning_rate": 0.0009783457578984736, | |
| "loss": 0.2007, | |
| "step": 18700 | |
| }, | |
| { | |
| "epoch": 11.95, | |
| "learning_rate": 0.0009782747603833866, | |
| "loss": 0.1683, | |
| "step": 18710 | |
| }, | |
| { | |
| "epoch": 11.96, | |
| "learning_rate": 0.0009782037628682995, | |
| "loss": 0.1927, | |
| "step": 18720 | |
| }, | |
| { | |
| "epoch": 11.97, | |
| "learning_rate": 0.0009781327653532127, | |
| "loss": 0.178, | |
| "step": 18730 | |
| }, | |
| { | |
| "epoch": 11.97, | |
| "learning_rate": 0.0009780617678381257, | |
| "loss": 0.1629, | |
| "step": 18740 | |
| }, | |
| { | |
| "epoch": 11.98, | |
| "learning_rate": 0.0009779907703230388, | |
| "loss": 0.177, | |
| "step": 18750 | |
| }, | |
| { | |
| "epoch": 11.99, | |
| "learning_rate": 0.0009779197728079518, | |
| "loss": 0.1758, | |
| "step": 18760 | |
| }, | |
| { | |
| "epoch": 11.99, | |
| "learning_rate": 0.0009778487752928648, | |
| "loss": 0.2114, | |
| "step": 18770 | |
| }, | |
| { | |
| "epoch": 12.0, | |
| "learning_rate": 0.0009777777777777777, | |
| "loss": 0.1582, | |
| "step": 18780 | |
| }, | |
| { | |
| "epoch": 12.01, | |
| "learning_rate": 0.0009777067802626907, | |
| "loss": 0.1586, | |
| "step": 18790 | |
| }, | |
| { | |
| "epoch": 12.01, | |
| "learning_rate": 0.0009776357827476038, | |
| "loss": 0.1523, | |
| "step": 18800 | |
| }, | |
| { | |
| "epoch": 12.02, | |
| "learning_rate": 0.0009775647852325168, | |
| "loss": 0.1614, | |
| "step": 18810 | |
| }, | |
| { | |
| "epoch": 12.03, | |
| "learning_rate": 0.00097749378771743, | |
| "loss": 0.169, | |
| "step": 18820 | |
| }, | |
| { | |
| "epoch": 12.03, | |
| "learning_rate": 0.000977422790202343, | |
| "loss": 0.1339, | |
| "step": 18830 | |
| }, | |
| { | |
| "epoch": 12.04, | |
| "learning_rate": 0.000977351792687256, | |
| "loss": 0.1313, | |
| "step": 18840 | |
| }, | |
| { | |
| "epoch": 12.04, | |
| "learning_rate": 0.0009772807951721689, | |
| "loss": 0.1481, | |
| "step": 18850 | |
| }, | |
| { | |
| "epoch": 12.05, | |
| "learning_rate": 0.000977209797657082, | |
| "loss": 0.1294, | |
| "step": 18860 | |
| }, | |
| { | |
| "epoch": 12.06, | |
| "learning_rate": 0.000977138800141995, | |
| "loss": 0.1555, | |
| "step": 18870 | |
| }, | |
| { | |
| "epoch": 12.06, | |
| "learning_rate": 0.0009770678026269082, | |
| "loss": 0.1555, | |
| "step": 18880 | |
| }, | |
| { | |
| "epoch": 12.07, | |
| "learning_rate": 0.0009769968051118211, | |
| "loss": 0.1688, | |
| "step": 18890 | |
| }, | |
| { | |
| "epoch": 12.08, | |
| "learning_rate": 0.000976925807596734, | |
| "loss": 0.1738, | |
| "step": 18900 | |
| }, | |
| { | |
| "epoch": 12.08, | |
| "learning_rate": 0.000976854810081647, | |
| "loss": 0.1463, | |
| "step": 18910 | |
| }, | |
| { | |
| "epoch": 12.09, | |
| "learning_rate": 0.0009767838125665602, | |
| "loss": 0.1241, | |
| "step": 18920 | |
| }, | |
| { | |
| "epoch": 12.1, | |
| "learning_rate": 0.0009767128150514732, | |
| "loss": 0.1401, | |
| "step": 18930 | |
| }, | |
| { | |
| "epoch": 12.1, | |
| "learning_rate": 0.0009766418175363863, | |
| "loss": 0.1685, | |
| "step": 18940 | |
| }, | |
| { | |
| "epoch": 12.11, | |
| "learning_rate": 0.0009765708200212993, | |
| "loss": 0.1761, | |
| "step": 18950 | |
| }, | |
| { | |
| "epoch": 12.11, | |
| "learning_rate": 0.0009764998225062123, | |
| "loss": 0.1738, | |
| "step": 18960 | |
| }, | |
| { | |
| "epoch": 12.12, | |
| "learning_rate": 0.0009764288249911253, | |
| "loss": 0.1195, | |
| "step": 18970 | |
| }, | |
| { | |
| "epoch": 12.13, | |
| "learning_rate": 0.0009763578274760384, | |
| "loss": 0.1416, | |
| "step": 18980 | |
| }, | |
| { | |
| "epoch": 12.13, | |
| "learning_rate": 0.0009762868299609515, | |
| "loss": 0.1504, | |
| "step": 18990 | |
| }, | |
| { | |
| "epoch": 12.14, | |
| "learning_rate": 0.0009762158324458644, | |
| "loss": 0.1515, | |
| "step": 19000 | |
| }, | |
| { | |
| "epoch": 12.15, | |
| "learning_rate": 0.0009761448349307775, | |
| "loss": 0.1773, | |
| "step": 19010 | |
| }, | |
| { | |
| "epoch": 12.15, | |
| "learning_rate": 0.0009760738374156904, | |
| "loss": 0.1548, | |
| "step": 19020 | |
| }, | |
| { | |
| "epoch": 12.16, | |
| "learning_rate": 0.0009760028399006035, | |
| "loss": 0.1606, | |
| "step": 19030 | |
| }, | |
| { | |
| "epoch": 12.17, | |
| "learning_rate": 0.0009759318423855166, | |
| "loss": 0.1607, | |
| "step": 19040 | |
| }, | |
| { | |
| "epoch": 12.17, | |
| "learning_rate": 0.0009758608448704296, | |
| "loss": 0.1473, | |
| "step": 19050 | |
| }, | |
| { | |
| "epoch": 12.18, | |
| "learning_rate": 0.0009757898473553426, | |
| "loss": 0.1539, | |
| "step": 19060 | |
| }, | |
| { | |
| "epoch": 12.19, | |
| "learning_rate": 0.0009757188498402556, | |
| "loss": 0.1577, | |
| "step": 19070 | |
| }, | |
| { | |
| "epoch": 12.19, | |
| "learning_rate": 0.0009756478523251686, | |
| "loss": 0.1825, | |
| "step": 19080 | |
| }, | |
| { | |
| "epoch": 12.2, | |
| "learning_rate": 0.0009755768548100816, | |
| "loss": 0.1687, | |
| "step": 19090 | |
| }, | |
| { | |
| "epoch": 12.2, | |
| "learning_rate": 0.0009755058572949948, | |
| "loss": 0.188, | |
| "step": 19100 | |
| }, | |
| { | |
| "epoch": 12.21, | |
| "learning_rate": 0.0009754348597799077, | |
| "loss": 0.1424, | |
| "step": 19110 | |
| }, | |
| { | |
| "epoch": 12.22, | |
| "learning_rate": 0.0009753638622648208, | |
| "loss": 0.1478, | |
| "step": 19120 | |
| }, | |
| { | |
| "epoch": 12.22, | |
| "learning_rate": 0.0009752928647497337, | |
| "loss": 0.1601, | |
| "step": 19130 | |
| }, | |
| { | |
| "epoch": 12.23, | |
| "learning_rate": 0.0009752218672346468, | |
| "loss": 0.1706, | |
| "step": 19140 | |
| }, | |
| { | |
| "epoch": 12.24, | |
| "learning_rate": 0.0009751508697195598, | |
| "loss": 0.1565, | |
| "step": 19150 | |
| }, | |
| { | |
| "epoch": 12.24, | |
| "learning_rate": 0.0009750798722044729, | |
| "loss": 0.1258, | |
| "step": 19160 | |
| }, | |
| { | |
| "epoch": 12.25, | |
| "learning_rate": 0.0009750088746893859, | |
| "loss": 0.1468, | |
| "step": 19170 | |
| }, | |
| { | |
| "epoch": 12.26, | |
| "learning_rate": 0.000974937877174299, | |
| "loss": 0.1865, | |
| "step": 19180 | |
| }, | |
| { | |
| "epoch": 12.26, | |
| "learning_rate": 0.0009748668796592119, | |
| "loss": 0.1551, | |
| "step": 19190 | |
| }, | |
| { | |
| "epoch": 12.27, | |
| "learning_rate": 0.000974795882144125, | |
| "loss": 0.1688, | |
| "step": 19200 | |
| }, | |
| { | |
| "epoch": 12.27, | |
| "learning_rate": 0.0009747248846290379, | |
| "loss": 0.16, | |
| "step": 19210 | |
| }, | |
| { | |
| "epoch": 12.28, | |
| "learning_rate": 0.000974653887113951, | |
| "loss": 0.1686, | |
| "step": 19220 | |
| }, | |
| { | |
| "epoch": 12.29, | |
| "learning_rate": 0.0009745828895988641, | |
| "loss": 0.1644, | |
| "step": 19230 | |
| }, | |
| { | |
| "epoch": 12.29, | |
| "learning_rate": 0.0009745118920837771, | |
| "loss": 0.1605, | |
| "step": 19240 | |
| }, | |
| { | |
| "epoch": 12.3, | |
| "learning_rate": 0.0009744408945686901, | |
| "loss": 0.1506, | |
| "step": 19250 | |
| }, | |
| { | |
| "epoch": 12.31, | |
| "learning_rate": 0.0009743698970536032, | |
| "loss": 0.1436, | |
| "step": 19260 | |
| }, | |
| { | |
| "epoch": 12.31, | |
| "learning_rate": 0.0009742988995385161, | |
| "loss": 0.1685, | |
| "step": 19270 | |
| }, | |
| { | |
| "epoch": 12.32, | |
| "learning_rate": 0.0009742279020234292, | |
| "loss": 0.1505, | |
| "step": 19280 | |
| }, | |
| { | |
| "epoch": 12.33, | |
| "learning_rate": 0.0009741569045083423, | |
| "loss": 0.1609, | |
| "step": 19290 | |
| }, | |
| { | |
| "epoch": 12.33, | |
| "learning_rate": 0.0009740859069932553, | |
| "loss": 0.1803, | |
| "step": 19300 | |
| }, | |
| { | |
| "epoch": 12.34, | |
| "learning_rate": 0.0009740149094781683, | |
| "loss": 0.1806, | |
| "step": 19310 | |
| }, | |
| { | |
| "epoch": 12.34, | |
| "learning_rate": 0.0009739439119630813, | |
| "loss": 0.1733, | |
| "step": 19320 | |
| }, | |
| { | |
| "epoch": 12.35, | |
| "learning_rate": 0.0009738729144479943, | |
| "loss": 0.1618, | |
| "step": 19330 | |
| }, | |
| { | |
| "epoch": 12.36, | |
| "learning_rate": 0.0009738019169329074, | |
| "loss": 0.157, | |
| "step": 19340 | |
| }, | |
| { | |
| "epoch": 12.36, | |
| "learning_rate": 0.0009737309194178204, | |
| "loss": 0.1374, | |
| "step": 19350 | |
| }, | |
| { | |
| "epoch": 12.37, | |
| "learning_rate": 0.0009736599219027335, | |
| "loss": 0.1689, | |
| "step": 19360 | |
| }, | |
| { | |
| "epoch": 12.38, | |
| "learning_rate": 0.0009735889243876465, | |
| "loss": 0.1813, | |
| "step": 19370 | |
| }, | |
| { | |
| "epoch": 12.38, | |
| "learning_rate": 0.0009735179268725594, | |
| "loss": 0.1313, | |
| "step": 19380 | |
| }, | |
| { | |
| "epoch": 12.39, | |
| "learning_rate": 0.0009734469293574725, | |
| "loss": 0.16, | |
| "step": 19390 | |
| }, | |
| { | |
| "epoch": 12.4, | |
| "learning_rate": 0.0009733759318423854, | |
| "loss": 0.1317, | |
| "step": 19400 | |
| }, | |
| { | |
| "epoch": 12.4, | |
| "learning_rate": 0.0009733049343272986, | |
| "loss": 0.13, | |
| "step": 19410 | |
| }, | |
| { | |
| "epoch": 12.41, | |
| "learning_rate": 0.0009732339368122116, | |
| "loss": 0.15, | |
| "step": 19420 | |
| }, | |
| { | |
| "epoch": 12.42, | |
| "learning_rate": 0.0009731629392971246, | |
| "loss": 0.1567, | |
| "step": 19430 | |
| }, | |
| { | |
| "epoch": 12.42, | |
| "learning_rate": 0.0009730919417820376, | |
| "loss": 0.1477, | |
| "step": 19440 | |
| }, | |
| { | |
| "epoch": 12.43, | |
| "learning_rate": 0.0009730209442669507, | |
| "loss": 0.1409, | |
| "step": 19450 | |
| }, | |
| { | |
| "epoch": 12.43, | |
| "learning_rate": 0.0009729499467518636, | |
| "loss": 0.1793, | |
| "step": 19460 | |
| }, | |
| { | |
| "epoch": 12.44, | |
| "learning_rate": 0.0009728789492367768, | |
| "loss": 0.1322, | |
| "step": 19470 | |
| }, | |
| { | |
| "epoch": 12.45, | |
| "learning_rate": 0.0009728079517216898, | |
| "loss": 0.1645, | |
| "step": 19480 | |
| }, | |
| { | |
| "epoch": 12.45, | |
| "learning_rate": 0.0009727369542066028, | |
| "loss": 0.195, | |
| "step": 19490 | |
| }, | |
| { | |
| "epoch": 12.46, | |
| "learning_rate": 0.0009726659566915158, | |
| "loss": 0.1419, | |
| "step": 19500 | |
| }, | |
| { | |
| "epoch": 12.47, | |
| "learning_rate": 0.0009725949591764288, | |
| "loss": 0.1422, | |
| "step": 19510 | |
| }, | |
| { | |
| "epoch": 12.47, | |
| "learning_rate": 0.0009725239616613418, | |
| "loss": 0.1796, | |
| "step": 19520 | |
| }, | |
| { | |
| "epoch": 12.48, | |
| "learning_rate": 0.000972452964146255, | |
| "loss": 0.1615, | |
| "step": 19530 | |
| }, | |
| { | |
| "epoch": 12.49, | |
| "learning_rate": 0.0009723819666311679, | |
| "loss": 0.173, | |
| "step": 19540 | |
| }, | |
| { | |
| "epoch": 12.49, | |
| "learning_rate": 0.000972310969116081, | |
| "loss": 0.1442, | |
| "step": 19550 | |
| }, | |
| { | |
| "epoch": 12.5, | |
| "learning_rate": 0.000972239971600994, | |
| "loss": 0.1648, | |
| "step": 19560 | |
| }, | |
| { | |
| "epoch": 12.5, | |
| "learning_rate": 0.000972168974085907, | |
| "loss": 0.1543, | |
| "step": 19570 | |
| }, | |
| { | |
| "epoch": 12.51, | |
| "learning_rate": 0.00097209797657082, | |
| "loss": 0.1507, | |
| "step": 19580 | |
| }, | |
| { | |
| "epoch": 12.52, | |
| "learning_rate": 0.0009720269790557332, | |
| "loss": 0.1571, | |
| "step": 19590 | |
| }, | |
| { | |
| "epoch": 12.52, | |
| "learning_rate": 0.0009719559815406461, | |
| "loss": 0.1697, | |
| "step": 19600 | |
| }, | |
| { | |
| "epoch": 12.53, | |
| "learning_rate": 0.0009718849840255592, | |
| "loss": 0.1622, | |
| "step": 19610 | |
| }, | |
| { | |
| "epoch": 12.54, | |
| "learning_rate": 0.0009718139865104721, | |
| "loss": 0.1548, | |
| "step": 19620 | |
| }, | |
| { | |
| "epoch": 12.54, | |
| "learning_rate": 0.0009717429889953852, | |
| "loss": 0.169, | |
| "step": 19630 | |
| }, | |
| { | |
| "epoch": 12.55, | |
| "learning_rate": 0.0009716719914802982, | |
| "loss": 0.1644, | |
| "step": 19640 | |
| }, | |
| { | |
| "epoch": 12.56, | |
| "learning_rate": 0.0009716009939652113, | |
| "loss": 0.1387, | |
| "step": 19650 | |
| }, | |
| { | |
| "epoch": 12.56, | |
| "learning_rate": 0.0009715299964501243, | |
| "loss": 0.177, | |
| "step": 19660 | |
| }, | |
| { | |
| "epoch": 12.57, | |
| "learning_rate": 0.0009714589989350374, | |
| "loss": 0.1627, | |
| "step": 19670 | |
| }, | |
| { | |
| "epoch": 12.57, | |
| "learning_rate": 0.0009713880014199503, | |
| "loss": 0.1451, | |
| "step": 19680 | |
| }, | |
| { | |
| "epoch": 12.58, | |
| "learning_rate": 0.0009713170039048633, | |
| "loss": 0.1827, | |
| "step": 19690 | |
| }, | |
| { | |
| "epoch": 12.59, | |
| "learning_rate": 0.0009712460063897763, | |
| "loss": 0.1593, | |
| "step": 19700 | |
| }, | |
| { | |
| "epoch": 12.59, | |
| "learning_rate": 0.0009711750088746894, | |
| "loss": 0.1521, | |
| "step": 19710 | |
| }, | |
| { | |
| "epoch": 12.6, | |
| "learning_rate": 0.0009711040113596025, | |
| "loss": 0.1759, | |
| "step": 19720 | |
| }, | |
| { | |
| "epoch": 12.61, | |
| "learning_rate": 0.0009710330138445154, | |
| "loss": 0.1868, | |
| "step": 19730 | |
| }, | |
| { | |
| "epoch": 12.61, | |
| "learning_rate": 0.0009709620163294285, | |
| "loss": 0.1327, | |
| "step": 19740 | |
| }, | |
| { | |
| "epoch": 12.62, | |
| "learning_rate": 0.0009708910188143415, | |
| "loss": 0.1349, | |
| "step": 19750 | |
| }, | |
| { | |
| "epoch": 12.63, | |
| "learning_rate": 0.0009708200212992545, | |
| "loss": 0.1645, | |
| "step": 19760 | |
| }, | |
| { | |
| "epoch": 12.63, | |
| "learning_rate": 0.0009707490237841676, | |
| "loss": 0.1315, | |
| "step": 19770 | |
| }, | |
| { | |
| "epoch": 12.64, | |
| "learning_rate": 0.0009706780262690807, | |
| "loss": 0.184, | |
| "step": 19780 | |
| }, | |
| { | |
| "epoch": 12.65, | |
| "learning_rate": 0.0009706070287539936, | |
| "loss": 0.1557, | |
| "step": 19790 | |
| }, | |
| { | |
| "epoch": 12.65, | |
| "learning_rate": 0.0009705360312389067, | |
| "loss": 0.1622, | |
| "step": 19800 | |
| }, | |
| { | |
| "epoch": 12.66, | |
| "learning_rate": 0.0009704650337238196, | |
| "loss": 0.1598, | |
| "step": 19810 | |
| }, | |
| { | |
| "epoch": 12.66, | |
| "learning_rate": 0.0009703940362087327, | |
| "loss": 0.1914, | |
| "step": 19820 | |
| }, | |
| { | |
| "epoch": 12.67, | |
| "learning_rate": 0.0009703230386936457, | |
| "loss": 0.1757, | |
| "step": 19830 | |
| }, | |
| { | |
| "epoch": 12.68, | |
| "learning_rate": 0.0009702520411785588, | |
| "loss": 0.1613, | |
| "step": 19840 | |
| }, | |
| { | |
| "epoch": 12.68, | |
| "learning_rate": 0.0009701810436634718, | |
| "loss": 0.175, | |
| "step": 19850 | |
| }, | |
| { | |
| "epoch": 12.69, | |
| "learning_rate": 0.0009701100461483849, | |
| "loss": 0.1778, | |
| "step": 19860 | |
| }, | |
| { | |
| "epoch": 12.7, | |
| "learning_rate": 0.0009700390486332978, | |
| "loss": 0.14, | |
| "step": 19870 | |
| }, | |
| { | |
| "epoch": 12.7, | |
| "learning_rate": 0.0009699680511182109, | |
| "loss": 0.148, | |
| "step": 19880 | |
| }, | |
| { | |
| "epoch": 12.71, | |
| "learning_rate": 0.0009698970536031238, | |
| "loss": 0.1899, | |
| "step": 19890 | |
| }, | |
| { | |
| "epoch": 12.72, | |
| "learning_rate": 0.000969826056088037, | |
| "loss": 0.143, | |
| "step": 19900 | |
| }, | |
| { | |
| "epoch": 12.72, | |
| "learning_rate": 0.00096975505857295, | |
| "loss": 0.1668, | |
| "step": 19910 | |
| }, | |
| { | |
| "epoch": 12.73, | |
| "learning_rate": 0.000969684061057863, | |
| "loss": 0.1607, | |
| "step": 19920 | |
| }, | |
| { | |
| "epoch": 12.73, | |
| "learning_rate": 0.000969613063542776, | |
| "loss": 0.1357, | |
| "step": 19930 | |
| }, | |
| { | |
| "epoch": 12.74, | |
| "learning_rate": 0.0009695420660276891, | |
| "loss": 0.18, | |
| "step": 19940 | |
| }, | |
| { | |
| "epoch": 12.75, | |
| "learning_rate": 0.000969471068512602, | |
| "loss": 0.1766, | |
| "step": 19950 | |
| }, | |
| { | |
| "epoch": 12.75, | |
| "learning_rate": 0.0009694000709975152, | |
| "loss": 0.1852, | |
| "step": 19960 | |
| }, | |
| { | |
| "epoch": 12.76, | |
| "learning_rate": 0.0009693290734824282, | |
| "loss": 0.1969, | |
| "step": 19970 | |
| }, | |
| { | |
| "epoch": 12.77, | |
| "learning_rate": 0.0009692580759673412, | |
| "loss": 0.1483, | |
| "step": 19980 | |
| }, | |
| { | |
| "epoch": 12.77, | |
| "learning_rate": 0.0009691870784522542, | |
| "loss": 0.1823, | |
| "step": 19990 | |
| }, | |
| { | |
| "epoch": 12.78, | |
| "learning_rate": 0.0009691160809371671, | |
| "loss": 0.1495, | |
| "step": 20000 | |
| }, | |
| { | |
| "epoch": 12.79, | |
| "learning_rate": 0.0009690450834220802, | |
| "loss": 0.144, | |
| "step": 20010 | |
| }, | |
| { | |
| "epoch": 12.79, | |
| "learning_rate": 0.0009689740859069933, | |
| "loss": 0.1633, | |
| "step": 20020 | |
| }, | |
| { | |
| "epoch": 12.8, | |
| "learning_rate": 0.0009689030883919063, | |
| "loss": 0.1736, | |
| "step": 20030 | |
| }, | |
| { | |
| "epoch": 12.8, | |
| "learning_rate": 0.0009688320908768193, | |
| "loss": 0.1848, | |
| "step": 20040 | |
| }, | |
| { | |
| "epoch": 12.81, | |
| "learning_rate": 0.0009687610933617324, | |
| "loss": 0.1701, | |
| "step": 20050 | |
| }, | |
| { | |
| "epoch": 12.82, | |
| "learning_rate": 0.0009686900958466453, | |
| "loss": 0.1647, | |
| "step": 20060 | |
| }, | |
| { | |
| "epoch": 12.82, | |
| "learning_rate": 0.0009686190983315584, | |
| "loss": 0.1801, | |
| "step": 20070 | |
| }, | |
| { | |
| "epoch": 12.83, | |
| "learning_rate": 0.0009685481008164714, | |
| "loss": 0.1595, | |
| "step": 20080 | |
| }, | |
| { | |
| "epoch": 12.84, | |
| "learning_rate": 0.0009684771033013845, | |
| "loss": 0.1618, | |
| "step": 20090 | |
| }, | |
| { | |
| "epoch": 12.84, | |
| "learning_rate": 0.0009684061057862975, | |
| "loss": 0.1559, | |
| "step": 20100 | |
| }, | |
| { | |
| "epoch": 12.85, | |
| "learning_rate": 0.0009683351082712105, | |
| "loss": 0.173, | |
| "step": 20110 | |
| }, | |
| { | |
| "epoch": 12.86, | |
| "learning_rate": 0.0009682641107561235, | |
| "loss": 0.15, | |
| "step": 20120 | |
| }, | |
| { | |
| "epoch": 12.86, | |
| "learning_rate": 0.0009681931132410366, | |
| "loss": 0.1707, | |
| "step": 20130 | |
| }, | |
| { | |
| "epoch": 12.87, | |
| "learning_rate": 0.0009681221157259496, | |
| "loss": 0.1403, | |
| "step": 20140 | |
| }, | |
| { | |
| "epoch": 12.88, | |
| "learning_rate": 0.0009680511182108627, | |
| "loss": 0.1787, | |
| "step": 20150 | |
| }, | |
| { | |
| "epoch": 12.88, | |
| "learning_rate": 0.0009679801206957757, | |
| "loss": 0.1708, | |
| "step": 20160 | |
| }, | |
| { | |
| "epoch": 12.89, | |
| "learning_rate": 0.0009679091231806887, | |
| "loss": 0.1595, | |
| "step": 20170 | |
| }, | |
| { | |
| "epoch": 12.89, | |
| "learning_rate": 0.0009678381256656017, | |
| "loss": 0.1536, | |
| "step": 20180 | |
| }, | |
| { | |
| "epoch": 12.9, | |
| "learning_rate": 0.0009677671281505147, | |
| "loss": 0.1783, | |
| "step": 20190 | |
| }, | |
| { | |
| "epoch": 12.91, | |
| "learning_rate": 0.0009676961306354278, | |
| "loss": 0.1694, | |
| "step": 20200 | |
| }, | |
| { | |
| "epoch": 12.91, | |
| "learning_rate": 0.0009676251331203409, | |
| "loss": 0.1593, | |
| "step": 20210 | |
| }, | |
| { | |
| "epoch": 12.92, | |
| "learning_rate": 0.0009675541356052538, | |
| "loss": 0.1378, | |
| "step": 20220 | |
| }, | |
| { | |
| "epoch": 12.93, | |
| "learning_rate": 0.0009674831380901669, | |
| "loss": 0.174, | |
| "step": 20230 | |
| }, | |
| { | |
| "epoch": 12.93, | |
| "learning_rate": 0.0009674121405750799, | |
| "loss": 0.1588, | |
| "step": 20240 | |
| }, | |
| { | |
| "epoch": 12.94, | |
| "learning_rate": 0.0009673411430599929, | |
| "loss": 0.1726, | |
| "step": 20250 | |
| }, | |
| { | |
| "epoch": 12.95, | |
| "learning_rate": 0.000967270145544906, | |
| "loss": 0.1696, | |
| "step": 20260 | |
| }, | |
| { | |
| "epoch": 12.95, | |
| "learning_rate": 0.0009671991480298191, | |
| "loss": 0.1529, | |
| "step": 20270 | |
| }, | |
| { | |
| "epoch": 12.96, | |
| "learning_rate": 0.000967128150514732, | |
| "loss": 0.1869, | |
| "step": 20280 | |
| }, | |
| { | |
| "epoch": 12.96, | |
| "learning_rate": 0.0009670571529996451, | |
| "loss": 0.1673, | |
| "step": 20290 | |
| }, | |
| { | |
| "epoch": 12.97, | |
| "learning_rate": 0.000966986155484558, | |
| "loss": 0.1682, | |
| "step": 20300 | |
| }, | |
| { | |
| "epoch": 12.98, | |
| "learning_rate": 0.000966915157969471, | |
| "loss": 0.1937, | |
| "step": 20310 | |
| }, | |
| { | |
| "epoch": 12.98, | |
| "learning_rate": 0.0009668441604543842, | |
| "loss": 0.1636, | |
| "step": 20320 | |
| }, | |
| { | |
| "epoch": 12.99, | |
| "learning_rate": 0.0009667731629392971, | |
| "loss": 0.1535, | |
| "step": 20330 | |
| }, | |
| { | |
| "epoch": 13.0, | |
| "learning_rate": 0.0009667021654242102, | |
| "loss": 0.1794, | |
| "step": 20340 | |
| }, | |
| { | |
| "epoch": 13.0, | |
| "learning_rate": 0.0009666311679091232, | |
| "loss": 0.1457, | |
| "step": 20350 | |
| }, | |
| { | |
| "epoch": 13.01, | |
| "learning_rate": 0.0009665601703940362, | |
| "loss": 0.168, | |
| "step": 20360 | |
| }, | |
| { | |
| "epoch": 13.02, | |
| "learning_rate": 0.0009664891728789492, | |
| "loss": 0.1501, | |
| "step": 20370 | |
| }, | |
| { | |
| "epoch": 13.02, | |
| "learning_rate": 0.0009664181753638623, | |
| "loss": 0.1401, | |
| "step": 20380 | |
| }, | |
| { | |
| "epoch": 13.03, | |
| "learning_rate": 0.0009663471778487753, | |
| "loss": 0.1438, | |
| "step": 20390 | |
| }, | |
| { | |
| "epoch": 13.04, | |
| "learning_rate": 0.0009662761803336884, | |
| "loss": 0.1199, | |
| "step": 20400 | |
| }, | |
| { | |
| "epoch": 13.04, | |
| "learning_rate": 0.0009662051828186013, | |
| "loss": 0.1534, | |
| "step": 20410 | |
| }, | |
| { | |
| "epoch": 13.05, | |
| "learning_rate": 0.0009661341853035144, | |
| "loss": 0.1386, | |
| "step": 20420 | |
| }, | |
| { | |
| "epoch": 13.05, | |
| "learning_rate": 0.0009660631877884274, | |
| "loss": 0.1598, | |
| "step": 20430 | |
| }, | |
| { | |
| "epoch": 13.06, | |
| "learning_rate": 0.0009659921902733404, | |
| "loss": 0.1612, | |
| "step": 20440 | |
| }, | |
| { | |
| "epoch": 13.07, | |
| "learning_rate": 0.0009659211927582535, | |
| "loss": 0.1319, | |
| "step": 20450 | |
| }, | |
| { | |
| "epoch": 13.07, | |
| "learning_rate": 0.0009658501952431666, | |
| "loss": 0.157, | |
| "step": 20460 | |
| }, | |
| { | |
| "epoch": 13.08, | |
| "learning_rate": 0.0009657791977280795, | |
| "loss": 0.1411, | |
| "step": 20470 | |
| }, | |
| { | |
| "epoch": 13.09, | |
| "learning_rate": 0.0009657082002129926, | |
| "loss": 0.1287, | |
| "step": 20480 | |
| }, | |
| { | |
| "epoch": 13.09, | |
| "learning_rate": 0.0009656372026979055, | |
| "loss": 0.1241, | |
| "step": 20490 | |
| }, | |
| { | |
| "epoch": 13.1, | |
| "learning_rate": 0.0009655662051828186, | |
| "loss": 0.168, | |
| "step": 20500 | |
| }, | |
| { | |
| "epoch": 13.11, | |
| "learning_rate": 0.0009654952076677317, | |
| "loss": 0.1583, | |
| "step": 20510 | |
| }, | |
| { | |
| "epoch": 13.11, | |
| "learning_rate": 0.0009654242101526447, | |
| "loss": 0.1267, | |
| "step": 20520 | |
| }, | |
| { | |
| "epoch": 13.12, | |
| "learning_rate": 0.0009653532126375577, | |
| "loss": 0.1357, | |
| "step": 20530 | |
| }, | |
| { | |
| "epoch": 13.12, | |
| "learning_rate": 0.0009652822151224708, | |
| "loss": 0.126, | |
| "step": 20540 | |
| }, | |
| { | |
| "epoch": 13.13, | |
| "learning_rate": 0.0009652112176073837, | |
| "loss": 0.1379, | |
| "step": 20550 | |
| }, | |
| { | |
| "epoch": 13.14, | |
| "learning_rate": 0.0009651402200922968, | |
| "loss": 0.1572, | |
| "step": 20560 | |
| }, | |
| { | |
| "epoch": 13.14, | |
| "learning_rate": 0.0009650692225772098, | |
| "loss": 0.1551, | |
| "step": 20570 | |
| }, | |
| { | |
| "epoch": 13.15, | |
| "learning_rate": 0.0009649982250621229, | |
| "loss": 0.1277, | |
| "step": 20580 | |
| }, | |
| { | |
| "epoch": 13.16, | |
| "learning_rate": 0.0009649272275470359, | |
| "loss": 0.1609, | |
| "step": 20590 | |
| }, | |
| { | |
| "epoch": 13.16, | |
| "learning_rate": 0.0009648562300319489, | |
| "loss": 0.1459, | |
| "step": 20600 | |
| }, | |
| { | |
| "epoch": 13.17, | |
| "learning_rate": 0.0009647852325168619, | |
| "loss": 0.1602, | |
| "step": 20610 | |
| }, | |
| { | |
| "epoch": 13.18, | |
| "learning_rate": 0.0009647142350017749, | |
| "loss": 0.1472, | |
| "step": 20620 | |
| }, | |
| { | |
| "epoch": 13.18, | |
| "learning_rate": 0.000964643237486688, | |
| "loss": 0.128, | |
| "step": 20630 | |
| }, | |
| { | |
| "epoch": 13.19, | |
| "learning_rate": 0.000964572239971601, | |
| "loss": 0.1444, | |
| "step": 20640 | |
| }, | |
| { | |
| "epoch": 13.19, | |
| "learning_rate": 0.000964501242456514, | |
| "loss": 0.1627, | |
| "step": 20650 | |
| }, | |
| { | |
| "epoch": 13.2, | |
| "learning_rate": 0.000964430244941427, | |
| "loss": 0.1418, | |
| "step": 20660 | |
| }, | |
| { | |
| "epoch": 13.21, | |
| "learning_rate": 0.0009643592474263401, | |
| "loss": 0.135, | |
| "step": 20670 | |
| }, | |
| { | |
| "epoch": 13.21, | |
| "learning_rate": 0.000964288249911253, | |
| "loss": 0.1337, | |
| "step": 20680 | |
| }, | |
| { | |
| "epoch": 13.22, | |
| "learning_rate": 0.0009642172523961662, | |
| "loss": 0.1353, | |
| "step": 20690 | |
| }, | |
| { | |
| "epoch": 13.23, | |
| "learning_rate": 0.0009641462548810792, | |
| "loss": 0.1586, | |
| "step": 20700 | |
| }, | |
| { | |
| "epoch": 13.23, | |
| "learning_rate": 0.0009640752573659922, | |
| "loss": 0.1386, | |
| "step": 20710 | |
| }, | |
| { | |
| "epoch": 13.24, | |
| "learning_rate": 0.0009640042598509052, | |
| "loss": 0.1369, | |
| "step": 20720 | |
| }, | |
| { | |
| "epoch": 13.25, | |
| "learning_rate": 0.0009639332623358183, | |
| "loss": 0.1357, | |
| "step": 20730 | |
| }, | |
| { | |
| "epoch": 13.25, | |
| "learning_rate": 0.0009638622648207312, | |
| "loss": 0.1472, | |
| "step": 20740 | |
| }, | |
| { | |
| "epoch": 13.26, | |
| "learning_rate": 0.0009637912673056444, | |
| "loss": 0.1533, | |
| "step": 20750 | |
| }, | |
| { | |
| "epoch": 13.27, | |
| "learning_rate": 0.0009637202697905573, | |
| "loss": 0.1584, | |
| "step": 20760 | |
| }, | |
| { | |
| "epoch": 13.27, | |
| "learning_rate": 0.0009636492722754704, | |
| "loss": 0.126, | |
| "step": 20770 | |
| }, | |
| { | |
| "epoch": 13.28, | |
| "learning_rate": 0.0009635782747603834, | |
| "loss": 0.1642, | |
| "step": 20780 | |
| }, | |
| { | |
| "epoch": 13.28, | |
| "learning_rate": 0.0009635072772452964, | |
| "loss": 0.1284, | |
| "step": 20790 | |
| }, | |
| { | |
| "epoch": 13.29, | |
| "learning_rate": 0.0009634362797302094, | |
| "loss": 0.1457, | |
| "step": 20800 | |
| }, | |
| { | |
| "epoch": 13.3, | |
| "learning_rate": 0.0009633652822151226, | |
| "loss": 0.1481, | |
| "step": 20810 | |
| }, | |
| { | |
| "epoch": 13.3, | |
| "learning_rate": 0.0009632942847000355, | |
| "loss": 0.1639, | |
| "step": 20820 | |
| }, | |
| { | |
| "epoch": 13.31, | |
| "learning_rate": 0.0009632232871849486, | |
| "loss": 0.1459, | |
| "step": 20830 | |
| }, | |
| { | |
| "epoch": 13.32, | |
| "learning_rate": 0.0009631522896698616, | |
| "loss": 0.1742, | |
| "step": 20840 | |
| }, | |
| { | |
| "epoch": 13.32, | |
| "learning_rate": 0.0009630812921547746, | |
| "loss": 0.1388, | |
| "step": 20850 | |
| }, | |
| { | |
| "epoch": 13.33, | |
| "learning_rate": 0.0009630102946396876, | |
| "loss": 0.1769, | |
| "step": 20860 | |
| }, | |
| { | |
| "epoch": 13.34, | |
| "learning_rate": 0.0009629392971246008, | |
| "loss": 0.1517, | |
| "step": 20870 | |
| }, | |
| { | |
| "epoch": 13.34, | |
| "learning_rate": 0.0009628682996095137, | |
| "loss": 0.1463, | |
| "step": 20880 | |
| }, | |
| { | |
| "epoch": 13.35, | |
| "learning_rate": 0.0009627973020944268, | |
| "loss": 0.1135, | |
| "step": 20890 | |
| }, | |
| { | |
| "epoch": 13.35, | |
| "learning_rate": 0.0009627263045793397, | |
| "loss": 0.1543, | |
| "step": 20900 | |
| }, | |
| { | |
| "epoch": 13.36, | |
| "learning_rate": 0.0009626553070642528, | |
| "loss": 0.1598, | |
| "step": 20910 | |
| }, | |
| { | |
| "epoch": 13.37, | |
| "learning_rate": 0.0009625843095491658, | |
| "loss": 0.1745, | |
| "step": 20920 | |
| }, | |
| { | |
| "epoch": 13.37, | |
| "learning_rate": 0.0009625133120340789, | |
| "loss": 0.1595, | |
| "step": 20930 | |
| }, | |
| { | |
| "epoch": 13.38, | |
| "learning_rate": 0.0009624423145189919, | |
| "loss": 0.1329, | |
| "step": 20940 | |
| }, | |
| { | |
| "epoch": 13.39, | |
| "learning_rate": 0.0009623713170039048, | |
| "loss": 0.1612, | |
| "step": 20950 | |
| }, | |
| { | |
| "epoch": 13.39, | |
| "learning_rate": 0.0009623003194888179, | |
| "loss": 0.1528, | |
| "step": 20960 | |
| }, | |
| { | |
| "epoch": 13.4, | |
| "learning_rate": 0.0009622293219737309, | |
| "loss": 0.1518, | |
| "step": 20970 | |
| }, | |
| { | |
| "epoch": 13.41, | |
| "learning_rate": 0.0009621583244586439, | |
| "loss": 0.1635, | |
| "step": 20980 | |
| }, | |
| { | |
| "epoch": 13.41, | |
| "learning_rate": 0.000962087326943557, | |
| "loss": 0.1446, | |
| "step": 20990 | |
| }, | |
| { | |
| "epoch": 13.42, | |
| "learning_rate": 0.0009620163294284701, | |
| "loss": 0.1471, | |
| "step": 21000 | |
| }, | |
| { | |
| "epoch": 13.42, | |
| "learning_rate": 0.000961945331913383, | |
| "loss": 0.1476, | |
| "step": 21010 | |
| }, | |
| { | |
| "epoch": 13.43, | |
| "learning_rate": 0.0009618743343982961, | |
| "loss": 0.1907, | |
| "step": 21020 | |
| }, | |
| { | |
| "epoch": 13.44, | |
| "learning_rate": 0.000961803336883209, | |
| "loss": 0.1495, | |
| "step": 21030 | |
| }, | |
| { | |
| "epoch": 13.44, | |
| "learning_rate": 0.0009617323393681221, | |
| "loss": 0.1817, | |
| "step": 21040 | |
| }, | |
| { | |
| "epoch": 13.45, | |
| "learning_rate": 0.0009616613418530351, | |
| "loss": 0.1571, | |
| "step": 21050 | |
| }, | |
| { | |
| "epoch": 13.46, | |
| "learning_rate": 0.0009615903443379483, | |
| "loss": 0.1746, | |
| "step": 21060 | |
| }, | |
| { | |
| "epoch": 13.46, | |
| "learning_rate": 0.0009615193468228612, | |
| "loss": 0.1451, | |
| "step": 21070 | |
| }, | |
| { | |
| "epoch": 13.47, | |
| "learning_rate": 0.0009614483493077743, | |
| "loss": 0.1545, | |
| "step": 21080 | |
| }, | |
| { | |
| "epoch": 13.48, | |
| "learning_rate": 0.0009613773517926872, | |
| "loss": 0.148, | |
| "step": 21090 | |
| }, | |
| { | |
| "epoch": 13.48, | |
| "learning_rate": 0.0009613063542776003, | |
| "loss": 0.1368, | |
| "step": 21100 | |
| }, | |
| { | |
| "epoch": 13.49, | |
| "learning_rate": 0.0009612353567625133, | |
| "loss": 0.1401, | |
| "step": 21110 | |
| }, | |
| { | |
| "epoch": 13.5, | |
| "learning_rate": 0.0009611643592474264, | |
| "loss": 0.1375, | |
| "step": 21120 | |
| }, | |
| { | |
| "epoch": 13.5, | |
| "learning_rate": 0.0009610933617323394, | |
| "loss": 0.1525, | |
| "step": 21130 | |
| }, | |
| { | |
| "epoch": 13.51, | |
| "learning_rate": 0.0009610223642172525, | |
| "loss": 0.1509, | |
| "step": 21140 | |
| }, | |
| { | |
| "epoch": 13.51, | |
| "learning_rate": 0.0009609513667021654, | |
| "loss": 0.1531, | |
| "step": 21150 | |
| }, | |
| { | |
| "epoch": 13.52, | |
| "learning_rate": 0.0009608803691870785, | |
| "loss": 0.1096, | |
| "step": 21160 | |
| }, | |
| { | |
| "epoch": 13.53, | |
| "learning_rate": 0.0009608093716719914, | |
| "loss": 0.1678, | |
| "step": 21170 | |
| }, | |
| { | |
| "epoch": 13.53, | |
| "learning_rate": 0.0009607383741569046, | |
| "loss": 0.1366, | |
| "step": 21180 | |
| }, | |
| { | |
| "epoch": 13.54, | |
| "learning_rate": 0.0009606673766418176, | |
| "loss": 0.1431, | |
| "step": 21190 | |
| }, | |
| { | |
| "epoch": 13.55, | |
| "learning_rate": 0.0009605963791267306, | |
| "loss": 0.1709, | |
| "step": 21200 | |
| }, | |
| { | |
| "epoch": 13.55, | |
| "learning_rate": 0.0009605253816116436, | |
| "loss": 0.1812, | |
| "step": 21210 | |
| }, | |
| { | |
| "epoch": 13.56, | |
| "learning_rate": 0.0009604543840965567, | |
| "loss": 0.1601, | |
| "step": 21220 | |
| }, | |
| { | |
| "epoch": 13.57, | |
| "learning_rate": 0.0009603833865814696, | |
| "loss": 0.1491, | |
| "step": 21230 | |
| }, | |
| { | |
| "epoch": 13.57, | |
| "learning_rate": 0.0009603123890663828, | |
| "loss": 0.128, | |
| "step": 21240 | |
| }, | |
| { | |
| "epoch": 13.58, | |
| "learning_rate": 0.0009602413915512958, | |
| "loss": 0.1746, | |
| "step": 21250 | |
| }, | |
| { | |
| "epoch": 13.58, | |
| "learning_rate": 0.0009601703940362087, | |
| "loss": 0.1417, | |
| "step": 21260 | |
| }, | |
| { | |
| "epoch": 13.59, | |
| "learning_rate": 0.0009600993965211218, | |
| "loss": 0.1661, | |
| "step": 21270 | |
| }, | |
| { | |
| "epoch": 13.6, | |
| "learning_rate": 0.0009600283990060347, | |
| "loss": 0.1624, | |
| "step": 21280 | |
| }, | |
| { | |
| "epoch": 13.6, | |
| "learning_rate": 0.0009599574014909478, | |
| "loss": 0.1768, | |
| "step": 21290 | |
| }, | |
| { | |
| "epoch": 13.61, | |
| "learning_rate": 0.0009598864039758609, | |
| "loss": 0.1553, | |
| "step": 21300 | |
| }, | |
| { | |
| "epoch": 13.62, | |
| "learning_rate": 0.0009598154064607739, | |
| "loss": 0.1604, | |
| "step": 21310 | |
| }, | |
| { | |
| "epoch": 13.62, | |
| "learning_rate": 0.0009597444089456869, | |
| "loss": 0.1621, | |
| "step": 21320 | |
| }, | |
| { | |
| "epoch": 13.63, | |
| "learning_rate": 0.0009596734114306, | |
| "loss": 0.1551, | |
| "step": 21330 | |
| }, | |
| { | |
| "epoch": 13.64, | |
| "learning_rate": 0.0009596024139155129, | |
| "loss": 0.1578, | |
| "step": 21340 | |
| }, | |
| { | |
| "epoch": 13.64, | |
| "learning_rate": 0.000959531416400426, | |
| "loss": 0.1668, | |
| "step": 21350 | |
| }, | |
| { | |
| "epoch": 13.65, | |
| "learning_rate": 0.000959460418885339, | |
| "loss": 0.1563, | |
| "step": 21360 | |
| }, | |
| { | |
| "epoch": 13.65, | |
| "learning_rate": 0.0009593894213702521, | |
| "loss": 0.1717, | |
| "step": 21370 | |
| }, | |
| { | |
| "epoch": 13.66, | |
| "learning_rate": 0.0009593184238551651, | |
| "loss": 0.1706, | |
| "step": 21380 | |
| }, | |
| { | |
| "epoch": 13.67, | |
| "learning_rate": 0.0009592474263400781, | |
| "loss": 0.1705, | |
| "step": 21390 | |
| }, | |
| { | |
| "epoch": 13.67, | |
| "learning_rate": 0.0009591764288249911, | |
| "loss": 0.1619, | |
| "step": 21400 | |
| }, | |
| { | |
| "epoch": 13.68, | |
| "learning_rate": 0.0009591054313099042, | |
| "loss": 0.1597, | |
| "step": 21410 | |
| }, | |
| { | |
| "epoch": 13.69, | |
| "learning_rate": 0.0009590344337948172, | |
| "loss": 0.1756, | |
| "step": 21420 | |
| }, | |
| { | |
| "epoch": 13.69, | |
| "learning_rate": 0.0009589634362797303, | |
| "loss": 0.1706, | |
| "step": 21430 | |
| }, | |
| { | |
| "epoch": 13.7, | |
| "learning_rate": 0.0009588924387646433, | |
| "loss": 0.1657, | |
| "step": 21440 | |
| }, | |
| { | |
| "epoch": 13.71, | |
| "learning_rate": 0.0009588214412495563, | |
| "loss": 0.1659, | |
| "step": 21450 | |
| }, | |
| { | |
| "epoch": 13.71, | |
| "learning_rate": 0.0009587504437344693, | |
| "loss": 0.1977, | |
| "step": 21460 | |
| }, | |
| { | |
| "epoch": 13.72, | |
| "learning_rate": 0.0009586794462193823, | |
| "loss": 0.1391, | |
| "step": 21470 | |
| }, | |
| { | |
| "epoch": 13.73, | |
| "learning_rate": 0.0009586084487042954, | |
| "loss": 0.1594, | |
| "step": 21480 | |
| }, | |
| { | |
| "epoch": 13.73, | |
| "learning_rate": 0.0009585374511892085, | |
| "loss": 0.1668, | |
| "step": 21490 | |
| }, | |
| { | |
| "epoch": 13.74, | |
| "learning_rate": 0.0009584664536741214, | |
| "loss": 0.1544, | |
| "step": 21500 | |
| }, | |
| { | |
| "epoch": 13.74, | |
| "learning_rate": 0.0009583954561590345, | |
| "loss": 0.1808, | |
| "step": 21510 | |
| }, | |
| { | |
| "epoch": 13.75, | |
| "learning_rate": 0.0009583244586439475, | |
| "loss": 0.1779, | |
| "step": 21520 | |
| }, | |
| { | |
| "epoch": 13.76, | |
| "learning_rate": 0.0009582534611288605, | |
| "loss": 0.1392, | |
| "step": 21530 | |
| }, | |
| { | |
| "epoch": 13.76, | |
| "learning_rate": 0.0009581824636137736, | |
| "loss": 0.165, | |
| "step": 21540 | |
| }, | |
| { | |
| "epoch": 13.77, | |
| "learning_rate": 0.0009581114660986867, | |
| "loss": 0.1705, | |
| "step": 21550 | |
| }, | |
| { | |
| "epoch": 13.78, | |
| "learning_rate": 0.0009580404685835996, | |
| "loss": 0.1484, | |
| "step": 21560 | |
| }, | |
| { | |
| "epoch": 13.78, | |
| "learning_rate": 0.0009579694710685126, | |
| "loss": 0.1389, | |
| "step": 21570 | |
| }, | |
| { | |
| "epoch": 13.79, | |
| "learning_rate": 0.0009578984735534256, | |
| "loss": 0.1566, | |
| "step": 21580 | |
| }, | |
| { | |
| "epoch": 13.8, | |
| "learning_rate": 0.0009578274760383386, | |
| "loss": 0.133, | |
| "step": 21590 | |
| }, | |
| { | |
| "epoch": 13.8, | |
| "learning_rate": 0.0009577564785232517, | |
| "loss": 0.1441, | |
| "step": 21600 | |
| }, | |
| { | |
| "epoch": 13.81, | |
| "learning_rate": 0.0009576854810081647, | |
| "loss": 0.1644, | |
| "step": 21610 | |
| }, | |
| { | |
| "epoch": 13.81, | |
| "learning_rate": 0.0009576144834930778, | |
| "loss": 0.1805, | |
| "step": 21620 | |
| }, | |
| { | |
| "epoch": 13.82, | |
| "learning_rate": 0.0009575434859779907, | |
| "loss": 0.1491, | |
| "step": 21630 | |
| }, | |
| { | |
| "epoch": 13.83, | |
| "learning_rate": 0.0009574724884629038, | |
| "loss": 0.1472, | |
| "step": 21640 | |
| }, | |
| { | |
| "epoch": 13.83, | |
| "learning_rate": 0.0009574014909478168, | |
| "loss": 0.173, | |
| "step": 21650 | |
| }, | |
| { | |
| "epoch": 13.84, | |
| "learning_rate": 0.0009573304934327298, | |
| "loss": 0.1336, | |
| "step": 21660 | |
| }, | |
| { | |
| "epoch": 13.85, | |
| "learning_rate": 0.0009572594959176429, | |
| "loss": 0.1522, | |
| "step": 21670 | |
| }, | |
| { | |
| "epoch": 13.85, | |
| "learning_rate": 0.000957188498402556, | |
| "loss": 0.1586, | |
| "step": 21680 | |
| }, | |
| { | |
| "epoch": 13.86, | |
| "learning_rate": 0.0009571175008874689, | |
| "loss": 0.1364, | |
| "step": 21690 | |
| }, | |
| { | |
| "epoch": 13.87, | |
| "learning_rate": 0.000957046503372382, | |
| "loss": 0.1443, | |
| "step": 21700 | |
| }, | |
| { | |
| "epoch": 13.87, | |
| "learning_rate": 0.000956975505857295, | |
| "loss": 0.182, | |
| "step": 21710 | |
| }, | |
| { | |
| "epoch": 13.88, | |
| "learning_rate": 0.000956904508342208, | |
| "loss": 0.1481, | |
| "step": 21720 | |
| }, | |
| { | |
| "epoch": 13.88, | |
| "learning_rate": 0.0009568335108271211, | |
| "loss": 0.1608, | |
| "step": 21730 | |
| }, | |
| { | |
| "epoch": 13.89, | |
| "learning_rate": 0.0009567625133120342, | |
| "loss": 0.1596, | |
| "step": 21740 | |
| }, | |
| { | |
| "epoch": 13.9, | |
| "learning_rate": 0.0009566915157969471, | |
| "loss": 0.1546, | |
| "step": 21750 | |
| }, | |
| { | |
| "epoch": 13.9, | |
| "learning_rate": 0.0009566205182818602, | |
| "loss": 0.1417, | |
| "step": 21760 | |
| }, | |
| { | |
| "epoch": 13.91, | |
| "learning_rate": 0.0009565495207667731, | |
| "loss": 0.1342, | |
| "step": 21770 | |
| }, | |
| { | |
| "epoch": 13.92, | |
| "learning_rate": 0.0009564785232516862, | |
| "loss": 0.1615, | |
| "step": 21780 | |
| }, | |
| { | |
| "epoch": 13.92, | |
| "learning_rate": 0.0009564075257365993, | |
| "loss": 0.1452, | |
| "step": 21790 | |
| }, | |
| { | |
| "epoch": 13.93, | |
| "learning_rate": 0.0009563365282215123, | |
| "loss": 0.1705, | |
| "step": 21800 | |
| }, | |
| { | |
| "epoch": 13.94, | |
| "learning_rate": 0.0009562655307064253, | |
| "loss": 0.1404, | |
| "step": 21810 | |
| }, | |
| { | |
| "epoch": 13.94, | |
| "learning_rate": 0.0009561945331913384, | |
| "loss": 0.141, | |
| "step": 21820 | |
| }, | |
| { | |
| "epoch": 13.95, | |
| "learning_rate": 0.0009561235356762513, | |
| "loss": 0.1642, | |
| "step": 21830 | |
| }, | |
| { | |
| "epoch": 13.95, | |
| "learning_rate": 0.0009560525381611644, | |
| "loss": 0.1654, | |
| "step": 21840 | |
| }, | |
| { | |
| "epoch": 13.96, | |
| "learning_rate": 0.0009559815406460774, | |
| "loss": 0.1722, | |
| "step": 21850 | |
| }, | |
| { | |
| "epoch": 13.97, | |
| "learning_rate": 0.0009559105431309905, | |
| "loss": 0.1509, | |
| "step": 21860 | |
| }, | |
| { | |
| "epoch": 13.97, | |
| "learning_rate": 0.0009558395456159035, | |
| "loss": 0.1557, | |
| "step": 21870 | |
| }, | |
| { | |
| "epoch": 13.98, | |
| "learning_rate": 0.0009557685481008164, | |
| "loss": 0.1645, | |
| "step": 21880 | |
| }, | |
| { | |
| "epoch": 13.99, | |
| "learning_rate": 0.0009556975505857295, | |
| "loss": 0.1729, | |
| "step": 21890 | |
| }, | |
| { | |
| "epoch": 13.99, | |
| "learning_rate": 0.0009556265530706425, | |
| "loss": 0.1471, | |
| "step": 21900 | |
| }, | |
| { | |
| "epoch": 14.0, | |
| "learning_rate": 0.0009555555555555556, | |
| "loss": 0.1493, | |
| "step": 21910 | |
| }, | |
| { | |
| "epoch": 14.01, | |
| "learning_rate": 0.0009554845580404686, | |
| "loss": 0.1662, | |
| "step": 21920 | |
| }, | |
| { | |
| "epoch": 14.01, | |
| "learning_rate": 0.0009554135605253817, | |
| "loss": 0.1034, | |
| "step": 21930 | |
| }, | |
| { | |
| "epoch": 14.02, | |
| "learning_rate": 0.0009553425630102946, | |
| "loss": 0.1537, | |
| "step": 21940 | |
| }, | |
| { | |
| "epoch": 14.03, | |
| "learning_rate": 0.0009552715654952077, | |
| "loss": 0.1495, | |
| "step": 21950 | |
| }, | |
| { | |
| "epoch": 14.03, | |
| "learning_rate": 0.0009552005679801206, | |
| "loss": 0.1488, | |
| "step": 21960 | |
| }, | |
| { | |
| "epoch": 14.04, | |
| "learning_rate": 0.0009551295704650338, | |
| "loss": 0.1242, | |
| "step": 21970 | |
| }, | |
| { | |
| "epoch": 14.04, | |
| "learning_rate": 0.0009550585729499468, | |
| "loss": 0.1232, | |
| "step": 21980 | |
| }, | |
| { | |
| "epoch": 14.05, | |
| "learning_rate": 0.0009549875754348598, | |
| "loss": 0.126, | |
| "step": 21990 | |
| }, | |
| { | |
| "epoch": 14.06, | |
| "learning_rate": 0.0009549165779197728, | |
| "loss": 0.1493, | |
| "step": 22000 | |
| }, | |
| { | |
| "epoch": 14.06, | |
| "learning_rate": 0.0009548455804046859, | |
| "loss": 0.145, | |
| "step": 22010 | |
| }, | |
| { | |
| "epoch": 14.07, | |
| "learning_rate": 0.0009547745828895988, | |
| "loss": 0.1363, | |
| "step": 22020 | |
| }, | |
| { | |
| "epoch": 14.08, | |
| "learning_rate": 0.000954703585374512, | |
| "loss": 0.1487, | |
| "step": 22030 | |
| }, | |
| { | |
| "epoch": 14.08, | |
| "learning_rate": 0.000954632587859425, | |
| "loss": 0.15, | |
| "step": 22040 | |
| }, | |
| { | |
| "epoch": 14.09, | |
| "learning_rate": 0.000954561590344338, | |
| "loss": 0.1205, | |
| "step": 22050 | |
| }, | |
| { | |
| "epoch": 14.1, | |
| "learning_rate": 0.000954490592829251, | |
| "loss": 0.1431, | |
| "step": 22060 | |
| }, | |
| { | |
| "epoch": 14.1, | |
| "learning_rate": 0.000954419595314164, | |
| "loss": 0.1134, | |
| "step": 22070 | |
| }, | |
| { | |
| "epoch": 14.11, | |
| "learning_rate": 0.000954348597799077, | |
| "loss": 0.1431, | |
| "step": 22080 | |
| }, | |
| { | |
| "epoch": 14.11, | |
| "learning_rate": 0.0009542776002839902, | |
| "loss": 0.1484, | |
| "step": 22090 | |
| }, | |
| { | |
| "epoch": 14.12, | |
| "learning_rate": 0.0009542066027689031, | |
| "loss": 0.1435, | |
| "step": 22100 | |
| }, | |
| { | |
| "epoch": 14.13, | |
| "learning_rate": 0.0009541356052538162, | |
| "loss": 0.1595, | |
| "step": 22110 | |
| }, | |
| { | |
| "epoch": 14.13, | |
| "learning_rate": 0.0009540646077387292, | |
| "loss": 0.1407, | |
| "step": 22120 | |
| }, | |
| { | |
| "epoch": 14.14, | |
| "learning_rate": 0.0009539936102236422, | |
| "loss": 0.1514, | |
| "step": 22130 | |
| }, | |
| { | |
| "epoch": 14.15, | |
| "learning_rate": 0.0009539226127085552, | |
| "loss": 0.1391, | |
| "step": 22140 | |
| }, | |
| { | |
| "epoch": 14.15, | |
| "learning_rate": 0.0009538516151934684, | |
| "loss": 0.1266, | |
| "step": 22150 | |
| }, | |
| { | |
| "epoch": 14.16, | |
| "learning_rate": 0.0009537806176783813, | |
| "loss": 0.1598, | |
| "step": 22160 | |
| }, | |
| { | |
| "epoch": 14.17, | |
| "learning_rate": 0.0009537096201632944, | |
| "loss": 0.1071, | |
| "step": 22170 | |
| }, | |
| { | |
| "epoch": 14.17, | |
| "learning_rate": 0.0009536386226482073, | |
| "loss": 0.1529, | |
| "step": 22180 | |
| }, | |
| { | |
| "epoch": 14.18, | |
| "learning_rate": 0.0009535676251331203, | |
| "loss": 0.1626, | |
| "step": 22190 | |
| }, | |
| { | |
| "epoch": 14.19, | |
| "learning_rate": 0.0009534966276180334, | |
| "loss": 0.0999, | |
| "step": 22200 | |
| }, | |
| { | |
| "epoch": 14.19, | |
| "learning_rate": 0.0009534256301029463, | |
| "loss": 0.1244, | |
| "step": 22210 | |
| }, | |
| { | |
| "epoch": 14.2, | |
| "learning_rate": 0.0009533546325878595, | |
| "loss": 0.1518, | |
| "step": 22220 | |
| }, | |
| { | |
| "epoch": 14.2, | |
| "learning_rate": 0.0009532836350727724, | |
| "loss": 0.1589, | |
| "step": 22230 | |
| }, | |
| { | |
| "epoch": 14.21, | |
| "learning_rate": 0.0009532126375576855, | |
| "loss": 0.128, | |
| "step": 22240 | |
| }, | |
| { | |
| "epoch": 14.22, | |
| "learning_rate": 0.0009531416400425985, | |
| "loss": 0.155, | |
| "step": 22250 | |
| }, | |
| { | |
| "epoch": 14.22, | |
| "learning_rate": 0.0009530706425275115, | |
| "loss": 0.1533, | |
| "step": 22260 | |
| }, | |
| { | |
| "epoch": 14.23, | |
| "learning_rate": 0.0009529996450124245, | |
| "loss": 0.1312, | |
| "step": 22270 | |
| }, | |
| { | |
| "epoch": 14.24, | |
| "learning_rate": 0.0009529286474973377, | |
| "loss": 0.1448, | |
| "step": 22280 | |
| }, | |
| { | |
| "epoch": 14.24, | |
| "learning_rate": 0.0009528576499822506, | |
| "loss": 0.1474, | |
| "step": 22290 | |
| }, | |
| { | |
| "epoch": 14.25, | |
| "learning_rate": 0.0009527866524671637, | |
| "loss": 0.1018, | |
| "step": 22300 | |
| }, | |
| { | |
| "epoch": 14.26, | |
| "learning_rate": 0.0009527156549520767, | |
| "loss": 0.1606, | |
| "step": 22310 | |
| }, | |
| { | |
| "epoch": 14.26, | |
| "learning_rate": 0.0009526446574369897, | |
| "loss": 0.1233, | |
| "step": 22320 | |
| }, | |
| { | |
| "epoch": 14.27, | |
| "learning_rate": 0.0009525736599219027, | |
| "loss": 0.1554, | |
| "step": 22330 | |
| }, | |
| { | |
| "epoch": 14.27, | |
| "learning_rate": 0.0009525026624068159, | |
| "loss": 0.1245, | |
| "step": 22340 | |
| }, | |
| { | |
| "epoch": 14.28, | |
| "learning_rate": 0.0009524316648917288, | |
| "loss": 0.1178, | |
| "step": 22350 | |
| }, | |
| { | |
| "epoch": 14.29, | |
| "learning_rate": 0.0009523606673766419, | |
| "loss": 0.1328, | |
| "step": 22360 | |
| }, | |
| { | |
| "epoch": 14.29, | |
| "learning_rate": 0.0009522896698615548, | |
| "loss": 0.1562, | |
| "step": 22370 | |
| }, | |
| { | |
| "epoch": 14.3, | |
| "learning_rate": 0.0009522186723464679, | |
| "loss": 0.1414, | |
| "step": 22380 | |
| }, | |
| { | |
| "epoch": 14.31, | |
| "learning_rate": 0.0009521476748313809, | |
| "loss": 0.1537, | |
| "step": 22390 | |
| }, | |
| { | |
| "epoch": 14.31, | |
| "learning_rate": 0.000952076677316294, | |
| "loss": 0.1343, | |
| "step": 22400 | |
| }, | |
| { | |
| "epoch": 14.32, | |
| "learning_rate": 0.000952005679801207, | |
| "loss": 0.1536, | |
| "step": 22410 | |
| }, | |
| { | |
| "epoch": 14.33, | |
| "learning_rate": 0.0009519346822861201, | |
| "loss": 0.1516, | |
| "step": 22420 | |
| }, | |
| { | |
| "epoch": 14.33, | |
| "learning_rate": 0.000951863684771033, | |
| "loss": 0.1512, | |
| "step": 22430 | |
| }, | |
| { | |
| "epoch": 14.34, | |
| "learning_rate": 0.0009517926872559461, | |
| "loss": 0.1475, | |
| "step": 22440 | |
| }, | |
| { | |
| "epoch": 14.34, | |
| "learning_rate": 0.000951721689740859, | |
| "loss": 0.1431, | |
| "step": 22450 | |
| }, | |
| { | |
| "epoch": 14.35, | |
| "learning_rate": 0.0009516506922257722, | |
| "loss": 0.1415, | |
| "step": 22460 | |
| }, | |
| { | |
| "epoch": 14.36, | |
| "learning_rate": 0.0009515796947106852, | |
| "loss": 0.1334, | |
| "step": 22470 | |
| }, | |
| { | |
| "epoch": 14.36, | |
| "learning_rate": 0.0009515086971955982, | |
| "loss": 0.1613, | |
| "step": 22480 | |
| }, | |
| { | |
| "epoch": 14.37, | |
| "learning_rate": 0.0009514376996805112, | |
| "loss": 0.1442, | |
| "step": 22490 | |
| }, | |
| { | |
| "epoch": 14.38, | |
| "learning_rate": 0.0009513667021654242, | |
| "loss": 0.1368, | |
| "step": 22500 | |
| }, | |
| { | |
| "epoch": 14.38, | |
| "learning_rate": 0.0009512957046503372, | |
| "loss": 0.1551, | |
| "step": 22510 | |
| }, | |
| { | |
| "epoch": 14.39, | |
| "learning_rate": 0.0009512247071352503, | |
| "loss": 0.1346, | |
| "step": 22520 | |
| }, | |
| { | |
| "epoch": 14.4, | |
| "learning_rate": 0.0009511537096201633, | |
| "loss": 0.1497, | |
| "step": 22530 | |
| }, | |
| { | |
| "epoch": 14.4, | |
| "learning_rate": 0.0009510827121050763, | |
| "loss": 0.1537, | |
| "step": 22540 | |
| }, | |
| { | |
| "epoch": 14.41, | |
| "learning_rate": 0.0009510117145899894, | |
| "loss": 0.1407, | |
| "step": 22550 | |
| }, | |
| { | |
| "epoch": 14.42, | |
| "learning_rate": 0.0009509407170749023, | |
| "loss": 0.1513, | |
| "step": 22560 | |
| }, | |
| { | |
| "epoch": 14.42, | |
| "learning_rate": 0.0009508697195598154, | |
| "loss": 0.1479, | |
| "step": 22570 | |
| }, | |
| { | |
| "epoch": 14.43, | |
| "learning_rate": 0.0009507987220447285, | |
| "loss": 0.1532, | |
| "step": 22580 | |
| }, | |
| { | |
| "epoch": 14.43, | |
| "learning_rate": 0.0009507277245296415, | |
| "loss": 0.1189, | |
| "step": 22590 | |
| }, | |
| { | |
| "epoch": 14.44, | |
| "learning_rate": 0.0009506567270145545, | |
| "loss": 0.1349, | |
| "step": 22600 | |
| }, | |
| { | |
| "epoch": 14.45, | |
| "learning_rate": 0.0009505857294994676, | |
| "loss": 0.1508, | |
| "step": 22610 | |
| }, | |
| { | |
| "epoch": 14.45, | |
| "learning_rate": 0.0009505147319843805, | |
| "loss": 0.1711, | |
| "step": 22620 | |
| }, | |
| { | |
| "epoch": 14.46, | |
| "learning_rate": 0.0009504437344692936, | |
| "loss": 0.1591, | |
| "step": 22630 | |
| }, | |
| { | |
| "epoch": 14.47, | |
| "learning_rate": 0.0009503727369542066, | |
| "loss": 0.1572, | |
| "step": 22640 | |
| }, | |
| { | |
| "epoch": 14.47, | |
| "learning_rate": 0.0009503017394391197, | |
| "loss": 0.1153, | |
| "step": 22650 | |
| }, | |
| { | |
| "epoch": 14.48, | |
| "learning_rate": 0.0009502307419240327, | |
| "loss": 0.1261, | |
| "step": 22660 | |
| }, | |
| { | |
| "epoch": 14.49, | |
| "learning_rate": 0.0009501597444089457, | |
| "loss": 0.1392, | |
| "step": 22670 | |
| }, | |
| { | |
| "epoch": 14.49, | |
| "learning_rate": 0.0009500887468938587, | |
| "loss": 0.1275, | |
| "step": 22680 | |
| }, | |
| { | |
| "epoch": 14.5, | |
| "learning_rate": 0.0009500177493787718, | |
| "loss": 0.1472, | |
| "step": 22690 | |
| }, | |
| { | |
| "epoch": 14.5, | |
| "learning_rate": 0.0009499467518636848, | |
| "loss": 0.1568, | |
| "step": 22700 | |
| }, | |
| { | |
| "epoch": 14.51, | |
| "learning_rate": 0.0009498757543485979, | |
| "loss": 0.1386, | |
| "step": 22710 | |
| }, | |
| { | |
| "epoch": 14.52, | |
| "learning_rate": 0.0009498047568335108, | |
| "loss": 0.1265, | |
| "step": 22720 | |
| }, | |
| { | |
| "epoch": 14.52, | |
| "learning_rate": 0.0009497337593184239, | |
| "loss": 0.1428, | |
| "step": 22730 | |
| }, | |
| { | |
| "epoch": 14.53, | |
| "learning_rate": 0.0009496627618033369, | |
| "loss": 0.175, | |
| "step": 22740 | |
| }, | |
| { | |
| "epoch": 14.54, | |
| "learning_rate": 0.0009495917642882499, | |
| "loss": 0.1614, | |
| "step": 22750 | |
| }, | |
| { | |
| "epoch": 14.54, | |
| "learning_rate": 0.000949520766773163, | |
| "loss": 0.1728, | |
| "step": 22760 | |
| }, | |
| { | |
| "epoch": 14.55, | |
| "learning_rate": 0.0009494497692580761, | |
| "loss": 0.1589, | |
| "step": 22770 | |
| }, | |
| { | |
| "epoch": 14.56, | |
| "learning_rate": 0.000949378771742989, | |
| "loss": 0.1652, | |
| "step": 22780 | |
| }, | |
| { | |
| "epoch": 14.56, | |
| "learning_rate": 0.0009493077742279021, | |
| "loss": 0.1545, | |
| "step": 22790 | |
| }, | |
| { | |
| "epoch": 14.57, | |
| "learning_rate": 0.000949236776712815, | |
| "loss": 0.1602, | |
| "step": 22800 | |
| }, | |
| { | |
| "epoch": 14.57, | |
| "learning_rate": 0.000949165779197728, | |
| "loss": 0.1615, | |
| "step": 22810 | |
| }, | |
| { | |
| "epoch": 14.58, | |
| "learning_rate": 0.0009490947816826411, | |
| "loss": 0.167, | |
| "step": 22820 | |
| }, | |
| { | |
| "epoch": 14.59, | |
| "learning_rate": 0.0009490237841675541, | |
| "loss": 0.145, | |
| "step": 22830 | |
| }, | |
| { | |
| "epoch": 14.59, | |
| "learning_rate": 0.0009489527866524672, | |
| "loss": 0.15, | |
| "step": 22840 | |
| }, | |
| { | |
| "epoch": 14.6, | |
| "learning_rate": 0.0009488817891373802, | |
| "loss": 0.141, | |
| "step": 22850 | |
| }, | |
| { | |
| "epoch": 14.61, | |
| "learning_rate": 0.0009488107916222932, | |
| "loss": 0.1568, | |
| "step": 22860 | |
| }, | |
| { | |
| "epoch": 14.61, | |
| "learning_rate": 0.0009487397941072062, | |
| "loss": 0.1405, | |
| "step": 22870 | |
| }, | |
| { | |
| "epoch": 14.62, | |
| "learning_rate": 0.0009486687965921193, | |
| "loss": 0.1496, | |
| "step": 22880 | |
| }, | |
| { | |
| "epoch": 14.63, | |
| "learning_rate": 0.0009485977990770323, | |
| "loss": 0.1532, | |
| "step": 22890 | |
| }, | |
| { | |
| "epoch": 14.63, | |
| "learning_rate": 0.0009485268015619454, | |
| "loss": 0.1574, | |
| "step": 22900 | |
| }, | |
| { | |
| "epoch": 14.64, | |
| "learning_rate": 0.0009484558040468583, | |
| "loss": 0.144, | |
| "step": 22910 | |
| }, | |
| { | |
| "epoch": 14.65, | |
| "learning_rate": 0.0009483848065317714, | |
| "loss": 0.1783, | |
| "step": 22920 | |
| }, | |
| { | |
| "epoch": 14.65, | |
| "learning_rate": 0.0009483138090166844, | |
| "loss": 0.1661, | |
| "step": 22930 | |
| }, | |
| { | |
| "epoch": 14.66, | |
| "learning_rate": 0.0009482428115015974, | |
| "loss": 0.142, | |
| "step": 22940 | |
| }, | |
| { | |
| "epoch": 14.66, | |
| "learning_rate": 0.0009481718139865105, | |
| "loss": 0.1407, | |
| "step": 22950 | |
| }, | |
| { | |
| "epoch": 14.67, | |
| "learning_rate": 0.0009481008164714236, | |
| "loss": 0.146, | |
| "step": 22960 | |
| }, | |
| { | |
| "epoch": 14.68, | |
| "learning_rate": 0.0009480298189563365, | |
| "loss": 0.1423, | |
| "step": 22970 | |
| }, | |
| { | |
| "epoch": 14.68, | |
| "learning_rate": 0.0009479588214412496, | |
| "loss": 0.1735, | |
| "step": 22980 | |
| }, | |
| { | |
| "epoch": 14.69, | |
| "learning_rate": 0.0009478878239261626, | |
| "loss": 0.1355, | |
| "step": 22990 | |
| }, | |
| { | |
| "epoch": 14.7, | |
| "learning_rate": 0.0009478168264110756, | |
| "loss": 0.1344, | |
| "step": 23000 | |
| }, | |
| { | |
| "epoch": 14.7, | |
| "learning_rate": 0.0009477458288959887, | |
| "loss": 0.1427, | |
| "step": 23010 | |
| }, | |
| { | |
| "epoch": 14.71, | |
| "learning_rate": 0.0009476748313809018, | |
| "loss": 0.1657, | |
| "step": 23020 | |
| }, | |
| { | |
| "epoch": 14.72, | |
| "learning_rate": 0.0009476038338658147, | |
| "loss": 0.1527, | |
| "step": 23030 | |
| }, | |
| { | |
| "epoch": 14.72, | |
| "learning_rate": 0.0009475328363507278, | |
| "loss": 0.1503, | |
| "step": 23040 | |
| }, | |
| { | |
| "epoch": 14.73, | |
| "learning_rate": 0.0009474618388356407, | |
| "loss": 0.1619, | |
| "step": 23050 | |
| }, | |
| { | |
| "epoch": 14.73, | |
| "learning_rate": 0.0009473908413205538, | |
| "loss": 0.1645, | |
| "step": 23060 | |
| }, | |
| { | |
| "epoch": 14.74, | |
| "learning_rate": 0.0009473198438054669, | |
| "loss": 0.1143, | |
| "step": 23070 | |
| }, | |
| { | |
| "epoch": 14.75, | |
| "learning_rate": 0.0009472488462903799, | |
| "loss": 0.1702, | |
| "step": 23080 | |
| }, | |
| { | |
| "epoch": 14.75, | |
| "learning_rate": 0.0009471778487752929, | |
| "loss": 0.1313, | |
| "step": 23090 | |
| }, | |
| { | |
| "epoch": 14.76, | |
| "learning_rate": 0.000947106851260206, | |
| "loss": 0.1716, | |
| "step": 23100 | |
| }, | |
| { | |
| "epoch": 14.77, | |
| "learning_rate": 0.0009470358537451189, | |
| "loss": 0.1421, | |
| "step": 23110 | |
| }, | |
| { | |
| "epoch": 14.77, | |
| "learning_rate": 0.0009469648562300319, | |
| "loss": 0.1407, | |
| "step": 23120 | |
| }, | |
| { | |
| "epoch": 14.78, | |
| "learning_rate": 0.000946893858714945, | |
| "loss": 0.1345, | |
| "step": 23130 | |
| }, | |
| { | |
| "epoch": 14.79, | |
| "learning_rate": 0.000946822861199858, | |
| "loss": 0.162, | |
| "step": 23140 | |
| }, | |
| { | |
| "epoch": 14.79, | |
| "learning_rate": 0.0009467518636847711, | |
| "loss": 0.1601, | |
| "step": 23150 | |
| }, | |
| { | |
| "epoch": 14.8, | |
| "learning_rate": 0.000946680866169684, | |
| "loss": 0.1415, | |
| "step": 23160 | |
| }, | |
| { | |
| "epoch": 14.8, | |
| "learning_rate": 0.0009466098686545971, | |
| "loss": 0.182, | |
| "step": 23170 | |
| }, | |
| { | |
| "epoch": 14.81, | |
| "learning_rate": 0.00094653887113951, | |
| "loss": 0.1519, | |
| "step": 23180 | |
| }, | |
| { | |
| "epoch": 14.82, | |
| "learning_rate": 0.0009464678736244232, | |
| "loss": 0.1856, | |
| "step": 23190 | |
| }, | |
| { | |
| "epoch": 14.82, | |
| "learning_rate": 0.0009463968761093362, | |
| "loss": 0.1641, | |
| "step": 23200 | |
| }, | |
| { | |
| "epoch": 14.83, | |
| "learning_rate": 0.0009463258785942493, | |
| "loss": 0.1401, | |
| "step": 23210 | |
| }, | |
| { | |
| "epoch": 14.84, | |
| "learning_rate": 0.0009462548810791622, | |
| "loss": 0.1536, | |
| "step": 23220 | |
| }, | |
| { | |
| "epoch": 14.84, | |
| "learning_rate": 0.0009461838835640753, | |
| "loss": 0.1346, | |
| "step": 23230 | |
| }, | |
| { | |
| "epoch": 14.85, | |
| "learning_rate": 0.0009461128860489882, | |
| "loss": 0.1536, | |
| "step": 23240 | |
| }, | |
| { | |
| "epoch": 14.86, | |
| "learning_rate": 0.0009460418885339014, | |
| "loss": 0.1416, | |
| "step": 23250 | |
| }, | |
| { | |
| "epoch": 14.86, | |
| "learning_rate": 0.0009459708910188144, | |
| "loss": 0.1659, | |
| "step": 23260 | |
| }, | |
| { | |
| "epoch": 14.87, | |
| "learning_rate": 0.0009458998935037274, | |
| "loss": 0.1343, | |
| "step": 23270 | |
| }, | |
| { | |
| "epoch": 14.88, | |
| "learning_rate": 0.0009458288959886404, | |
| "loss": 0.1592, | |
| "step": 23280 | |
| }, | |
| { | |
| "epoch": 14.88, | |
| "learning_rate": 0.0009457578984735535, | |
| "loss": 0.1342, | |
| "step": 23290 | |
| }, | |
| { | |
| "epoch": 14.89, | |
| "learning_rate": 0.0009456869009584664, | |
| "loss": 0.1514, | |
| "step": 23300 | |
| }, | |
| { | |
| "epoch": 14.89, | |
| "learning_rate": 0.0009456159034433796, | |
| "loss": 0.1519, | |
| "step": 23310 | |
| }, | |
| { | |
| "epoch": 14.9, | |
| "learning_rate": 0.0009455449059282925, | |
| "loss": 0.1524, | |
| "step": 23320 | |
| }, | |
| { | |
| "epoch": 14.91, | |
| "learning_rate": 0.0009454739084132056, | |
| "loss": 0.1608, | |
| "step": 23330 | |
| }, | |
| { | |
| "epoch": 14.91, | |
| "learning_rate": 0.0009454029108981186, | |
| "loss": 0.1324, | |
| "step": 23340 | |
| }, | |
| { | |
| "epoch": 14.92, | |
| "learning_rate": 0.0009453319133830316, | |
| "loss": 0.1542, | |
| "step": 23350 | |
| }, | |
| { | |
| "epoch": 14.93, | |
| "learning_rate": 0.0009452609158679446, | |
| "loss": 0.1339, | |
| "step": 23360 | |
| }, | |
| { | |
| "epoch": 14.93, | |
| "learning_rate": 0.0009451899183528578, | |
| "loss": 0.1496, | |
| "step": 23370 | |
| }, | |
| { | |
| "epoch": 14.94, | |
| "learning_rate": 0.0009451189208377707, | |
| "loss": 0.1244, | |
| "step": 23380 | |
| }, | |
| { | |
| "epoch": 14.95, | |
| "learning_rate": 0.0009450479233226838, | |
| "loss": 0.1439, | |
| "step": 23390 | |
| }, | |
| { | |
| "epoch": 14.95, | |
| "learning_rate": 0.0009449769258075968, | |
| "loss": 0.1165, | |
| "step": 23400 | |
| }, | |
| { | |
| "epoch": 14.96, | |
| "learning_rate": 0.0009449059282925098, | |
| "loss": 0.1267, | |
| "step": 23410 | |
| }, | |
| { | |
| "epoch": 14.96, | |
| "learning_rate": 0.0009448349307774228, | |
| "loss": 0.1383, | |
| "step": 23420 | |
| }, | |
| { | |
| "epoch": 14.97, | |
| "learning_rate": 0.0009447639332623357, | |
| "loss": 0.1468, | |
| "step": 23430 | |
| }, | |
| { | |
| "epoch": 14.98, | |
| "learning_rate": 0.0009446929357472489, | |
| "loss": 0.1508, | |
| "step": 23440 | |
| }, | |
| { | |
| "epoch": 14.98, | |
| "learning_rate": 0.0009446219382321619, | |
| "loss": 0.1566, | |
| "step": 23450 | |
| }, | |
| { | |
| "epoch": 14.99, | |
| "learning_rate": 0.0009445509407170749, | |
| "loss": 0.1399, | |
| "step": 23460 | |
| }, | |
| { | |
| "epoch": 15.0, | |
| "learning_rate": 0.0009444799432019879, | |
| "loss": 0.1656, | |
| "step": 23470 | |
| }, | |
| { | |
| "epoch": 15.0, | |
| "learning_rate": 0.000944408945686901, | |
| "loss": 0.1503, | |
| "step": 23480 | |
| }, | |
| { | |
| "epoch": 15.01, | |
| "learning_rate": 0.0009443379481718139, | |
| "loss": 0.1385, | |
| "step": 23490 | |
| }, | |
| { | |
| "epoch": 15.02, | |
| "learning_rate": 0.0009442669506567271, | |
| "loss": 0.1249, | |
| "step": 23500 | |
| }, | |
| { | |
| "epoch": 15.02, | |
| "learning_rate": 0.00094419595314164, | |
| "loss": 0.1565, | |
| "step": 23510 | |
| }, | |
| { | |
| "epoch": 15.03, | |
| "learning_rate": 0.0009441249556265531, | |
| "loss": 0.1236, | |
| "step": 23520 | |
| }, | |
| { | |
| "epoch": 15.04, | |
| "learning_rate": 0.0009440539581114661, | |
| "loss": 0.1381, | |
| "step": 23530 | |
| }, | |
| { | |
| "epoch": 15.04, | |
| "learning_rate": 0.0009439829605963791, | |
| "loss": 0.1496, | |
| "step": 23540 | |
| }, | |
| { | |
| "epoch": 15.05, | |
| "learning_rate": 0.0009439119630812921, | |
| "loss": 0.1309, | |
| "step": 23550 | |
| }, | |
| { | |
| "epoch": 15.05, | |
| "learning_rate": 0.0009438409655662053, | |
| "loss": 0.1029, | |
| "step": 23560 | |
| }, | |
| { | |
| "epoch": 15.06, | |
| "learning_rate": 0.0009437699680511182, | |
| "loss": 0.1542, | |
| "step": 23570 | |
| }, | |
| { | |
| "epoch": 15.07, | |
| "learning_rate": 0.0009436989705360313, | |
| "loss": 0.1186, | |
| "step": 23580 | |
| }, | |
| { | |
| "epoch": 15.07, | |
| "learning_rate": 0.0009436279730209442, | |
| "loss": 0.1395, | |
| "step": 23590 | |
| }, | |
| { | |
| "epoch": 15.08, | |
| "learning_rate": 0.0009435569755058573, | |
| "loss": 0.1368, | |
| "step": 23600 | |
| }, | |
| { | |
| "epoch": 15.09, | |
| "learning_rate": 0.0009434859779907703, | |
| "loss": 0.1187, | |
| "step": 23610 | |
| }, | |
| { | |
| "epoch": 15.09, | |
| "learning_rate": 0.0009434149804756834, | |
| "loss": 0.1232, | |
| "step": 23620 | |
| }, | |
| { | |
| "epoch": 15.1, | |
| "learning_rate": 0.0009433439829605964, | |
| "loss": 0.1449, | |
| "step": 23630 | |
| }, | |
| { | |
| "epoch": 15.11, | |
| "learning_rate": 0.0009432729854455095, | |
| "loss": 0.1134, | |
| "step": 23640 | |
| }, | |
| { | |
| "epoch": 15.11, | |
| "learning_rate": 0.0009432019879304224, | |
| "loss": 0.1189, | |
| "step": 23650 | |
| }, | |
| { | |
| "epoch": 15.12, | |
| "learning_rate": 0.0009431309904153355, | |
| "loss": 0.1534, | |
| "step": 23660 | |
| }, | |
| { | |
| "epoch": 15.12, | |
| "learning_rate": 0.0009430599929002485, | |
| "loss": 0.1376, | |
| "step": 23670 | |
| }, | |
| { | |
| "epoch": 15.13, | |
| "learning_rate": 0.0009429889953851616, | |
| "loss": 0.1442, | |
| "step": 23680 | |
| }, | |
| { | |
| "epoch": 15.14, | |
| "learning_rate": 0.0009429179978700746, | |
| "loss": 0.1275, | |
| "step": 23690 | |
| }, | |
| { | |
| "epoch": 15.14, | |
| "learning_rate": 0.0009428470003549877, | |
| "loss": 0.1406, | |
| "step": 23700 | |
| }, | |
| { | |
| "epoch": 15.15, | |
| "learning_rate": 0.0009427760028399006, | |
| "loss": 0.1367, | |
| "step": 23710 | |
| }, | |
| { | |
| "epoch": 15.16, | |
| "learning_rate": 0.0009427050053248137, | |
| "loss": 0.149, | |
| "step": 23720 | |
| }, | |
| { | |
| "epoch": 15.16, | |
| "learning_rate": 0.0009426340078097266, | |
| "loss": 0.1376, | |
| "step": 23730 | |
| }, | |
| { | |
| "epoch": 15.17, | |
| "learning_rate": 0.0009425630102946398, | |
| "loss": 0.1431, | |
| "step": 23740 | |
| }, | |
| { | |
| "epoch": 15.18, | |
| "learning_rate": 0.0009424920127795528, | |
| "loss": 0.1326, | |
| "step": 23750 | |
| }, | |
| { | |
| "epoch": 15.18, | |
| "learning_rate": 0.0009424210152644657, | |
| "loss": 0.1056, | |
| "step": 23760 | |
| }, | |
| { | |
| "epoch": 15.19, | |
| "learning_rate": 0.0009423500177493788, | |
| "loss": 0.1506, | |
| "step": 23770 | |
| }, | |
| { | |
| "epoch": 15.19, | |
| "learning_rate": 0.0009422790202342917, | |
| "loss": 0.153, | |
| "step": 23780 | |
| }, | |
| { | |
| "epoch": 15.2, | |
| "learning_rate": 0.0009422080227192048, | |
| "loss": 0.1368, | |
| "step": 23790 | |
| }, | |
| { | |
| "epoch": 15.21, | |
| "learning_rate": 0.0009421370252041179, | |
| "loss": 0.1508, | |
| "step": 23800 | |
| }, | |
| { | |
| "epoch": 15.21, | |
| "learning_rate": 0.000942066027689031, | |
| "loss": 0.1398, | |
| "step": 23810 | |
| }, | |
| { | |
| "epoch": 15.22, | |
| "learning_rate": 0.0009419950301739439, | |
| "loss": 0.1396, | |
| "step": 23820 | |
| }, | |
| { | |
| "epoch": 15.23, | |
| "learning_rate": 0.000941924032658857, | |
| "loss": 0.1394, | |
| "step": 23830 | |
| }, | |
| { | |
| "epoch": 15.23, | |
| "learning_rate": 0.0009418530351437699, | |
| "loss": 0.1578, | |
| "step": 23840 | |
| }, | |
| { | |
| "epoch": 15.24, | |
| "learning_rate": 0.000941782037628683, | |
| "loss": 0.1626, | |
| "step": 23850 | |
| }, | |
| { | |
| "epoch": 15.25, | |
| "learning_rate": 0.0009417110401135961, | |
| "loss": 0.1428, | |
| "step": 23860 | |
| }, | |
| { | |
| "epoch": 15.25, | |
| "learning_rate": 0.0009416400425985091, | |
| "loss": 0.1478, | |
| "step": 23870 | |
| }, | |
| { | |
| "epoch": 15.26, | |
| "learning_rate": 0.0009415690450834221, | |
| "loss": 0.1482, | |
| "step": 23880 | |
| }, | |
| { | |
| "epoch": 15.27, | |
| "learning_rate": 0.0009414980475683352, | |
| "loss": 0.1329, | |
| "step": 23890 | |
| }, | |
| { | |
| "epoch": 15.27, | |
| "learning_rate": 0.0009414270500532481, | |
| "loss": 0.1287, | |
| "step": 23900 | |
| }, | |
| { | |
| "epoch": 15.28, | |
| "learning_rate": 0.0009413560525381612, | |
| "loss": 0.1443, | |
| "step": 23910 | |
| }, | |
| { | |
| "epoch": 15.28, | |
| "learning_rate": 0.0009412850550230742, | |
| "loss": 0.1398, | |
| "step": 23920 | |
| }, | |
| { | |
| "epoch": 15.29, | |
| "learning_rate": 0.0009412140575079873, | |
| "loss": 0.1211, | |
| "step": 23930 | |
| }, | |
| { | |
| "epoch": 15.3, | |
| "learning_rate": 0.0009411430599929003, | |
| "loss": 0.137, | |
| "step": 23940 | |
| }, | |
| { | |
| "epoch": 15.3, | |
| "learning_rate": 0.0009410720624778133, | |
| "loss": 0.1539, | |
| "step": 23950 | |
| }, | |
| { | |
| "epoch": 15.31, | |
| "learning_rate": 0.0009410010649627263, | |
| "loss": 0.1305, | |
| "step": 23960 | |
| }, | |
| { | |
| "epoch": 15.32, | |
| "learning_rate": 0.0009409300674476394, | |
| "loss": 0.1501, | |
| "step": 23970 | |
| }, | |
| { | |
| "epoch": 15.32, | |
| "learning_rate": 0.0009408590699325523, | |
| "loss": 0.1517, | |
| "step": 23980 | |
| }, | |
| { | |
| "epoch": 15.33, | |
| "learning_rate": 0.0009407880724174655, | |
| "loss": 0.1436, | |
| "step": 23990 | |
| }, | |
| { | |
| "epoch": 15.34, | |
| "learning_rate": 0.0009407170749023784, | |
| "loss": 0.1175, | |
| "step": 24000 | |
| }, | |
| { | |
| "epoch": 15.34, | |
| "learning_rate": 0.0009406460773872915, | |
| "loss": 0.1333, | |
| "step": 24010 | |
| }, | |
| { | |
| "epoch": 15.35, | |
| "learning_rate": 0.0009405750798722045, | |
| "loss": 0.1091, | |
| "step": 24020 | |
| }, | |
| { | |
| "epoch": 15.35, | |
| "learning_rate": 0.0009405040823571175, | |
| "loss": 0.143, | |
| "step": 24030 | |
| }, | |
| { | |
| "epoch": 15.36, | |
| "learning_rate": 0.0009404330848420305, | |
| "loss": 0.1213, | |
| "step": 24040 | |
| }, | |
| { | |
| "epoch": 15.37, | |
| "learning_rate": 0.0009403620873269437, | |
| "loss": 0.1295, | |
| "step": 24050 | |
| }, | |
| { | |
| "epoch": 15.37, | |
| "learning_rate": 0.0009402910898118566, | |
| "loss": 0.1312, | |
| "step": 24060 | |
| }, | |
| { | |
| "epoch": 15.38, | |
| "learning_rate": 0.0009402200922967696, | |
| "loss": 0.1402, | |
| "step": 24070 | |
| }, | |
| { | |
| "epoch": 15.39, | |
| "learning_rate": 0.0009401490947816827, | |
| "loss": 0.1299, | |
| "step": 24080 | |
| }, | |
| { | |
| "epoch": 15.39, | |
| "learning_rate": 0.0009400780972665956, | |
| "loss": 0.1399, | |
| "step": 24090 | |
| }, | |
| { | |
| "epoch": 15.4, | |
| "learning_rate": 0.0009400070997515087, | |
| "loss": 0.1339, | |
| "step": 24100 | |
| }, | |
| { | |
| "epoch": 15.41, | |
| "learning_rate": 0.0009399361022364217, | |
| "loss": 0.1145, | |
| "step": 24110 | |
| }, | |
| { | |
| "epoch": 15.41, | |
| "learning_rate": 0.0009398651047213348, | |
| "loss": 0.1567, | |
| "step": 24120 | |
| }, | |
| { | |
| "epoch": 15.42, | |
| "learning_rate": 0.0009397941072062478, | |
| "loss": 0.1406, | |
| "step": 24130 | |
| }, | |
| { | |
| "epoch": 15.42, | |
| "learning_rate": 0.0009397231096911608, | |
| "loss": 0.1522, | |
| "step": 24140 | |
| }, | |
| { | |
| "epoch": 15.43, | |
| "learning_rate": 0.0009396521121760738, | |
| "loss": 0.1274, | |
| "step": 24150 | |
| }, | |
| { | |
| "epoch": 15.44, | |
| "learning_rate": 0.0009395811146609869, | |
| "loss": 0.1309, | |
| "step": 24160 | |
| }, | |
| { | |
| "epoch": 15.44, | |
| "learning_rate": 0.0009395101171458999, | |
| "loss": 0.1333, | |
| "step": 24170 | |
| }, | |
| { | |
| "epoch": 15.45, | |
| "learning_rate": 0.000939439119630813, | |
| "loss": 0.1439, | |
| "step": 24180 | |
| }, | |
| { | |
| "epoch": 15.46, | |
| "learning_rate": 0.000939368122115726, | |
| "loss": 0.1288, | |
| "step": 24190 | |
| }, | |
| { | |
| "epoch": 15.46, | |
| "learning_rate": 0.000939297124600639, | |
| "loss": 0.1154, | |
| "step": 24200 | |
| }, | |
| { | |
| "epoch": 15.47, | |
| "learning_rate": 0.000939226127085552, | |
| "loss": 0.1208, | |
| "step": 24210 | |
| }, | |
| { | |
| "epoch": 15.48, | |
| "learning_rate": 0.000939155129570465, | |
| "loss": 0.1275, | |
| "step": 24220 | |
| }, | |
| { | |
| "epoch": 15.48, | |
| "learning_rate": 0.0009390841320553781, | |
| "loss": 0.136, | |
| "step": 24230 | |
| }, | |
| { | |
| "epoch": 15.49, | |
| "learning_rate": 0.0009390131345402912, | |
| "loss": 0.1182, | |
| "step": 24240 | |
| }, | |
| { | |
| "epoch": 15.5, | |
| "learning_rate": 0.0009389421370252041, | |
| "loss": 0.136, | |
| "step": 24250 | |
| }, | |
| { | |
| "epoch": 15.5, | |
| "learning_rate": 0.0009388711395101172, | |
| "loss": 0.1294, | |
| "step": 24260 | |
| }, | |
| { | |
| "epoch": 15.51, | |
| "learning_rate": 0.0009388001419950302, | |
| "loss": 0.1553, | |
| "step": 24270 | |
| }, | |
| { | |
| "epoch": 15.51, | |
| "learning_rate": 0.0009387291444799432, | |
| "loss": 0.1494, | |
| "step": 24280 | |
| }, | |
| { | |
| "epoch": 15.52, | |
| "learning_rate": 0.0009386581469648563, | |
| "loss": 0.1119, | |
| "step": 24290 | |
| }, | |
| { | |
| "epoch": 15.53, | |
| "learning_rate": 0.0009385871494497694, | |
| "loss": 0.1552, | |
| "step": 24300 | |
| }, | |
| { | |
| "epoch": 15.53, | |
| "learning_rate": 0.0009385161519346823, | |
| "loss": 0.1289, | |
| "step": 24310 | |
| }, | |
| { | |
| "epoch": 15.54, | |
| "learning_rate": 0.0009384451544195954, | |
| "loss": 0.1435, | |
| "step": 24320 | |
| }, | |
| { | |
| "epoch": 15.55, | |
| "learning_rate": 0.0009383741569045083, | |
| "loss": 0.1491, | |
| "step": 24330 | |
| }, | |
| { | |
| "epoch": 15.55, | |
| "learning_rate": 0.0009383031593894214, | |
| "loss": 0.1536, | |
| "step": 24340 | |
| }, | |
| { | |
| "epoch": 15.56, | |
| "learning_rate": 0.0009382321618743345, | |
| "loss": 0.1418, | |
| "step": 24350 | |
| }, | |
| { | |
| "epoch": 15.57, | |
| "learning_rate": 0.0009381611643592475, | |
| "loss": 0.1373, | |
| "step": 24360 | |
| }, | |
| { | |
| "epoch": 15.57, | |
| "learning_rate": 0.0009380901668441605, | |
| "loss": 0.1431, | |
| "step": 24370 | |
| }, | |
| { | |
| "epoch": 15.58, | |
| "learning_rate": 0.0009380191693290734, | |
| "loss": 0.1286, | |
| "step": 24380 | |
| }, | |
| { | |
| "epoch": 15.58, | |
| "learning_rate": 0.0009379481718139865, | |
| "loss": 0.1437, | |
| "step": 24390 | |
| }, | |
| { | |
| "epoch": 15.59, | |
| "learning_rate": 0.0009378771742988995, | |
| "loss": 0.184, | |
| "step": 24400 | |
| }, | |
| { | |
| "epoch": 15.6, | |
| "learning_rate": 0.0009378061767838126, | |
| "loss": 0.1034, | |
| "step": 24410 | |
| }, | |
| { | |
| "epoch": 15.6, | |
| "learning_rate": 0.0009377351792687256, | |
| "loss": 0.1458, | |
| "step": 24420 | |
| }, | |
| { | |
| "epoch": 15.61, | |
| "learning_rate": 0.0009376641817536387, | |
| "loss": 0.1409, | |
| "step": 24430 | |
| }, | |
| { | |
| "epoch": 15.62, | |
| "learning_rate": 0.0009375931842385516, | |
| "loss": 0.1224, | |
| "step": 24440 | |
| }, | |
| { | |
| "epoch": 15.62, | |
| "learning_rate": 0.0009375221867234647, | |
| "loss": 0.1531, | |
| "step": 24450 | |
| }, | |
| { | |
| "epoch": 15.63, | |
| "learning_rate": 0.0009374511892083777, | |
| "loss": 0.1554, | |
| "step": 24460 | |
| }, | |
| { | |
| "epoch": 15.64, | |
| "learning_rate": 0.0009373801916932908, | |
| "loss": 0.145, | |
| "step": 24470 | |
| }, | |
| { | |
| "epoch": 15.64, | |
| "learning_rate": 0.0009373091941782038, | |
| "loss": 0.1375, | |
| "step": 24480 | |
| }, | |
| { | |
| "epoch": 15.65, | |
| "learning_rate": 0.0009372381966631168, | |
| "loss": 0.1538, | |
| "step": 24490 | |
| }, | |
| { | |
| "epoch": 15.65, | |
| "learning_rate": 0.0009371671991480298, | |
| "loss": 0.1313, | |
| "step": 24500 | |
| }, | |
| { | |
| "epoch": 15.66, | |
| "learning_rate": 0.0009370962016329429, | |
| "loss": 0.1241, | |
| "step": 24510 | |
| }, | |
| { | |
| "epoch": 15.67, | |
| "learning_rate": 0.0009370252041178558, | |
| "loss": 0.1408, | |
| "step": 24520 | |
| }, | |
| { | |
| "epoch": 15.67, | |
| "learning_rate": 0.000936954206602769, | |
| "loss": 0.1285, | |
| "step": 24530 | |
| }, | |
| { | |
| "epoch": 15.68, | |
| "learning_rate": 0.000936883209087682, | |
| "loss": 0.1444, | |
| "step": 24540 | |
| }, | |
| { | |
| "epoch": 15.69, | |
| "learning_rate": 0.000936812211572595, | |
| "loss": 0.1534, | |
| "step": 24550 | |
| }, | |
| { | |
| "epoch": 15.69, | |
| "learning_rate": 0.000936741214057508, | |
| "loss": 0.1407, | |
| "step": 24560 | |
| }, | |
| { | |
| "epoch": 15.7, | |
| "learning_rate": 0.000936670216542421, | |
| "loss": 0.1189, | |
| "step": 24570 | |
| }, | |
| { | |
| "epoch": 15.71, | |
| "learning_rate": 0.000936599219027334, | |
| "loss": 0.1567, | |
| "step": 24580 | |
| }, | |
| { | |
| "epoch": 15.71, | |
| "learning_rate": 0.0009365282215122471, | |
| "loss": 0.149, | |
| "step": 24590 | |
| }, | |
| { | |
| "epoch": 15.72, | |
| "learning_rate": 0.0009364572239971601, | |
| "loss": 0.1743, | |
| "step": 24600 | |
| }, | |
| { | |
| "epoch": 15.73, | |
| "learning_rate": 0.0009363862264820732, | |
| "loss": 0.158, | |
| "step": 24610 | |
| }, | |
| { | |
| "epoch": 15.73, | |
| "learning_rate": 0.0009363152289669862, | |
| "loss": 0.1391, | |
| "step": 24620 | |
| }, | |
| { | |
| "epoch": 15.74, | |
| "learning_rate": 0.0009362442314518992, | |
| "loss": 0.147, | |
| "step": 24630 | |
| }, | |
| { | |
| "epoch": 15.74, | |
| "learning_rate": 0.0009361732339368122, | |
| "loss": 0.1432, | |
| "step": 24640 | |
| }, | |
| { | |
| "epoch": 15.75, | |
| "learning_rate": 0.0009361022364217253, | |
| "loss": 0.1382, | |
| "step": 24650 | |
| }, | |
| { | |
| "epoch": 15.76, | |
| "learning_rate": 0.0009360312389066383, | |
| "loss": 0.14, | |
| "step": 24660 | |
| }, | |
| { | |
| "epoch": 15.76, | |
| "learning_rate": 0.0009359602413915513, | |
| "loss": 0.1489, | |
| "step": 24670 | |
| }, | |
| { | |
| "epoch": 15.77, | |
| "learning_rate": 0.0009358892438764643, | |
| "loss": 0.1443, | |
| "step": 24680 | |
| }, | |
| { | |
| "epoch": 15.78, | |
| "learning_rate": 0.0009358182463613773, | |
| "loss": 0.1329, | |
| "step": 24690 | |
| }, | |
| { | |
| "epoch": 15.78, | |
| "learning_rate": 0.0009357472488462904, | |
| "loss": 0.1445, | |
| "step": 24700 | |
| }, | |
| { | |
| "epoch": 15.79, | |
| "learning_rate": 0.0009356762513312033, | |
| "loss": 0.159, | |
| "step": 24710 | |
| }, | |
| { | |
| "epoch": 15.8, | |
| "learning_rate": 0.0009356052538161165, | |
| "loss": 0.1628, | |
| "step": 24720 | |
| }, | |
| { | |
| "epoch": 15.8, | |
| "learning_rate": 0.0009355342563010295, | |
| "loss": 0.1636, | |
| "step": 24730 | |
| }, | |
| { | |
| "epoch": 15.81, | |
| "learning_rate": 0.0009354632587859425, | |
| "loss": 0.1332, | |
| "step": 24740 | |
| }, | |
| { | |
| "epoch": 15.81, | |
| "learning_rate": 0.0009353922612708555, | |
| "loss": 0.1685, | |
| "step": 24750 | |
| }, | |
| { | |
| "epoch": 15.82, | |
| "learning_rate": 0.0009353212637557686, | |
| "loss": 0.1439, | |
| "step": 24760 | |
| }, | |
| { | |
| "epoch": 15.83, | |
| "learning_rate": 0.0009352502662406815, | |
| "loss": 0.1545, | |
| "step": 24770 | |
| }, | |
| { | |
| "epoch": 15.83, | |
| "learning_rate": 0.0009351792687255947, | |
| "loss": 0.173, | |
| "step": 24780 | |
| }, | |
| { | |
| "epoch": 15.84, | |
| "learning_rate": 0.0009351082712105076, | |
| "loss": 0.1309, | |
| "step": 24790 | |
| }, | |
| { | |
| "epoch": 15.85, | |
| "learning_rate": 0.0009350372736954207, | |
| "loss": 0.1452, | |
| "step": 24800 | |
| }, | |
| { | |
| "epoch": 15.85, | |
| "learning_rate": 0.0009349662761803337, | |
| "loss": 0.1527, | |
| "step": 24810 | |
| }, | |
| { | |
| "epoch": 15.86, | |
| "learning_rate": 0.0009348952786652467, | |
| "loss": 0.1403, | |
| "step": 24820 | |
| }, | |
| { | |
| "epoch": 15.87, | |
| "learning_rate": 0.0009348242811501597, | |
| "loss": 0.1439, | |
| "step": 24830 | |
| }, | |
| { | |
| "epoch": 15.87, | |
| "learning_rate": 0.0009347532836350729, | |
| "loss": 0.1238, | |
| "step": 24840 | |
| }, | |
| { | |
| "epoch": 15.88, | |
| "learning_rate": 0.0009346822861199858, | |
| "loss": 0.1268, | |
| "step": 24850 | |
| }, | |
| { | |
| "epoch": 15.88, | |
| "learning_rate": 0.0009346112886048989, | |
| "loss": 0.1617, | |
| "step": 24860 | |
| }, | |
| { | |
| "epoch": 15.89, | |
| "learning_rate": 0.0009345402910898118, | |
| "loss": 0.1181, | |
| "step": 24870 | |
| }, | |
| { | |
| "epoch": 15.9, | |
| "learning_rate": 0.0009344692935747249, | |
| "loss": 0.1561, | |
| "step": 24880 | |
| }, | |
| { | |
| "epoch": 15.9, | |
| "learning_rate": 0.0009343982960596379, | |
| "loss": 0.1353, | |
| "step": 24890 | |
| }, | |
| { | |
| "epoch": 15.91, | |
| "learning_rate": 0.000934327298544551, | |
| "loss": 0.1284, | |
| "step": 24900 | |
| }, | |
| { | |
| "epoch": 15.92, | |
| "learning_rate": 0.000934256301029464, | |
| "loss": 0.1271, | |
| "step": 24910 | |
| }, | |
| { | |
| "epoch": 15.92, | |
| "learning_rate": 0.0009341853035143771, | |
| "loss": 0.1071, | |
| "step": 24920 | |
| }, | |
| { | |
| "epoch": 15.93, | |
| "learning_rate": 0.00093411430599929, | |
| "loss": 0.1475, | |
| "step": 24930 | |
| }, | |
| { | |
| "epoch": 15.94, | |
| "learning_rate": 0.0009340433084842031, | |
| "loss": 0.1313, | |
| "step": 24940 | |
| }, | |
| { | |
| "epoch": 15.94, | |
| "learning_rate": 0.000933972310969116, | |
| "loss": 0.1228, | |
| "step": 24950 | |
| }, | |
| { | |
| "epoch": 15.95, | |
| "learning_rate": 0.0009339013134540292, | |
| "loss": 0.137, | |
| "step": 24960 | |
| }, | |
| { | |
| "epoch": 15.95, | |
| "learning_rate": 0.0009338303159389422, | |
| "loss": 0.1521, | |
| "step": 24970 | |
| }, | |
| { | |
| "epoch": 15.96, | |
| "learning_rate": 0.0009337593184238551, | |
| "loss": 0.1228, | |
| "step": 24980 | |
| }, | |
| { | |
| "epoch": 15.97, | |
| "learning_rate": 0.0009336883209087682, | |
| "loss": 0.1769, | |
| "step": 24990 | |
| }, | |
| { | |
| "epoch": 15.97, | |
| "learning_rate": 0.0009336173233936812, | |
| "loss": 0.1282, | |
| "step": 25000 | |
| }, | |
| { | |
| "epoch": 15.98, | |
| "learning_rate": 0.0009335463258785942, | |
| "loss": 0.1443, | |
| "step": 25010 | |
| }, | |
| { | |
| "epoch": 15.99, | |
| "learning_rate": 0.0009334753283635073, | |
| "loss": 0.1371, | |
| "step": 25020 | |
| }, | |
| { | |
| "epoch": 15.99, | |
| "learning_rate": 0.0009334043308484204, | |
| "loss": 0.1388, | |
| "step": 25030 | |
| }, | |
| { | |
| "epoch": 16.0, | |
| "learning_rate": 0.0009333333333333333, | |
| "loss": 0.1664, | |
| "step": 25040 | |
| }, | |
| { | |
| "epoch": 16.01, | |
| "learning_rate": 0.0009332623358182464, | |
| "loss": 0.1286, | |
| "step": 25050 | |
| }, | |
| { | |
| "epoch": 16.01, | |
| "learning_rate": 0.0009331913383031593, | |
| "loss": 0.1375, | |
| "step": 25060 | |
| }, | |
| { | |
| "epoch": 16.02, | |
| "learning_rate": 0.0009331203407880724, | |
| "loss": 0.1182, | |
| "step": 25070 | |
| }, | |
| { | |
| "epoch": 16.03, | |
| "learning_rate": 0.0009330493432729855, | |
| "loss": 0.1052, | |
| "step": 25080 | |
| }, | |
| { | |
| "epoch": 16.03, | |
| "learning_rate": 0.0009329783457578985, | |
| "loss": 0.1171, | |
| "step": 25090 | |
| }, | |
| { | |
| "epoch": 16.04, | |
| "learning_rate": 0.0009329073482428115, | |
| "loss": 0.1204, | |
| "step": 25100 | |
| }, | |
| { | |
| "epoch": 16.04, | |
| "learning_rate": 0.0009328363507277246, | |
| "loss": 0.1288, | |
| "step": 25110 | |
| }, | |
| { | |
| "epoch": 16.05, | |
| "learning_rate": 0.0009327653532126375, | |
| "loss": 0.1363, | |
| "step": 25120 | |
| }, | |
| { | |
| "epoch": 16.06, | |
| "learning_rate": 0.0009326943556975506, | |
| "loss": 0.1242, | |
| "step": 25130 | |
| }, | |
| { | |
| "epoch": 16.06, | |
| "learning_rate": 0.0009326233581824637, | |
| "loss": 0.0983, | |
| "step": 25140 | |
| }, | |
| { | |
| "epoch": 16.07, | |
| "learning_rate": 0.0009325523606673767, | |
| "loss": 0.1232, | |
| "step": 25150 | |
| }, | |
| { | |
| "epoch": 16.08, | |
| "learning_rate": 0.0009324813631522897, | |
| "loss": 0.133, | |
| "step": 25160 | |
| }, | |
| { | |
| "epoch": 16.08, | |
| "learning_rate": 0.0009324103656372028, | |
| "loss": 0.1143, | |
| "step": 25170 | |
| }, | |
| { | |
| "epoch": 16.09, | |
| "learning_rate": 0.0009323393681221157, | |
| "loss": 0.118, | |
| "step": 25180 | |
| }, | |
| { | |
| "epoch": 16.1, | |
| "learning_rate": 0.0009322683706070288, | |
| "loss": 0.1199, | |
| "step": 25190 | |
| }, | |
| { | |
| "epoch": 16.1, | |
| "learning_rate": 0.0009321973730919417, | |
| "loss": 0.1186, | |
| "step": 25200 | |
| }, | |
| { | |
| "epoch": 16.11, | |
| "learning_rate": 0.0009321263755768549, | |
| "loss": 0.1374, | |
| "step": 25210 | |
| }, | |
| { | |
| "epoch": 16.11, | |
| "learning_rate": 0.0009320553780617679, | |
| "loss": 0.1354, | |
| "step": 25220 | |
| }, | |
| { | |
| "epoch": 16.12, | |
| "learning_rate": 0.0009319843805466809, | |
| "loss": 0.1587, | |
| "step": 25230 | |
| }, | |
| { | |
| "epoch": 16.13, | |
| "learning_rate": 0.0009319133830315939, | |
| "loss": 0.1165, | |
| "step": 25240 | |
| }, | |
| { | |
| "epoch": 16.13, | |
| "learning_rate": 0.000931842385516507, | |
| "loss": 0.1248, | |
| "step": 25250 | |
| }, | |
| { | |
| "epoch": 16.14, | |
| "learning_rate": 0.0009317713880014199, | |
| "loss": 0.1411, | |
| "step": 25260 | |
| }, | |
| { | |
| "epoch": 16.15, | |
| "learning_rate": 0.0009317003904863331, | |
| "loss": 0.1265, | |
| "step": 25270 | |
| }, | |
| { | |
| "epoch": 16.15, | |
| "learning_rate": 0.000931629392971246, | |
| "loss": 0.1404, | |
| "step": 25280 | |
| }, | |
| { | |
| "epoch": 16.16, | |
| "learning_rate": 0.000931558395456159, | |
| "loss": 0.1166, | |
| "step": 25290 | |
| }, | |
| { | |
| "epoch": 16.17, | |
| "learning_rate": 0.0009314873979410721, | |
| "loss": 0.1257, | |
| "step": 25300 | |
| }, | |
| { | |
| "epoch": 16.17, | |
| "learning_rate": 0.000931416400425985, | |
| "loss": 0.1293, | |
| "step": 25310 | |
| }, | |
| { | |
| "epoch": 16.18, | |
| "learning_rate": 0.0009313454029108981, | |
| "loss": 0.1311, | |
| "step": 25320 | |
| }, | |
| { | |
| "epoch": 16.19, | |
| "learning_rate": 0.0009312744053958112, | |
| "loss": 0.1424, | |
| "step": 25330 | |
| }, | |
| { | |
| "epoch": 16.19, | |
| "learning_rate": 0.0009312034078807242, | |
| "loss": 0.123, | |
| "step": 25340 | |
| }, | |
| { | |
| "epoch": 16.2, | |
| "learning_rate": 0.0009311324103656372, | |
| "loss": 0.1401, | |
| "step": 25350 | |
| }, | |
| { | |
| "epoch": 16.2, | |
| "learning_rate": 0.0009310614128505503, | |
| "loss": 0.1472, | |
| "step": 25360 | |
| }, | |
| { | |
| "epoch": 16.21, | |
| "learning_rate": 0.0009309904153354632, | |
| "loss": 0.1571, | |
| "step": 25370 | |
| }, | |
| { | |
| "epoch": 16.22, | |
| "learning_rate": 0.0009309194178203763, | |
| "loss": 0.1117, | |
| "step": 25380 | |
| }, | |
| { | |
| "epoch": 16.22, | |
| "learning_rate": 0.0009308484203052893, | |
| "loss": 0.1385, | |
| "step": 25390 | |
| }, | |
| { | |
| "epoch": 16.23, | |
| "learning_rate": 0.0009307774227902024, | |
| "loss": 0.1311, | |
| "step": 25400 | |
| }, | |
| { | |
| "epoch": 16.24, | |
| "learning_rate": 0.0009307064252751154, | |
| "loss": 0.122, | |
| "step": 25410 | |
| }, | |
| { | |
| "epoch": 16.24, | |
| "learning_rate": 0.0009306354277600284, | |
| "loss": 0.141, | |
| "step": 25420 | |
| }, | |
| { | |
| "epoch": 16.25, | |
| "learning_rate": 0.0009305644302449414, | |
| "loss": 0.1267, | |
| "step": 25430 | |
| }, | |
| { | |
| "epoch": 16.26, | |
| "learning_rate": 0.0009304934327298545, | |
| "loss": 0.1027, | |
| "step": 25440 | |
| }, | |
| { | |
| "epoch": 16.26, | |
| "learning_rate": 0.0009304224352147675, | |
| "loss": 0.1542, | |
| "step": 25450 | |
| }, | |
| { | |
| "epoch": 16.27, | |
| "learning_rate": 0.0009303514376996806, | |
| "loss": 0.1143, | |
| "step": 25460 | |
| }, | |
| { | |
| "epoch": 16.27, | |
| "learning_rate": 0.0009302804401845935, | |
| "loss": 0.1454, | |
| "step": 25470 | |
| }, | |
| { | |
| "epoch": 16.28, | |
| "learning_rate": 0.0009302094426695066, | |
| "loss": 0.1523, | |
| "step": 25480 | |
| }, | |
| { | |
| "epoch": 16.29, | |
| "learning_rate": 0.0009301384451544196, | |
| "loss": 0.1088, | |
| "step": 25490 | |
| }, | |
| { | |
| "epoch": 16.29, | |
| "learning_rate": 0.0009300674476393326, | |
| "loss": 0.1545, | |
| "step": 25500 | |
| }, | |
| { | |
| "epoch": 16.3, | |
| "learning_rate": 0.0009299964501242457, | |
| "loss": 0.1418, | |
| "step": 25510 | |
| }, | |
| { | |
| "epoch": 16.31, | |
| "learning_rate": 0.0009299254526091588, | |
| "loss": 0.1418, | |
| "step": 25520 | |
| }, | |
| { | |
| "epoch": 16.31, | |
| "learning_rate": 0.0009298544550940717, | |
| "loss": 0.1424, | |
| "step": 25530 | |
| }, | |
| { | |
| "epoch": 16.32, | |
| "learning_rate": 0.0009297834575789848, | |
| "loss": 0.1374, | |
| "step": 25540 | |
| }, | |
| { | |
| "epoch": 16.33, | |
| "learning_rate": 0.0009297124600638978, | |
| "loss": 0.148, | |
| "step": 25550 | |
| }, | |
| { | |
| "epoch": 16.33, | |
| "learning_rate": 0.0009296414625488108, | |
| "loss": 0.1299, | |
| "step": 25560 | |
| }, | |
| { | |
| "epoch": 16.34, | |
| "learning_rate": 0.0009295704650337239, | |
| "loss": 0.1407, | |
| "step": 25570 | |
| }, | |
| { | |
| "epoch": 16.34, | |
| "learning_rate": 0.000929499467518637, | |
| "loss": 0.1308, | |
| "step": 25580 | |
| }, | |
| { | |
| "epoch": 16.35, | |
| "learning_rate": 0.0009294284700035499, | |
| "loss": 0.1344, | |
| "step": 25590 | |
| }, | |
| { | |
| "epoch": 16.36, | |
| "learning_rate": 0.0009293574724884629, | |
| "loss": 0.1084, | |
| "step": 25600 | |
| }, | |
| { | |
| "epoch": 16.36, | |
| "learning_rate": 0.0009292864749733759, | |
| "loss": 0.1325, | |
| "step": 25610 | |
| }, | |
| { | |
| "epoch": 16.37, | |
| "learning_rate": 0.0009292154774582889, | |
| "loss": 0.133, | |
| "step": 25620 | |
| }, | |
| { | |
| "epoch": 16.38, | |
| "learning_rate": 0.0009291444799432021, | |
| "loss": 0.107, | |
| "step": 25630 | |
| }, | |
| { | |
| "epoch": 16.38, | |
| "learning_rate": 0.000929073482428115, | |
| "loss": 0.1486, | |
| "step": 25640 | |
| }, | |
| { | |
| "epoch": 16.39, | |
| "learning_rate": 0.0009290024849130281, | |
| "loss": 0.1332, | |
| "step": 25650 | |
| }, | |
| { | |
| "epoch": 16.4, | |
| "learning_rate": 0.000928931487397941, | |
| "loss": 0.1404, | |
| "step": 25660 | |
| }, | |
| { | |
| "epoch": 16.4, | |
| "learning_rate": 0.0009288604898828541, | |
| "loss": 0.1448, | |
| "step": 25670 | |
| }, | |
| { | |
| "epoch": 16.41, | |
| "learning_rate": 0.0009287894923677671, | |
| "loss": 0.1351, | |
| "step": 25680 | |
| }, | |
| { | |
| "epoch": 16.42, | |
| "learning_rate": 0.0009287184948526802, | |
| "loss": 0.1293, | |
| "step": 25690 | |
| }, | |
| { | |
| "epoch": 16.42, | |
| "learning_rate": 0.0009286474973375932, | |
| "loss": 0.1368, | |
| "step": 25700 | |
| }, | |
| { | |
| "epoch": 16.43, | |
| "learning_rate": 0.0009285764998225063, | |
| "loss": 0.1199, | |
| "step": 25710 | |
| }, | |
| { | |
| "epoch": 16.43, | |
| "learning_rate": 0.0009285055023074192, | |
| "loss": 0.1127, | |
| "step": 25720 | |
| }, | |
| { | |
| "epoch": 16.44, | |
| "learning_rate": 0.0009284345047923323, | |
| "loss": 0.146, | |
| "step": 25730 | |
| }, | |
| { | |
| "epoch": 16.45, | |
| "learning_rate": 0.0009283635072772452, | |
| "loss": 0.1567, | |
| "step": 25740 | |
| }, | |
| { | |
| "epoch": 16.45, | |
| "learning_rate": 0.0009282925097621584, | |
| "loss": 0.1227, | |
| "step": 25750 | |
| }, | |
| { | |
| "epoch": 16.46, | |
| "learning_rate": 0.0009282215122470714, | |
| "loss": 0.1116, | |
| "step": 25760 | |
| }, | |
| { | |
| "epoch": 16.47, | |
| "learning_rate": 0.0009281505147319844, | |
| "loss": 0.1299, | |
| "step": 25770 | |
| }, | |
| { | |
| "epoch": 16.47, | |
| "learning_rate": 0.0009280795172168974, | |
| "loss": 0.1208, | |
| "step": 25780 | |
| }, | |
| { | |
| "epoch": 16.48, | |
| "learning_rate": 0.0009280085197018105, | |
| "loss": 0.1362, | |
| "step": 25790 | |
| }, | |
| { | |
| "epoch": 16.49, | |
| "learning_rate": 0.0009279375221867234, | |
| "loss": 0.1251, | |
| "step": 25800 | |
| }, | |
| { | |
| "epoch": 16.49, | |
| "learning_rate": 0.0009278665246716365, | |
| "loss": 0.1411, | |
| "step": 25810 | |
| }, | |
| { | |
| "epoch": 16.5, | |
| "learning_rate": 0.0009277955271565496, | |
| "loss": 0.1121, | |
| "step": 25820 | |
| }, | |
| { | |
| "epoch": 16.5, | |
| "learning_rate": 0.0009277245296414626, | |
| "loss": 0.1616, | |
| "step": 25830 | |
| }, | |
| { | |
| "epoch": 16.51, | |
| "learning_rate": 0.0009276535321263756, | |
| "loss": 0.1454, | |
| "step": 25840 | |
| }, | |
| { | |
| "epoch": 16.52, | |
| "learning_rate": 0.0009275825346112887, | |
| "loss": 0.122, | |
| "step": 25850 | |
| }, | |
| { | |
| "epoch": 16.52, | |
| "learning_rate": 0.0009275115370962016, | |
| "loss": 0.1452, | |
| "step": 25860 | |
| }, | |
| { | |
| "epoch": 16.53, | |
| "learning_rate": 0.0009274405395811147, | |
| "loss": 0.1088, | |
| "step": 25870 | |
| }, | |
| { | |
| "epoch": 16.54, | |
| "learning_rate": 0.0009273695420660277, | |
| "loss": 0.1377, | |
| "step": 25880 | |
| }, | |
| { | |
| "epoch": 16.54, | |
| "learning_rate": 0.0009272985445509408, | |
| "loss": 0.1186, | |
| "step": 25890 | |
| }, | |
| { | |
| "epoch": 16.55, | |
| "learning_rate": 0.0009272275470358538, | |
| "loss": 0.1247, | |
| "step": 25900 | |
| }, | |
| { | |
| "epoch": 16.56, | |
| "learning_rate": 0.0009271565495207667, | |
| "loss": 0.0938, | |
| "step": 25910 | |
| }, | |
| { | |
| "epoch": 16.56, | |
| "learning_rate": 0.0009270855520056798, | |
| "loss": 0.1685, | |
| "step": 25920 | |
| }, | |
| { | |
| "epoch": 16.57, | |
| "learning_rate": 0.0009270145544905927, | |
| "loss": 0.1359, | |
| "step": 25930 | |
| }, | |
| { | |
| "epoch": 16.57, | |
| "learning_rate": 0.0009269435569755059, | |
| "loss": 0.1519, | |
| "step": 25940 | |
| }, | |
| { | |
| "epoch": 16.58, | |
| "learning_rate": 0.0009268725594604189, | |
| "loss": 0.1279, | |
| "step": 25950 | |
| }, | |
| { | |
| "epoch": 16.59, | |
| "learning_rate": 0.000926801561945332, | |
| "loss": 0.1069, | |
| "step": 25960 | |
| }, | |
| { | |
| "epoch": 16.59, | |
| "learning_rate": 0.0009267305644302449, | |
| "loss": 0.1241, | |
| "step": 25970 | |
| }, | |
| { | |
| "epoch": 16.6, | |
| "learning_rate": 0.000926659566915158, | |
| "loss": 0.1594, | |
| "step": 25980 | |
| }, | |
| { | |
| "epoch": 16.61, | |
| "learning_rate": 0.0009265885694000709, | |
| "loss": 0.1272, | |
| "step": 25990 | |
| }, | |
| { | |
| "epoch": 16.61, | |
| "learning_rate": 0.0009265175718849841, | |
| "loss": 0.1267, | |
| "step": 26000 | |
| }, | |
| { | |
| "epoch": 16.62, | |
| "learning_rate": 0.0009264465743698971, | |
| "loss": 0.1224, | |
| "step": 26010 | |
| }, | |
| { | |
| "epoch": 16.63, | |
| "learning_rate": 0.0009263755768548101, | |
| "loss": 0.1352, | |
| "step": 26020 | |
| }, | |
| { | |
| "epoch": 16.63, | |
| "learning_rate": 0.0009263045793397231, | |
| "loss": 0.1276, | |
| "step": 26030 | |
| }, | |
| { | |
| "epoch": 16.64, | |
| "learning_rate": 0.0009262335818246362, | |
| "loss": 0.123, | |
| "step": 26040 | |
| }, | |
| { | |
| "epoch": 16.65, | |
| "learning_rate": 0.0009261625843095491, | |
| "loss": 0.1321, | |
| "step": 26050 | |
| }, | |
| { | |
| "epoch": 16.65, | |
| "learning_rate": 0.0009260915867944623, | |
| "loss": 0.1449, | |
| "step": 26060 | |
| }, | |
| { | |
| "epoch": 16.66, | |
| "learning_rate": 0.0009260205892793752, | |
| "loss": 0.1492, | |
| "step": 26070 | |
| }, | |
| { | |
| "epoch": 16.66, | |
| "learning_rate": 0.0009259495917642883, | |
| "loss": 0.1182, | |
| "step": 26080 | |
| }, | |
| { | |
| "epoch": 16.67, | |
| "learning_rate": 0.0009258785942492013, | |
| "loss": 0.1407, | |
| "step": 26090 | |
| }, | |
| { | |
| "epoch": 16.68, | |
| "learning_rate": 0.0009258075967341143, | |
| "loss": 0.1472, | |
| "step": 26100 | |
| }, | |
| { | |
| "epoch": 16.68, | |
| "learning_rate": 0.0009257365992190273, | |
| "loss": 0.1404, | |
| "step": 26110 | |
| }, | |
| { | |
| "epoch": 16.69, | |
| "learning_rate": 0.0009256656017039405, | |
| "loss": 0.1511, | |
| "step": 26120 | |
| }, | |
| { | |
| "epoch": 16.7, | |
| "learning_rate": 0.0009255946041888534, | |
| "loss": 0.1255, | |
| "step": 26130 | |
| }, | |
| { | |
| "epoch": 16.7, | |
| "learning_rate": 0.0009255236066737665, | |
| "loss": 0.1221, | |
| "step": 26140 | |
| }, | |
| { | |
| "epoch": 16.71, | |
| "learning_rate": 0.0009254526091586794, | |
| "loss": 0.1251, | |
| "step": 26150 | |
| }, | |
| { | |
| "epoch": 16.72, | |
| "learning_rate": 0.0009253816116435925, | |
| "loss": 0.1232, | |
| "step": 26160 | |
| }, | |
| { | |
| "epoch": 16.72, | |
| "learning_rate": 0.0009253106141285055, | |
| "loss": 0.1382, | |
| "step": 26170 | |
| }, | |
| { | |
| "epoch": 16.73, | |
| "learning_rate": 0.0009252396166134186, | |
| "loss": 0.135, | |
| "step": 26180 | |
| }, | |
| { | |
| "epoch": 16.73, | |
| "learning_rate": 0.0009251686190983316, | |
| "loss": 0.1372, | |
| "step": 26190 | |
| }, | |
| { | |
| "epoch": 16.74, | |
| "learning_rate": 0.0009250976215832447, | |
| "loss": 0.1124, | |
| "step": 26200 | |
| }, | |
| { | |
| "epoch": 16.75, | |
| "learning_rate": 0.0009250266240681576, | |
| "loss": 0.1464, | |
| "step": 26210 | |
| }, | |
| { | |
| "epoch": 16.75, | |
| "learning_rate": 0.0009249556265530706, | |
| "loss": 0.1388, | |
| "step": 26220 | |
| }, | |
| { | |
| "epoch": 16.76, | |
| "learning_rate": 0.0009248846290379837, | |
| "loss": 0.1212, | |
| "step": 26230 | |
| }, | |
| { | |
| "epoch": 16.77, | |
| "learning_rate": 0.0009248136315228967, | |
| "loss": 0.1517, | |
| "step": 26240 | |
| }, | |
| { | |
| "epoch": 16.77, | |
| "learning_rate": 0.0009247426340078098, | |
| "loss": 0.1009, | |
| "step": 26250 | |
| }, | |
| { | |
| "epoch": 16.78, | |
| "learning_rate": 0.0009246716364927227, | |
| "loss": 0.1296, | |
| "step": 26260 | |
| }, | |
| { | |
| "epoch": 16.79, | |
| "learning_rate": 0.0009246006389776358, | |
| "loss": 0.1443, | |
| "step": 26270 | |
| }, | |
| { | |
| "epoch": 16.79, | |
| "learning_rate": 0.0009245296414625488, | |
| "loss": 0.1436, | |
| "step": 26280 | |
| }, | |
| { | |
| "epoch": 16.8, | |
| "learning_rate": 0.0009244586439474618, | |
| "loss": 0.1104, | |
| "step": 26290 | |
| }, | |
| { | |
| "epoch": 16.8, | |
| "learning_rate": 0.0009243876464323749, | |
| "loss": 0.1109, | |
| "step": 26300 | |
| }, | |
| { | |
| "epoch": 16.81, | |
| "learning_rate": 0.000924316648917288, | |
| "loss": 0.1459, | |
| "step": 26310 | |
| }, | |
| { | |
| "epoch": 16.82, | |
| "learning_rate": 0.0009242456514022009, | |
| "loss": 0.131, | |
| "step": 26320 | |
| }, | |
| { | |
| "epoch": 16.82, | |
| "learning_rate": 0.000924174653887114, | |
| "loss": 0.1423, | |
| "step": 26330 | |
| }, | |
| { | |
| "epoch": 16.83, | |
| "learning_rate": 0.000924103656372027, | |
| "loss": 0.1342, | |
| "step": 26340 | |
| }, | |
| { | |
| "epoch": 16.84, | |
| "learning_rate": 0.00092403265885694, | |
| "loss": 0.1241, | |
| "step": 26350 | |
| }, | |
| { | |
| "epoch": 16.84, | |
| "learning_rate": 0.000923961661341853, | |
| "loss": 0.1781, | |
| "step": 26360 | |
| }, | |
| { | |
| "epoch": 16.85, | |
| "learning_rate": 0.0009238906638267661, | |
| "loss": 0.116, | |
| "step": 26370 | |
| }, | |
| { | |
| "epoch": 16.86, | |
| "learning_rate": 0.0009238196663116791, | |
| "loss": 0.1799, | |
| "step": 26380 | |
| }, | |
| { | |
| "epoch": 16.86, | |
| "learning_rate": 0.0009237486687965922, | |
| "loss": 0.1317, | |
| "step": 26390 | |
| }, | |
| { | |
| "epoch": 16.87, | |
| "learning_rate": 0.0009236776712815051, | |
| "loss": 0.0983, | |
| "step": 26400 | |
| }, | |
| { | |
| "epoch": 16.88, | |
| "learning_rate": 0.0009236066737664182, | |
| "loss": 0.1497, | |
| "step": 26410 | |
| }, | |
| { | |
| "epoch": 16.88, | |
| "learning_rate": 0.0009235356762513312, | |
| "loss": 0.1571, | |
| "step": 26420 | |
| }, | |
| { | |
| "epoch": 16.89, | |
| "learning_rate": 0.0009234646787362443, | |
| "loss": 0.1443, | |
| "step": 26430 | |
| }, | |
| { | |
| "epoch": 16.89, | |
| "learning_rate": 0.0009233936812211573, | |
| "loss": 0.1457, | |
| "step": 26440 | |
| }, | |
| { | |
| "epoch": 16.9, | |
| "learning_rate": 0.0009233226837060703, | |
| "loss": 0.1255, | |
| "step": 26450 | |
| }, | |
| { | |
| "epoch": 16.91, | |
| "learning_rate": 0.0009232516861909833, | |
| "loss": 0.1181, | |
| "step": 26460 | |
| }, | |
| { | |
| "epoch": 16.91, | |
| "learning_rate": 0.0009231806886758964, | |
| "loss": 0.1382, | |
| "step": 26470 | |
| }, | |
| { | |
| "epoch": 16.92, | |
| "learning_rate": 0.0009231096911608093, | |
| "loss": 0.1318, | |
| "step": 26480 | |
| }, | |
| { | |
| "epoch": 16.93, | |
| "learning_rate": 0.0009230386936457225, | |
| "loss": 0.1427, | |
| "step": 26490 | |
| }, | |
| { | |
| "epoch": 16.93, | |
| "learning_rate": 0.0009229676961306355, | |
| "loss": 0.1359, | |
| "step": 26500 | |
| }, | |
| { | |
| "epoch": 16.94, | |
| "learning_rate": 0.0009228966986155485, | |
| "loss": 0.1099, | |
| "step": 26510 | |
| }, | |
| { | |
| "epoch": 16.95, | |
| "learning_rate": 0.0009228257011004615, | |
| "loss": 0.1713, | |
| "step": 26520 | |
| }, | |
| { | |
| "epoch": 16.95, | |
| "learning_rate": 0.0009227547035853744, | |
| "loss": 0.1392, | |
| "step": 26530 | |
| }, | |
| { | |
| "epoch": 16.96, | |
| "learning_rate": 0.0009226837060702875, | |
| "loss": 0.123, | |
| "step": 26540 | |
| }, | |
| { | |
| "epoch": 16.96, | |
| "learning_rate": 0.0009226127085552006, | |
| "loss": 0.1638, | |
| "step": 26550 | |
| }, | |
| { | |
| "epoch": 16.97, | |
| "learning_rate": 0.0009225417110401136, | |
| "loss": 0.152, | |
| "step": 26560 | |
| }, | |
| { | |
| "epoch": 16.98, | |
| "learning_rate": 0.0009224707135250266, | |
| "loss": 0.1197, | |
| "step": 26570 | |
| }, | |
| { | |
| "epoch": 16.98, | |
| "learning_rate": 0.0009223997160099397, | |
| "loss": 0.1322, | |
| "step": 26580 | |
| }, | |
| { | |
| "epoch": 16.99, | |
| "learning_rate": 0.0009223287184948526, | |
| "loss": 0.1272, | |
| "step": 26590 | |
| }, | |
| { | |
| "epoch": 17.0, | |
| "learning_rate": 0.0009222577209797657, | |
| "loss": 0.1141, | |
| "step": 26600 | |
| }, | |
| { | |
| "epoch": 17.0, | |
| "learning_rate": 0.0009221867234646788, | |
| "loss": 0.122, | |
| "step": 26610 | |
| }, | |
| { | |
| "epoch": 17.01, | |
| "learning_rate": 0.0009221157259495918, | |
| "loss": 0.1188, | |
| "step": 26620 | |
| }, | |
| { | |
| "epoch": 17.02, | |
| "learning_rate": 0.0009220447284345048, | |
| "loss": 0.1244, | |
| "step": 26630 | |
| }, | |
| { | |
| "epoch": 17.02, | |
| "learning_rate": 0.0009219737309194178, | |
| "loss": 0.1568, | |
| "step": 26640 | |
| }, | |
| { | |
| "epoch": 17.03, | |
| "learning_rate": 0.0009219027334043308, | |
| "loss": 0.1023, | |
| "step": 26650 | |
| }, | |
| { | |
| "epoch": 17.04, | |
| "learning_rate": 0.0009218317358892439, | |
| "loss": 0.1231, | |
| "step": 26660 | |
| }, | |
| { | |
| "epoch": 17.04, | |
| "learning_rate": 0.0009217607383741569, | |
| "loss": 0.1095, | |
| "step": 26670 | |
| }, | |
| { | |
| "epoch": 17.05, | |
| "learning_rate": 0.00092168974085907, | |
| "loss": 0.123, | |
| "step": 26680 | |
| }, | |
| { | |
| "epoch": 17.05, | |
| "learning_rate": 0.000921618743343983, | |
| "loss": 0.1071, | |
| "step": 26690 | |
| }, | |
| { | |
| "epoch": 17.06, | |
| "learning_rate": 0.000921547745828896, | |
| "loss": 0.1295, | |
| "step": 26700 | |
| }, | |
| { | |
| "epoch": 17.07, | |
| "learning_rate": 0.000921476748313809, | |
| "loss": 0.1227, | |
| "step": 26710 | |
| }, | |
| { | |
| "epoch": 17.07, | |
| "learning_rate": 0.000921405750798722, | |
| "loss": 0.1109, | |
| "step": 26720 | |
| }, | |
| { | |
| "epoch": 17.08, | |
| "learning_rate": 0.0009213347532836351, | |
| "loss": 0.1039, | |
| "step": 26730 | |
| }, | |
| { | |
| "epoch": 17.09, | |
| "learning_rate": 0.0009212637557685482, | |
| "loss": 0.1291, | |
| "step": 26740 | |
| }, | |
| { | |
| "epoch": 17.09, | |
| "learning_rate": 0.0009211927582534611, | |
| "loss": 0.11, | |
| "step": 26750 | |
| }, | |
| { | |
| "epoch": 17.1, | |
| "learning_rate": 0.0009211217607383742, | |
| "loss": 0.1387, | |
| "step": 26760 | |
| }, | |
| { | |
| "epoch": 17.11, | |
| "learning_rate": 0.0009210507632232872, | |
| "loss": 0.1014, | |
| "step": 26770 | |
| }, | |
| { | |
| "epoch": 17.11, | |
| "learning_rate": 0.0009209797657082002, | |
| "loss": 0.1332, | |
| "step": 26780 | |
| }, | |
| { | |
| "epoch": 17.12, | |
| "learning_rate": 0.0009209087681931133, | |
| "loss": 0.1355, | |
| "step": 26790 | |
| }, | |
| { | |
| "epoch": 17.12, | |
| "learning_rate": 0.0009208377706780264, | |
| "loss": 0.1203, | |
| "step": 26800 | |
| }, | |
| { | |
| "epoch": 17.13, | |
| "learning_rate": 0.0009207667731629393, | |
| "loss": 0.1282, | |
| "step": 26810 | |
| }, | |
| { | |
| "epoch": 17.14, | |
| "learning_rate": 0.0009206957756478524, | |
| "loss": 0.1236, | |
| "step": 26820 | |
| }, | |
| { | |
| "epoch": 17.14, | |
| "learning_rate": 0.0009206247781327653, | |
| "loss": 0.1301, | |
| "step": 26830 | |
| }, | |
| { | |
| "epoch": 17.15, | |
| "learning_rate": 0.0009205537806176783, | |
| "loss": 0.1248, | |
| "step": 26840 | |
| }, | |
| { | |
| "epoch": 17.16, | |
| "learning_rate": 0.0009204827831025915, | |
| "loss": 0.1393, | |
| "step": 26850 | |
| }, | |
| { | |
| "epoch": 17.16, | |
| "learning_rate": 0.0009204117855875044, | |
| "loss": 0.1158, | |
| "step": 26860 | |
| }, | |
| { | |
| "epoch": 17.17, | |
| "learning_rate": 0.0009203407880724175, | |
| "loss": 0.1415, | |
| "step": 26870 | |
| }, | |
| { | |
| "epoch": 17.18, | |
| "learning_rate": 0.0009202697905573305, | |
| "loss": 0.1166, | |
| "step": 26880 | |
| }, | |
| { | |
| "epoch": 17.18, | |
| "learning_rate": 0.0009201987930422435, | |
| "loss": 0.1273, | |
| "step": 26890 | |
| }, | |
| { | |
| "epoch": 17.19, | |
| "learning_rate": 0.0009201277955271565, | |
| "loss": 0.1322, | |
| "step": 26900 | |
| }, | |
| { | |
| "epoch": 17.19, | |
| "learning_rate": 0.0009200567980120697, | |
| "loss": 0.1042, | |
| "step": 26910 | |
| }, | |
| { | |
| "epoch": 17.2, | |
| "learning_rate": 0.0009199858004969826, | |
| "loss": 0.1692, | |
| "step": 26920 | |
| }, | |
| { | |
| "epoch": 17.21, | |
| "learning_rate": 0.0009199148029818957, | |
| "loss": 0.0913, | |
| "step": 26930 | |
| }, | |
| { | |
| "epoch": 17.21, | |
| "learning_rate": 0.0009198438054668086, | |
| "loss": 0.1293, | |
| "step": 26940 | |
| }, | |
| { | |
| "epoch": 17.22, | |
| "learning_rate": 0.0009197728079517217, | |
| "loss": 0.1275, | |
| "step": 26950 | |
| }, | |
| { | |
| "epoch": 17.23, | |
| "learning_rate": 0.0009197018104366347, | |
| "loss": 0.1086, | |
| "step": 26960 | |
| }, | |
| { | |
| "epoch": 17.23, | |
| "learning_rate": 0.0009196308129215477, | |
| "loss": 0.1151, | |
| "step": 26970 | |
| }, | |
| { | |
| "epoch": 17.24, | |
| "learning_rate": 0.0009195598154064608, | |
| "loss": 0.1449, | |
| "step": 26980 | |
| }, | |
| { | |
| "epoch": 17.25, | |
| "learning_rate": 0.0009194888178913739, | |
| "loss": 0.1332, | |
| "step": 26990 | |
| }, | |
| { | |
| "epoch": 17.25, | |
| "learning_rate": 0.0009194178203762868, | |
| "loss": 0.1148, | |
| "step": 27000 | |
| }, | |
| { | |
| "epoch": 17.26, | |
| "learning_rate": 0.0009193468228611999, | |
| "loss": 0.1344, | |
| "step": 27010 | |
| }, | |
| { | |
| "epoch": 17.27, | |
| "learning_rate": 0.0009192758253461128, | |
| "loss": 0.1061, | |
| "step": 27020 | |
| }, | |
| { | |
| "epoch": 17.27, | |
| "learning_rate": 0.0009192048278310259, | |
| "loss": 0.1154, | |
| "step": 27030 | |
| }, | |
| { | |
| "epoch": 17.28, | |
| "learning_rate": 0.000919133830315939, | |
| "loss": 0.0995, | |
| "step": 27040 | |
| }, | |
| { | |
| "epoch": 17.28, | |
| "learning_rate": 0.000919062832800852, | |
| "loss": 0.1339, | |
| "step": 27050 | |
| }, | |
| { | |
| "epoch": 17.29, | |
| "learning_rate": 0.000918991835285765, | |
| "loss": 0.1048, | |
| "step": 27060 | |
| }, | |
| { | |
| "epoch": 17.3, | |
| "learning_rate": 0.0009189208377706781, | |
| "loss": 0.1519, | |
| "step": 27070 | |
| }, | |
| { | |
| "epoch": 17.3, | |
| "learning_rate": 0.000918849840255591, | |
| "loss": 0.078, | |
| "step": 27080 | |
| }, | |
| { | |
| "epoch": 17.31, | |
| "learning_rate": 0.0009187788427405041, | |
| "loss": 0.1348, | |
| "step": 27090 | |
| }, | |
| { | |
| "epoch": 17.32, | |
| "learning_rate": 0.0009187078452254172, | |
| "loss": 0.1258, | |
| "step": 27100 | |
| }, | |
| { | |
| "epoch": 17.32, | |
| "learning_rate": 0.0009186368477103302, | |
| "loss": 0.1221, | |
| "step": 27110 | |
| }, | |
| { | |
| "epoch": 17.33, | |
| "learning_rate": 0.0009185658501952432, | |
| "loss": 0.1198, | |
| "step": 27120 | |
| }, | |
| { | |
| "epoch": 17.34, | |
| "learning_rate": 0.0009184948526801563, | |
| "loss": 0.0938, | |
| "step": 27130 | |
| }, | |
| { | |
| "epoch": 17.34, | |
| "learning_rate": 0.0009184238551650692, | |
| "loss": 0.1246, | |
| "step": 27140 | |
| }, | |
| { | |
| "epoch": 17.35, | |
| "learning_rate": 0.0009183528576499822, | |
| "loss": 0.132, | |
| "step": 27150 | |
| }, | |
| { | |
| "epoch": 17.35, | |
| "learning_rate": 0.0009182818601348953, | |
| "loss": 0.1265, | |
| "step": 27160 | |
| }, | |
| { | |
| "epoch": 17.36, | |
| "learning_rate": 0.0009182108626198083, | |
| "loss": 0.1348, | |
| "step": 27170 | |
| }, | |
| { | |
| "epoch": 17.37, | |
| "learning_rate": 0.0009181398651047214, | |
| "loss": 0.1407, | |
| "step": 27180 | |
| }, | |
| { | |
| "epoch": 17.37, | |
| "learning_rate": 0.0009180688675896343, | |
| "loss": 0.1409, | |
| "step": 27190 | |
| }, | |
| { | |
| "epoch": 17.38, | |
| "learning_rate": 0.0009179978700745474, | |
| "loss": 0.0996, | |
| "step": 27200 | |
| }, | |
| { | |
| "epoch": 17.39, | |
| "learning_rate": 0.0009179268725594603, | |
| "loss": 0.1391, | |
| "step": 27210 | |
| }, | |
| { | |
| "epoch": 17.39, | |
| "learning_rate": 0.0009178558750443735, | |
| "loss": 0.1252, | |
| "step": 27220 | |
| }, | |
| { | |
| "epoch": 17.4, | |
| "learning_rate": 0.0009177848775292865, | |
| "loss": 0.1404, | |
| "step": 27230 | |
| }, | |
| { | |
| "epoch": 17.41, | |
| "learning_rate": 0.0009177138800141995, | |
| "loss": 0.1238, | |
| "step": 27240 | |
| }, | |
| { | |
| "epoch": 17.41, | |
| "learning_rate": 0.0009176428824991125, | |
| "loss": 0.126, | |
| "step": 27250 | |
| }, | |
| { | |
| "epoch": 17.42, | |
| "learning_rate": 0.0009175718849840256, | |
| "loss": 0.1264, | |
| "step": 27260 | |
| }, | |
| { | |
| "epoch": 17.42, | |
| "learning_rate": 0.0009175008874689385, | |
| "loss": 0.1355, | |
| "step": 27270 | |
| }, | |
| { | |
| "epoch": 17.43, | |
| "learning_rate": 0.0009174298899538517, | |
| "loss": 0.1192, | |
| "step": 27280 | |
| }, | |
| { | |
| "epoch": 17.44, | |
| "learning_rate": 0.0009173588924387647, | |
| "loss": 0.1355, | |
| "step": 27290 | |
| }, | |
| { | |
| "epoch": 17.44, | |
| "learning_rate": 0.0009172878949236777, | |
| "loss": 0.1259, | |
| "step": 27300 | |
| }, | |
| { | |
| "epoch": 17.45, | |
| "learning_rate": 0.0009172168974085907, | |
| "loss": 0.1207, | |
| "step": 27310 | |
| }, | |
| { | |
| "epoch": 17.46, | |
| "learning_rate": 0.0009171458998935038, | |
| "loss": 0.111, | |
| "step": 27320 | |
| }, | |
| { | |
| "epoch": 17.46, | |
| "learning_rate": 0.0009170749023784167, | |
| "loss": 0.1248, | |
| "step": 27330 | |
| }, | |
| { | |
| "epoch": 17.47, | |
| "learning_rate": 0.0009170039048633299, | |
| "loss": 0.1155, | |
| "step": 27340 | |
| }, | |
| { | |
| "epoch": 17.48, | |
| "learning_rate": 0.0009169329073482428, | |
| "loss": 0.1202, | |
| "step": 27350 | |
| }, | |
| { | |
| "epoch": 17.48, | |
| "learning_rate": 0.0009168619098331559, | |
| "loss": 0.1468, | |
| "step": 27360 | |
| }, | |
| { | |
| "epoch": 17.49, | |
| "learning_rate": 0.0009167909123180689, | |
| "loss": 0.1278, | |
| "step": 27370 | |
| }, | |
| { | |
| "epoch": 17.5, | |
| "learning_rate": 0.0009167199148029819, | |
| "loss": 0.1361, | |
| "step": 27380 | |
| }, | |
| { | |
| "epoch": 17.5, | |
| "learning_rate": 0.0009166489172878949, | |
| "loss": 0.1249, | |
| "step": 27390 | |
| }, | |
| { | |
| "epoch": 17.51, | |
| "learning_rate": 0.0009165779197728081, | |
| "loss": 0.1392, | |
| "step": 27400 | |
| }, | |
| { | |
| "epoch": 17.51, | |
| "learning_rate": 0.000916506922257721, | |
| "loss": 0.1001, | |
| "step": 27410 | |
| }, | |
| { | |
| "epoch": 17.52, | |
| "learning_rate": 0.0009164359247426341, | |
| "loss": 0.1354, | |
| "step": 27420 | |
| }, | |
| { | |
| "epoch": 17.53, | |
| "learning_rate": 0.000916364927227547, | |
| "loss": 0.1063, | |
| "step": 27430 | |
| }, | |
| { | |
| "epoch": 17.53, | |
| "learning_rate": 0.0009162939297124601, | |
| "loss": 0.1433, | |
| "step": 27440 | |
| }, | |
| { | |
| "epoch": 17.54, | |
| "learning_rate": 0.0009162229321973731, | |
| "loss": 0.1294, | |
| "step": 27450 | |
| }, | |
| { | |
| "epoch": 17.55, | |
| "learning_rate": 0.0009161519346822862, | |
| "loss": 0.1183, | |
| "step": 27460 | |
| }, | |
| { | |
| "epoch": 17.55, | |
| "learning_rate": 0.0009160809371671992, | |
| "loss": 0.1353, | |
| "step": 27470 | |
| }, | |
| { | |
| "epoch": 17.56, | |
| "learning_rate": 0.0009160099396521122, | |
| "loss": 0.1012, | |
| "step": 27480 | |
| }, | |
| { | |
| "epoch": 17.57, | |
| "learning_rate": 0.0009159389421370252, | |
| "loss": 0.1388, | |
| "step": 27490 | |
| }, | |
| { | |
| "epoch": 17.57, | |
| "learning_rate": 0.0009158679446219382, | |
| "loss": 0.1329, | |
| "step": 27500 | |
| }, | |
| { | |
| "epoch": 17.58, | |
| "learning_rate": 0.0009157969471068513, | |
| "loss": 0.1465, | |
| "step": 27510 | |
| }, | |
| { | |
| "epoch": 17.58, | |
| "learning_rate": 0.0009157259495917643, | |
| "loss": 0.1405, | |
| "step": 27520 | |
| }, | |
| { | |
| "epoch": 17.59, | |
| "learning_rate": 0.0009156549520766774, | |
| "loss": 0.1375, | |
| "step": 27530 | |
| }, | |
| { | |
| "epoch": 17.6, | |
| "learning_rate": 0.0009155839545615903, | |
| "loss": 0.1431, | |
| "step": 27540 | |
| }, | |
| { | |
| "epoch": 17.6, | |
| "learning_rate": 0.0009155129570465034, | |
| "loss": 0.1102, | |
| "step": 27550 | |
| }, | |
| { | |
| "epoch": 17.61, | |
| "learning_rate": 0.0009154419595314164, | |
| "loss": 0.1477, | |
| "step": 27560 | |
| }, | |
| { | |
| "epoch": 17.62, | |
| "learning_rate": 0.0009153709620163294, | |
| "loss": 0.1203, | |
| "step": 27570 | |
| }, | |
| { | |
| "epoch": 17.62, | |
| "learning_rate": 0.0009152999645012424, | |
| "loss": 0.142, | |
| "step": 27580 | |
| }, | |
| { | |
| "epoch": 17.63, | |
| "learning_rate": 0.0009152289669861556, | |
| "loss": 0.1107, | |
| "step": 27590 | |
| }, | |
| { | |
| "epoch": 17.64, | |
| "learning_rate": 0.0009151579694710685, | |
| "loss": 0.0862, | |
| "step": 27600 | |
| }, | |
| { | |
| "epoch": 17.64, | |
| "learning_rate": 0.0009150869719559816, | |
| "loss": 0.1198, | |
| "step": 27610 | |
| }, | |
| { | |
| "epoch": 17.65, | |
| "learning_rate": 0.0009150159744408945, | |
| "loss": 0.1224, | |
| "step": 27620 | |
| }, | |
| { | |
| "epoch": 17.65, | |
| "learning_rate": 0.0009149449769258076, | |
| "loss": 0.1223, | |
| "step": 27630 | |
| }, | |
| { | |
| "epoch": 17.66, | |
| "learning_rate": 0.0009148739794107206, | |
| "loss": 0.1656, | |
| "step": 27640 | |
| }, | |
| { | |
| "epoch": 17.67, | |
| "learning_rate": 0.0009148029818956337, | |
| "loss": 0.1391, | |
| "step": 27650 | |
| }, | |
| { | |
| "epoch": 17.67, | |
| "learning_rate": 0.0009147319843805467, | |
| "loss": 0.1391, | |
| "step": 27660 | |
| }, | |
| { | |
| "epoch": 17.68, | |
| "learning_rate": 0.0009146609868654598, | |
| "loss": 0.1292, | |
| "step": 27670 | |
| }, | |
| { | |
| "epoch": 17.69, | |
| "learning_rate": 0.0009145899893503727, | |
| "loss": 0.1195, | |
| "step": 27680 | |
| }, | |
| { | |
| "epoch": 17.69, | |
| "learning_rate": 0.0009145189918352858, | |
| "loss": 0.1563, | |
| "step": 27690 | |
| }, | |
| { | |
| "epoch": 17.7, | |
| "learning_rate": 0.0009144479943201987, | |
| "loss": 0.1435, | |
| "step": 27700 | |
| }, | |
| { | |
| "epoch": 17.71, | |
| "learning_rate": 0.0009143769968051119, | |
| "loss": 0.1365, | |
| "step": 27710 | |
| }, | |
| { | |
| "epoch": 17.71, | |
| "learning_rate": 0.0009143059992900249, | |
| "loss": 0.1296, | |
| "step": 27720 | |
| }, | |
| { | |
| "epoch": 17.72, | |
| "learning_rate": 0.000914235001774938, | |
| "loss": 0.1118, | |
| "step": 27730 | |
| }, | |
| { | |
| "epoch": 17.73, | |
| "learning_rate": 0.0009141640042598509, | |
| "loss": 0.115, | |
| "step": 27740 | |
| }, | |
| { | |
| "epoch": 17.73, | |
| "learning_rate": 0.000914093006744764, | |
| "loss": 0.1173, | |
| "step": 27750 | |
| }, | |
| { | |
| "epoch": 17.74, | |
| "learning_rate": 0.0009140220092296769, | |
| "loss": 0.1318, | |
| "step": 27760 | |
| }, | |
| { | |
| "epoch": 17.74, | |
| "learning_rate": 0.0009139510117145901, | |
| "loss": 0.1547, | |
| "step": 27770 | |
| }, | |
| { | |
| "epoch": 17.75, | |
| "learning_rate": 0.0009138800141995031, | |
| "loss": 0.1173, | |
| "step": 27780 | |
| }, | |
| { | |
| "epoch": 17.76, | |
| "learning_rate": 0.000913809016684416, | |
| "loss": 0.1173, | |
| "step": 27790 | |
| }, | |
| { | |
| "epoch": 17.76, | |
| "learning_rate": 0.0009137380191693291, | |
| "loss": 0.1154, | |
| "step": 27800 | |
| }, | |
| { | |
| "epoch": 17.77, | |
| "learning_rate": 0.000913667021654242, | |
| "loss": 0.1305, | |
| "step": 27810 | |
| }, | |
| { | |
| "epoch": 17.78, | |
| "learning_rate": 0.0009135960241391551, | |
| "loss": 0.1241, | |
| "step": 27820 | |
| }, | |
| { | |
| "epoch": 17.78, | |
| "learning_rate": 0.0009135250266240682, | |
| "loss": 0.1159, | |
| "step": 27830 | |
| }, | |
| { | |
| "epoch": 17.79, | |
| "learning_rate": 0.0009134540291089812, | |
| "loss": 0.1501, | |
| "step": 27840 | |
| }, | |
| { | |
| "epoch": 17.8, | |
| "learning_rate": 0.0009133830315938942, | |
| "loss": 0.1342, | |
| "step": 27850 | |
| }, | |
| { | |
| "epoch": 17.8, | |
| "learning_rate": 0.0009133120340788073, | |
| "loss": 0.1278, | |
| "step": 27860 | |
| }, | |
| { | |
| "epoch": 17.81, | |
| "learning_rate": 0.0009132410365637202, | |
| "loss": 0.134, | |
| "step": 27870 | |
| }, | |
| { | |
| "epoch": 17.81, | |
| "learning_rate": 0.0009131700390486333, | |
| "loss": 0.1363, | |
| "step": 27880 | |
| }, | |
| { | |
| "epoch": 17.82, | |
| "learning_rate": 0.0009130990415335464, | |
| "loss": 0.1314, | |
| "step": 27890 | |
| }, | |
| { | |
| "epoch": 17.83, | |
| "learning_rate": 0.0009130280440184594, | |
| "loss": 0.1324, | |
| "step": 27900 | |
| }, | |
| { | |
| "epoch": 17.83, | |
| "learning_rate": 0.0009129570465033724, | |
| "loss": 0.1197, | |
| "step": 27910 | |
| }, | |
| { | |
| "epoch": 17.84, | |
| "learning_rate": 0.0009128860489882854, | |
| "loss": 0.1307, | |
| "step": 27920 | |
| }, | |
| { | |
| "epoch": 17.85, | |
| "learning_rate": 0.0009128150514731984, | |
| "loss": 0.1197, | |
| "step": 27930 | |
| }, | |
| { | |
| "epoch": 17.85, | |
| "learning_rate": 0.0009127440539581115, | |
| "loss": 0.1454, | |
| "step": 27940 | |
| }, | |
| { | |
| "epoch": 17.86, | |
| "learning_rate": 0.0009126730564430245, | |
| "loss": 0.1155, | |
| "step": 27950 | |
| }, | |
| { | |
| "epoch": 17.87, | |
| "learning_rate": 0.0009126020589279376, | |
| "loss": 0.1238, | |
| "step": 27960 | |
| }, | |
| { | |
| "epoch": 17.87, | |
| "learning_rate": 0.0009125310614128506, | |
| "loss": 0.102, | |
| "step": 27970 | |
| }, | |
| { | |
| "epoch": 17.88, | |
| "learning_rate": 0.0009124600638977636, | |
| "loss": 0.1501, | |
| "step": 27980 | |
| }, | |
| { | |
| "epoch": 17.88, | |
| "learning_rate": 0.0009123890663826766, | |
| "loss": 0.1435, | |
| "step": 27990 | |
| }, | |
| { | |
| "epoch": 17.89, | |
| "learning_rate": 0.0009123180688675897, | |
| "loss": 0.1381, | |
| "step": 28000 | |
| }, | |
| { | |
| "epoch": 17.9, | |
| "learning_rate": 0.0009122470713525027, | |
| "loss": 0.1478, | |
| "step": 28010 | |
| }, | |
| { | |
| "epoch": 17.9, | |
| "learning_rate": 0.0009121760738374158, | |
| "loss": 0.1608, | |
| "step": 28020 | |
| }, | |
| { | |
| "epoch": 17.91, | |
| "learning_rate": 0.0009121050763223287, | |
| "loss": 0.16, | |
| "step": 28030 | |
| }, | |
| { | |
| "epoch": 17.92, | |
| "learning_rate": 0.0009120340788072418, | |
| "loss": 0.1383, | |
| "step": 28040 | |
| }, | |
| { | |
| "epoch": 17.92, | |
| "learning_rate": 0.0009119630812921548, | |
| "loss": 0.1365, | |
| "step": 28050 | |
| }, | |
| { | |
| "epoch": 17.93, | |
| "learning_rate": 0.0009118920837770678, | |
| "loss": 0.1274, | |
| "step": 28060 | |
| }, | |
| { | |
| "epoch": 17.94, | |
| "learning_rate": 0.0009118210862619809, | |
| "loss": 0.1176, | |
| "step": 28070 | |
| }, | |
| { | |
| "epoch": 17.94, | |
| "learning_rate": 0.000911750088746894, | |
| "loss": 0.1474, | |
| "step": 28080 | |
| }, | |
| { | |
| "epoch": 17.95, | |
| "learning_rate": 0.0009116790912318069, | |
| "loss": 0.1065, | |
| "step": 28090 | |
| }, | |
| { | |
| "epoch": 17.95, | |
| "learning_rate": 0.0009116080937167199, | |
| "loss": 0.1241, | |
| "step": 28100 | |
| }, | |
| { | |
| "epoch": 17.96, | |
| "learning_rate": 0.000911537096201633, | |
| "loss": 0.123, | |
| "step": 28110 | |
| }, | |
| { | |
| "epoch": 17.97, | |
| "learning_rate": 0.0009114660986865459, | |
| "loss": 0.1231, | |
| "step": 28120 | |
| }, | |
| { | |
| "epoch": 17.97, | |
| "learning_rate": 0.0009113951011714591, | |
| "loss": 0.1273, | |
| "step": 28130 | |
| }, | |
| { | |
| "epoch": 17.98, | |
| "learning_rate": 0.000911324103656372, | |
| "loss": 0.136, | |
| "step": 28140 | |
| }, | |
| { | |
| "epoch": 17.99, | |
| "learning_rate": 0.0009112531061412851, | |
| "loss": 0.1333, | |
| "step": 28150 | |
| }, | |
| { | |
| "epoch": 17.99, | |
| "learning_rate": 0.0009111821086261981, | |
| "loss": 0.1464, | |
| "step": 28160 | |
| }, | |
| { | |
| "epoch": 18.0, | |
| "learning_rate": 0.0009111111111111111, | |
| "loss": 0.1176, | |
| "step": 28170 | |
| }, | |
| { | |
| "epoch": 18.01, | |
| "learning_rate": 0.0009110401135960241, | |
| "loss": 0.1254, | |
| "step": 28180 | |
| }, | |
| { | |
| "epoch": 18.01, | |
| "learning_rate": 0.0009109691160809372, | |
| "loss": 0.111, | |
| "step": 28190 | |
| }, | |
| { | |
| "epoch": 18.02, | |
| "learning_rate": 0.0009108981185658502, | |
| "loss": 0.1208, | |
| "step": 28200 | |
| }, | |
| { | |
| "epoch": 18.03, | |
| "learning_rate": 0.0009108271210507633, | |
| "loss": 0.1233, | |
| "step": 28210 | |
| }, | |
| { | |
| "epoch": 18.03, | |
| "learning_rate": 0.0009107561235356762, | |
| "loss": 0.097, | |
| "step": 28220 | |
| }, | |
| { | |
| "epoch": 18.04, | |
| "learning_rate": 0.0009106851260205893, | |
| "loss": 0.1101, | |
| "step": 28230 | |
| }, | |
| { | |
| "epoch": 18.04, | |
| "learning_rate": 0.0009106141285055023, | |
| "loss": 0.0998, | |
| "step": 28240 | |
| }, | |
| { | |
| "epoch": 18.05, | |
| "learning_rate": 0.0009105431309904153, | |
| "loss": 0.116, | |
| "step": 28250 | |
| }, | |
| { | |
| "epoch": 18.06, | |
| "learning_rate": 0.0009104721334753284, | |
| "loss": 0.1068, | |
| "step": 28260 | |
| }, | |
| { | |
| "epoch": 18.06, | |
| "learning_rate": 0.0009104011359602415, | |
| "loss": 0.1056, | |
| "step": 28270 | |
| }, | |
| { | |
| "epoch": 18.07, | |
| "learning_rate": 0.0009103301384451544, | |
| "loss": 0.1343, | |
| "step": 28280 | |
| }, | |
| { | |
| "epoch": 18.08, | |
| "learning_rate": 0.0009102591409300675, | |
| "loss": 0.1656, | |
| "step": 28290 | |
| }, | |
| { | |
| "epoch": 18.08, | |
| "learning_rate": 0.0009101881434149804, | |
| "loss": 0.1124, | |
| "step": 28300 | |
| }, | |
| { | |
| "epoch": 18.09, | |
| "learning_rate": 0.0009101171458998935, | |
| "loss": 0.1164, | |
| "step": 28310 | |
| }, | |
| { | |
| "epoch": 18.1, | |
| "learning_rate": 0.0009100461483848066, | |
| "loss": 0.0916, | |
| "step": 28320 | |
| }, | |
| { | |
| "epoch": 18.1, | |
| "learning_rate": 0.0009099751508697196, | |
| "loss": 0.1054, | |
| "step": 28330 | |
| }, | |
| { | |
| "epoch": 18.11, | |
| "learning_rate": 0.0009099041533546326, | |
| "loss": 0.1102, | |
| "step": 28340 | |
| }, | |
| { | |
| "epoch": 18.11, | |
| "learning_rate": 0.0009098331558395457, | |
| "loss": 0.1293, | |
| "step": 28350 | |
| }, | |
| { | |
| "epoch": 18.12, | |
| "learning_rate": 0.0009097621583244586, | |
| "loss": 0.1283, | |
| "step": 28360 | |
| }, | |
| { | |
| "epoch": 18.13, | |
| "learning_rate": 0.0009096911608093717, | |
| "loss": 0.1168, | |
| "step": 28370 | |
| }, | |
| { | |
| "epoch": 18.13, | |
| "learning_rate": 0.0009096201632942848, | |
| "loss": 0.0809, | |
| "step": 28380 | |
| }, | |
| { | |
| "epoch": 18.14, | |
| "learning_rate": 0.0009095491657791978, | |
| "loss": 0.1197, | |
| "step": 28390 | |
| }, | |
| { | |
| "epoch": 18.15, | |
| "learning_rate": 0.0009094781682641108, | |
| "loss": 0.1149, | |
| "step": 28400 | |
| }, | |
| { | |
| "epoch": 18.15, | |
| "learning_rate": 0.0009094071707490237, | |
| "loss": 0.1162, | |
| "step": 28410 | |
| }, | |
| { | |
| "epoch": 18.16, | |
| "learning_rate": 0.0009093361732339368, | |
| "loss": 0.1258, | |
| "step": 28420 | |
| }, | |
| { | |
| "epoch": 18.17, | |
| "learning_rate": 0.0009092651757188498, | |
| "loss": 0.1266, | |
| "step": 28430 | |
| }, | |
| { | |
| "epoch": 18.17, | |
| "learning_rate": 0.0009091941782037629, | |
| "loss": 0.1502, | |
| "step": 28440 | |
| }, | |
| { | |
| "epoch": 18.18, | |
| "learning_rate": 0.0009091231806886759, | |
| "loss": 0.1195, | |
| "step": 28450 | |
| }, | |
| { | |
| "epoch": 18.19, | |
| "learning_rate": 0.000909052183173589, | |
| "loss": 0.1035, | |
| "step": 28460 | |
| }, | |
| { | |
| "epoch": 18.19, | |
| "learning_rate": 0.0009089811856585019, | |
| "loss": 0.1482, | |
| "step": 28470 | |
| }, | |
| { | |
| "epoch": 18.2, | |
| "learning_rate": 0.000908910188143415, | |
| "loss": 0.1187, | |
| "step": 28480 | |
| }, | |
| { | |
| "epoch": 18.2, | |
| "learning_rate": 0.000908839190628328, | |
| "loss": 0.1204, | |
| "step": 28490 | |
| }, | |
| { | |
| "epoch": 18.21, | |
| "learning_rate": 0.0009087681931132411, | |
| "loss": 0.1059, | |
| "step": 28500 | |
| }, | |
| { | |
| "epoch": 18.22, | |
| "learning_rate": 0.0009086971955981541, | |
| "loss": 0.1164, | |
| "step": 28510 | |
| }, | |
| { | |
| "epoch": 18.22, | |
| "learning_rate": 0.0009086261980830671, | |
| "loss": 0.1168, | |
| "step": 28520 | |
| }, | |
| { | |
| "epoch": 18.23, | |
| "learning_rate": 0.0009085552005679801, | |
| "loss": 0.1324, | |
| "step": 28530 | |
| }, | |
| { | |
| "epoch": 18.24, | |
| "learning_rate": 0.0009084842030528932, | |
| "loss": 0.124, | |
| "step": 28540 | |
| }, | |
| { | |
| "epoch": 18.24, | |
| "learning_rate": 0.0009084132055378061, | |
| "loss": 0.1028, | |
| "step": 28550 | |
| }, | |
| { | |
| "epoch": 18.25, | |
| "learning_rate": 0.0009083422080227193, | |
| "loss": 0.1057, | |
| "step": 28560 | |
| }, | |
| { | |
| "epoch": 18.26, | |
| "learning_rate": 0.0009082712105076323, | |
| "loss": 0.1132, | |
| "step": 28570 | |
| }, | |
| { | |
| "epoch": 18.26, | |
| "learning_rate": 0.0009082002129925453, | |
| "loss": 0.1164, | |
| "step": 28580 | |
| }, | |
| { | |
| "epoch": 18.27, | |
| "learning_rate": 0.0009081292154774583, | |
| "loss": 0.1129, | |
| "step": 28590 | |
| }, | |
| { | |
| "epoch": 18.27, | |
| "learning_rate": 0.0009080582179623713, | |
| "loss": 0.1185, | |
| "step": 28600 | |
| }, | |
| { | |
| "epoch": 18.28, | |
| "learning_rate": 0.0009079872204472843, | |
| "loss": 0.1268, | |
| "step": 28610 | |
| }, | |
| { | |
| "epoch": 18.29, | |
| "learning_rate": 0.0009079162229321975, | |
| "loss": 0.1184, | |
| "step": 28620 | |
| }, | |
| { | |
| "epoch": 18.29, | |
| "learning_rate": 0.0009078452254171104, | |
| "loss": 0.0942, | |
| "step": 28630 | |
| }, | |
| { | |
| "epoch": 18.3, | |
| "learning_rate": 0.0009077742279020235, | |
| "loss": 0.109, | |
| "step": 28640 | |
| }, | |
| { | |
| "epoch": 18.31, | |
| "learning_rate": 0.0009077032303869365, | |
| "loss": 0.0995, | |
| "step": 28650 | |
| }, | |
| { | |
| "epoch": 18.31, | |
| "learning_rate": 0.0009076322328718495, | |
| "loss": 0.1432, | |
| "step": 28660 | |
| }, | |
| { | |
| "epoch": 18.32, | |
| "learning_rate": 0.0009075612353567625, | |
| "loss": 0.1517, | |
| "step": 28670 | |
| }, | |
| { | |
| "epoch": 18.33, | |
| "learning_rate": 0.0009074902378416757, | |
| "loss": 0.1044, | |
| "step": 28680 | |
| }, | |
| { | |
| "epoch": 18.33, | |
| "learning_rate": 0.0009074192403265886, | |
| "loss": 0.0846, | |
| "step": 28690 | |
| }, | |
| { | |
| "epoch": 18.34, | |
| "learning_rate": 0.0009073482428115017, | |
| "loss": 0.1275, | |
| "step": 28700 | |
| }, | |
| { | |
| "epoch": 18.34, | |
| "learning_rate": 0.0009072772452964146, | |
| "loss": 0.0935, | |
| "step": 28710 | |
| }, | |
| { | |
| "epoch": 18.35, | |
| "learning_rate": 0.0009072062477813276, | |
| "loss": 0.0898, | |
| "step": 28720 | |
| }, | |
| { | |
| "epoch": 18.36, | |
| "learning_rate": 0.0009071352502662407, | |
| "loss": 0.127, | |
| "step": 28730 | |
| }, | |
| { | |
| "epoch": 18.36, | |
| "learning_rate": 0.0009070642527511536, | |
| "loss": 0.1172, | |
| "step": 28740 | |
| }, | |
| { | |
| "epoch": 18.37, | |
| "learning_rate": 0.0009069932552360668, | |
| "loss": 0.1069, | |
| "step": 28750 | |
| }, | |
| { | |
| "epoch": 18.38, | |
| "learning_rate": 0.0009069222577209798, | |
| "loss": 0.1378, | |
| "step": 28760 | |
| }, | |
| { | |
| "epoch": 18.38, | |
| "learning_rate": 0.0009068512602058928, | |
| "loss": 0.1268, | |
| "step": 28770 | |
| }, | |
| { | |
| "epoch": 18.39, | |
| "learning_rate": 0.0009067802626908058, | |
| "loss": 0.0926, | |
| "step": 28780 | |
| }, | |
| { | |
| "epoch": 18.4, | |
| "learning_rate": 0.0009067092651757188, | |
| "loss": 0.1208, | |
| "step": 28790 | |
| }, | |
| { | |
| "epoch": 18.4, | |
| "learning_rate": 0.0009066382676606318, | |
| "loss": 0.1234, | |
| "step": 28800 | |
| }, | |
| { | |
| "epoch": 18.41, | |
| "learning_rate": 0.000906567270145545, | |
| "loss": 0.1548, | |
| "step": 28810 | |
| }, | |
| { | |
| "epoch": 18.42, | |
| "learning_rate": 0.0009064962726304579, | |
| "loss": 0.1121, | |
| "step": 28820 | |
| }, | |
| { | |
| "epoch": 18.42, | |
| "learning_rate": 0.000906425275115371, | |
| "loss": 0.1457, | |
| "step": 28830 | |
| }, | |
| { | |
| "epoch": 18.43, | |
| "learning_rate": 0.000906354277600284, | |
| "loss": 0.1252, | |
| "step": 28840 | |
| }, | |
| { | |
| "epoch": 18.43, | |
| "learning_rate": 0.000906283280085197, | |
| "loss": 0.1345, | |
| "step": 28850 | |
| }, | |
| { | |
| "epoch": 18.44, | |
| "learning_rate": 0.00090621228257011, | |
| "loss": 0.1101, | |
| "step": 28860 | |
| }, | |
| { | |
| "epoch": 18.45, | |
| "learning_rate": 0.0009061412850550232, | |
| "loss": 0.1146, | |
| "step": 28870 | |
| }, | |
| { | |
| "epoch": 18.45, | |
| "learning_rate": 0.0009060702875399361, | |
| "loss": 0.1232, | |
| "step": 28880 | |
| }, | |
| { | |
| "epoch": 18.46, | |
| "learning_rate": 0.0009059992900248492, | |
| "loss": 0.1239, | |
| "step": 28890 | |
| }, | |
| { | |
| "epoch": 18.47, | |
| "learning_rate": 0.0009059282925097621, | |
| "loss": 0.1202, | |
| "step": 28900 | |
| }, | |
| { | |
| "epoch": 18.47, | |
| "learning_rate": 0.0009058572949946752, | |
| "loss": 0.1124, | |
| "step": 28910 | |
| }, | |
| { | |
| "epoch": 18.48, | |
| "learning_rate": 0.0009057862974795882, | |
| "loss": 0.1148, | |
| "step": 28920 | |
| }, | |
| { | |
| "epoch": 18.49, | |
| "learning_rate": 0.0009057152999645013, | |
| "loss": 0.1111, | |
| "step": 28930 | |
| }, | |
| { | |
| "epoch": 18.49, | |
| "learning_rate": 0.0009056443024494143, | |
| "loss": 0.1243, | |
| "step": 28940 | |
| }, | |
| { | |
| "epoch": 18.5, | |
| "learning_rate": 0.0009055733049343274, | |
| "loss": 0.1227, | |
| "step": 28950 | |
| }, | |
| { | |
| "epoch": 18.5, | |
| "learning_rate": 0.0009055023074192403, | |
| "loss": 0.0993, | |
| "step": 28960 | |
| }, | |
| { | |
| "epoch": 18.51, | |
| "learning_rate": 0.0009054313099041534, | |
| "loss": 0.1286, | |
| "step": 28970 | |
| }, | |
| { | |
| "epoch": 18.52, | |
| "learning_rate": 0.0009053603123890663, | |
| "loss": 0.1054, | |
| "step": 28980 | |
| }, | |
| { | |
| "epoch": 18.52, | |
| "learning_rate": 0.0009052893148739795, | |
| "loss": 0.1196, | |
| "step": 28990 | |
| }, | |
| { | |
| "epoch": 18.53, | |
| "learning_rate": 0.0009052183173588925, | |
| "loss": 0.1255, | |
| "step": 29000 | |
| }, | |
| { | |
| "epoch": 18.54, | |
| "learning_rate": 0.0009051473198438055, | |
| "loss": 0.1325, | |
| "step": 29010 | |
| }, | |
| { | |
| "epoch": 18.54, | |
| "learning_rate": 0.0009050763223287185, | |
| "loss": 0.1161, | |
| "step": 29020 | |
| }, | |
| { | |
| "epoch": 18.55, | |
| "learning_rate": 0.0009050053248136315, | |
| "loss": 0.1144, | |
| "step": 29030 | |
| }, | |
| { | |
| "epoch": 18.56, | |
| "learning_rate": 0.0009049343272985445, | |
| "loss": 0.1293, | |
| "step": 29040 | |
| }, | |
| { | |
| "epoch": 18.56, | |
| "learning_rate": 0.0009048633297834576, | |
| "loss": 0.1284, | |
| "step": 29050 | |
| }, | |
| { | |
| "epoch": 18.57, | |
| "learning_rate": 0.0009047923322683707, | |
| "loss": 0.1086, | |
| "step": 29060 | |
| }, | |
| { | |
| "epoch": 18.57, | |
| "learning_rate": 0.0009047213347532836, | |
| "loss": 0.1142, | |
| "step": 29070 | |
| }, | |
| { | |
| "epoch": 18.58, | |
| "learning_rate": 0.0009046503372381967, | |
| "loss": 0.1223, | |
| "step": 29080 | |
| }, | |
| { | |
| "epoch": 18.59, | |
| "learning_rate": 0.0009045793397231096, | |
| "loss": 0.137, | |
| "step": 29090 | |
| }, | |
| { | |
| "epoch": 18.59, | |
| "learning_rate": 0.0009045083422080227, | |
| "loss": 0.1287, | |
| "step": 29100 | |
| }, | |
| { | |
| "epoch": 18.6, | |
| "learning_rate": 0.0009044373446929358, | |
| "loss": 0.1208, | |
| "step": 29110 | |
| }, | |
| { | |
| "epoch": 18.61, | |
| "learning_rate": 0.0009043663471778488, | |
| "loss": 0.1086, | |
| "step": 29120 | |
| }, | |
| { | |
| "epoch": 18.61, | |
| "learning_rate": 0.0009042953496627618, | |
| "loss": 0.125, | |
| "step": 29130 | |
| }, | |
| { | |
| "epoch": 18.62, | |
| "learning_rate": 0.0009042243521476749, | |
| "loss": 0.1193, | |
| "step": 29140 | |
| }, | |
| { | |
| "epoch": 18.63, | |
| "learning_rate": 0.0009041533546325878, | |
| "loss": 0.1054, | |
| "step": 29150 | |
| }, | |
| { | |
| "epoch": 18.63, | |
| "learning_rate": 0.0009040823571175009, | |
| "loss": 0.1231, | |
| "step": 29160 | |
| }, | |
| { | |
| "epoch": 18.64, | |
| "learning_rate": 0.000904011359602414, | |
| "loss": 0.1086, | |
| "step": 29170 | |
| }, | |
| { | |
| "epoch": 18.65, | |
| "learning_rate": 0.000903940362087327, | |
| "loss": 0.1391, | |
| "step": 29180 | |
| }, | |
| { | |
| "epoch": 18.65, | |
| "learning_rate": 0.00090386936457224, | |
| "loss": 0.1039, | |
| "step": 29190 | |
| }, | |
| { | |
| "epoch": 18.66, | |
| "learning_rate": 0.000903798367057153, | |
| "loss": 0.14, | |
| "step": 29200 | |
| }, | |
| { | |
| "epoch": 18.66, | |
| "learning_rate": 0.000903727369542066, | |
| "loss": 0.1216, | |
| "step": 29210 | |
| }, | |
| { | |
| "epoch": 18.67, | |
| "learning_rate": 0.0009036563720269791, | |
| "loss": 0.1337, | |
| "step": 29220 | |
| }, | |
| { | |
| "epoch": 18.68, | |
| "learning_rate": 0.0009035853745118921, | |
| "loss": 0.1436, | |
| "step": 29230 | |
| }, | |
| { | |
| "epoch": 18.68, | |
| "learning_rate": 0.0009035143769968052, | |
| "loss": 0.1275, | |
| "step": 29240 | |
| }, | |
| { | |
| "epoch": 18.69, | |
| "learning_rate": 0.0009034433794817182, | |
| "loss": 0.1191, | |
| "step": 29250 | |
| }, | |
| { | |
| "epoch": 18.7, | |
| "learning_rate": 0.0009033723819666312, | |
| "loss": 0.1228, | |
| "step": 29260 | |
| }, | |
| { | |
| "epoch": 18.7, | |
| "learning_rate": 0.0009033013844515442, | |
| "loss": 0.1387, | |
| "step": 29270 | |
| }, | |
| { | |
| "epoch": 18.71, | |
| "learning_rate": 0.0009032303869364573, | |
| "loss": 0.146, | |
| "step": 29280 | |
| }, | |
| { | |
| "epoch": 18.72, | |
| "learning_rate": 0.0009031593894213703, | |
| "loss": 0.1387, | |
| "step": 29290 | |
| }, | |
| { | |
| "epoch": 18.72, | |
| "learning_rate": 0.0009030883919062834, | |
| "loss": 0.0893, | |
| "step": 29300 | |
| }, | |
| { | |
| "epoch": 18.73, | |
| "learning_rate": 0.0009030173943911963, | |
| "loss": 0.1221, | |
| "step": 29310 | |
| }, | |
| { | |
| "epoch": 18.73, | |
| "learning_rate": 0.0009029463968761094, | |
| "loss": 0.1158, | |
| "step": 29320 | |
| }, | |
| { | |
| "epoch": 18.74, | |
| "learning_rate": 0.0009028753993610224, | |
| "loss": 0.1393, | |
| "step": 29330 | |
| }, | |
| { | |
| "epoch": 18.75, | |
| "learning_rate": 0.0009028044018459353, | |
| "loss": 0.1195, | |
| "step": 29340 | |
| }, | |
| { | |
| "epoch": 18.75, | |
| "learning_rate": 0.0009027334043308484, | |
| "loss": 0.1365, | |
| "step": 29350 | |
| }, | |
| { | |
| "epoch": 18.76, | |
| "learning_rate": 0.0009026624068157615, | |
| "loss": 0.1153, | |
| "step": 29360 | |
| }, | |
| { | |
| "epoch": 18.77, | |
| "learning_rate": 0.0009025914093006745, | |
| "loss": 0.1396, | |
| "step": 29370 | |
| }, | |
| { | |
| "epoch": 18.77, | |
| "learning_rate": 0.0009025204117855875, | |
| "loss": 0.1326, | |
| "step": 29380 | |
| }, | |
| { | |
| "epoch": 18.78, | |
| "learning_rate": 0.0009024494142705005, | |
| "loss": 0.1302, | |
| "step": 29390 | |
| }, | |
| { | |
| "epoch": 18.79, | |
| "learning_rate": 0.0009023784167554135, | |
| "loss": 0.142, | |
| "step": 29400 | |
| }, | |
| { | |
| "epoch": 18.79, | |
| "learning_rate": 0.0009023074192403266, | |
| "loss": 0.1146, | |
| "step": 29410 | |
| }, | |
| { | |
| "epoch": 18.8, | |
| "learning_rate": 0.0009022364217252396, | |
| "loss": 0.1048, | |
| "step": 29420 | |
| }, | |
| { | |
| "epoch": 18.8, | |
| "learning_rate": 0.0009021654242101527, | |
| "loss": 0.1186, | |
| "step": 29430 | |
| }, | |
| { | |
| "epoch": 18.81, | |
| "learning_rate": 0.0009020944266950657, | |
| "loss": 0.1196, | |
| "step": 29440 | |
| }, | |
| { | |
| "epoch": 18.82, | |
| "learning_rate": 0.0009020234291799787, | |
| "loss": 0.1468, | |
| "step": 29450 | |
| }, | |
| { | |
| "epoch": 18.82, | |
| "learning_rate": 0.0009019524316648917, | |
| "loss": 0.1145, | |
| "step": 29460 | |
| }, | |
| { | |
| "epoch": 18.83, | |
| "learning_rate": 0.0009018814341498048, | |
| "loss": 0.112, | |
| "step": 29470 | |
| }, | |
| { | |
| "epoch": 18.84, | |
| "learning_rate": 0.0009018104366347178, | |
| "loss": 0.1304, | |
| "step": 29480 | |
| }, | |
| { | |
| "epoch": 18.84, | |
| "learning_rate": 0.0009017394391196309, | |
| "loss": 0.1395, | |
| "step": 29490 | |
| }, | |
| { | |
| "epoch": 18.85, | |
| "learning_rate": 0.0009016684416045438, | |
| "loss": 0.1276, | |
| "step": 29500 | |
| }, | |
| { | |
| "epoch": 18.86, | |
| "learning_rate": 0.0009015974440894569, | |
| "loss": 0.097, | |
| "step": 29510 | |
| }, | |
| { | |
| "epoch": 18.86, | |
| "learning_rate": 0.0009015264465743699, | |
| "loss": 0.1287, | |
| "step": 29520 | |
| }, | |
| { | |
| "epoch": 18.87, | |
| "learning_rate": 0.0009014554490592829, | |
| "loss": 0.1234, | |
| "step": 29530 | |
| }, | |
| { | |
| "epoch": 18.88, | |
| "learning_rate": 0.000901384451544196, | |
| "loss": 0.1509, | |
| "step": 29540 | |
| }, | |
| { | |
| "epoch": 18.88, | |
| "learning_rate": 0.0009013134540291091, | |
| "loss": 0.1317, | |
| "step": 29550 | |
| }, | |
| { | |
| "epoch": 18.89, | |
| "learning_rate": 0.000901242456514022, | |
| "loss": 0.1198, | |
| "step": 29560 | |
| }, | |
| { | |
| "epoch": 18.89, | |
| "learning_rate": 0.0009011714589989351, | |
| "loss": 0.1212, | |
| "step": 29570 | |
| }, | |
| { | |
| "epoch": 18.9, | |
| "learning_rate": 0.000901100461483848, | |
| "loss": 0.1124, | |
| "step": 29580 | |
| }, | |
| { | |
| "epoch": 18.91, | |
| "learning_rate": 0.0009010294639687611, | |
| "loss": 0.1289, | |
| "step": 29590 | |
| }, | |
| { | |
| "epoch": 18.91, | |
| "learning_rate": 0.0009009584664536742, | |
| "loss": 0.0943, | |
| "step": 29600 | |
| }, | |
| { | |
| "epoch": 18.92, | |
| "learning_rate": 0.0009008874689385872, | |
| "loss": 0.1308, | |
| "step": 29610 | |
| }, | |
| { | |
| "epoch": 18.93, | |
| "learning_rate": 0.0009008164714235002, | |
| "loss": 0.1405, | |
| "step": 29620 | |
| }, | |
| { | |
| "epoch": 18.93, | |
| "learning_rate": 0.0009007454739084133, | |
| "loss": 0.1067, | |
| "step": 29630 | |
| }, | |
| { | |
| "epoch": 18.94, | |
| "learning_rate": 0.0009006744763933262, | |
| "loss": 0.1219, | |
| "step": 29640 | |
| }, | |
| { | |
| "epoch": 18.95, | |
| "learning_rate": 0.0009006034788782392, | |
| "loss": 0.1205, | |
| "step": 29650 | |
| }, | |
| { | |
| "epoch": 18.95, | |
| "learning_rate": 0.0009005324813631524, | |
| "loss": 0.1326, | |
| "step": 29660 | |
| }, | |
| { | |
| "epoch": 18.96, | |
| "learning_rate": 0.0009004614838480653, | |
| "loss": 0.1112, | |
| "step": 29670 | |
| }, | |
| { | |
| "epoch": 18.96, | |
| "learning_rate": 0.0009003904863329784, | |
| "loss": 0.1184, | |
| "step": 29680 | |
| }, | |
| { | |
| "epoch": 18.97, | |
| "learning_rate": 0.0009003194888178913, | |
| "loss": 0.1426, | |
| "step": 29690 | |
| }, | |
| { | |
| "epoch": 18.98, | |
| "learning_rate": 0.0009002484913028044, | |
| "loss": 0.1358, | |
| "step": 29700 | |
| }, | |
| { | |
| "epoch": 18.98, | |
| "learning_rate": 0.0009001774937877174, | |
| "loss": 0.1562, | |
| "step": 29710 | |
| }, | |
| { | |
| "epoch": 18.99, | |
| "learning_rate": 0.0009001064962726305, | |
| "loss": 0.1396, | |
| "step": 29720 | |
| }, | |
| { | |
| "epoch": 19.0, | |
| "learning_rate": 0.0009000354987575435, | |
| "loss": 0.1173, | |
| "step": 29730 | |
| }, | |
| { | |
| "epoch": 19.0, | |
| "learning_rate": 0.0008999645012424566, | |
| "loss": 0.1017, | |
| "step": 29740 | |
| }, | |
| { | |
| "epoch": 19.01, | |
| "learning_rate": 0.0008998935037273695, | |
| "loss": 0.1158, | |
| "step": 29750 | |
| }, | |
| { | |
| "epoch": 19.02, | |
| "learning_rate": 0.0008998225062122826, | |
| "loss": 0.109, | |
| "step": 29760 | |
| }, | |
| { | |
| "epoch": 19.02, | |
| "learning_rate": 0.0008997515086971955, | |
| "loss": 0.1313, | |
| "step": 29770 | |
| }, | |
| { | |
| "epoch": 19.03, | |
| "learning_rate": 0.0008996805111821087, | |
| "loss": 0.1366, | |
| "step": 29780 | |
| }, | |
| { | |
| "epoch": 19.04, | |
| "learning_rate": 0.0008996095136670217, | |
| "loss": 0.1002, | |
| "step": 29790 | |
| }, | |
| { | |
| "epoch": 19.04, | |
| "learning_rate": 0.0008995385161519347, | |
| "loss": 0.0708, | |
| "step": 29800 | |
| }, | |
| { | |
| "epoch": 19.05, | |
| "learning_rate": 0.0008994675186368477, | |
| "loss": 0.1137, | |
| "step": 29810 | |
| }, | |
| { | |
| "epoch": 19.05, | |
| "learning_rate": 0.0008993965211217608, | |
| "loss": 0.0956, | |
| "step": 29820 | |
| }, | |
| { | |
| "epoch": 19.06, | |
| "learning_rate": 0.0008993255236066737, | |
| "loss": 0.1274, | |
| "step": 29830 | |
| }, | |
| { | |
| "epoch": 19.07, | |
| "learning_rate": 0.0008992545260915869, | |
| "loss": 0.1048, | |
| "step": 29840 | |
| }, | |
| { | |
| "epoch": 19.07, | |
| "learning_rate": 0.0008991835285764999, | |
| "loss": 0.0961, | |
| "step": 29850 | |
| }, | |
| { | |
| "epoch": 19.08, | |
| "learning_rate": 0.0008991125310614129, | |
| "loss": 0.125, | |
| "step": 29860 | |
| }, | |
| { | |
| "epoch": 19.09, | |
| "learning_rate": 0.0008990415335463259, | |
| "loss": 0.1302, | |
| "step": 29870 | |
| }, | |
| { | |
| "epoch": 19.09, | |
| "learning_rate": 0.000898970536031239, | |
| "loss": 0.1347, | |
| "step": 29880 | |
| }, | |
| { | |
| "epoch": 19.1, | |
| "learning_rate": 0.0008988995385161519, | |
| "loss": 0.1157, | |
| "step": 29890 | |
| }, | |
| { | |
| "epoch": 19.11, | |
| "learning_rate": 0.0008988285410010651, | |
| "loss": 0.1186, | |
| "step": 29900 | |
| }, | |
| { | |
| "epoch": 19.11, | |
| "learning_rate": 0.000898757543485978, | |
| "loss": 0.1363, | |
| "step": 29910 | |
| }, | |
| { | |
| "epoch": 19.12, | |
| "learning_rate": 0.0008986865459708911, | |
| "loss": 0.1319, | |
| "step": 29920 | |
| }, | |
| { | |
| "epoch": 19.12, | |
| "learning_rate": 0.0008986155484558041, | |
| "loss": 0.1121, | |
| "step": 29930 | |
| }, | |
| { | |
| "epoch": 19.13, | |
| "learning_rate": 0.0008985445509407171, | |
| "loss": 0.0922, | |
| "step": 29940 | |
| }, | |
| { | |
| "epoch": 19.14, | |
| "learning_rate": 0.0008984735534256301, | |
| "loss": 0.1178, | |
| "step": 29950 | |
| }, | |
| { | |
| "epoch": 19.14, | |
| "learning_rate": 0.000898402555910543, | |
| "loss": 0.1193, | |
| "step": 29960 | |
| }, | |
| { | |
| "epoch": 19.15, | |
| "learning_rate": 0.0008983315583954562, | |
| "loss": 0.111, | |
| "step": 29970 | |
| }, | |
| { | |
| "epoch": 19.16, | |
| "learning_rate": 0.0008982605608803692, | |
| "loss": 0.0945, | |
| "step": 29980 | |
| }, | |
| { | |
| "epoch": 19.16, | |
| "learning_rate": 0.0008981895633652822, | |
| "loss": 0.119, | |
| "step": 29990 | |
| }, | |
| { | |
| "epoch": 19.17, | |
| "learning_rate": 0.0008981185658501952, | |
| "loss": 0.1203, | |
| "step": 30000 | |
| } | |
| ], | |
| "max_steps": 156500, | |
| "num_train_epochs": 100, | |
| "total_flos": 0.0, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |