-
Notifications
You must be signed in to change notification settings - Fork 63
/
log_base_pretrain.txt
800 lines (800 loc) · 65.7 KB
/
log_base_pretrain.txt
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
{"train_lr": 2.4920064e-05, "train_loss": 1.029866009569168, "epoch": 0}
{"train_lr": 7.492006399999998e-05, "train_loss": 0.826913864672184, "epoch": 1}
{"train_lr": 0.00012492006400000006, "train_loss": 0.7834360855937004, "epoch": 2}
{"train_lr": 0.00017492006399999992, "train_loss": 0.7394427828550338, "epoch": 3}
{"train_lr": 0.00022492006399999994, "train_loss": 0.7072458884239197, "epoch": 4}
{"train_lr": 0.0002749200639999999, "train_loss": 0.6952311094760895, "epoch": 5}
{"train_lr": 0.00032492006400000004, "train_loss": 0.6914466771841049, "epoch": 6}
{"train_lr": 0.00037492006400000006, "train_loss": 0.6886494241833687, "epoch": 7}
{"train_lr": 0.00042492006399999987, "train_loss": 0.6822491272926331, "epoch": 8}
{"train_lr": 0.00047492006400000044, "train_loss": 0.6565844881653786, "epoch": 9}
{"train_lr": 0.0005249200640000002, "train_loss": 0.6322732063770294, "epoch": 10}
{"train_lr": 0.0005749200639999999, "train_loss": 0.6173936517953873, "epoch": 11}
{"train_lr": 0.0006249200639999998, "train_loss": 0.5982944983005524, "epoch": 12}
{"train_lr": 0.0006749200640000005, "train_loss": 0.5760513068437576, "epoch": 13}
{"train_lr": 0.000724920064, "train_loss": 0.558085383951664, "epoch": 14}
{"train_lr": 0.0007749200639999998, "train_loss": 0.5438177249908447, "epoch": 15}
{"train_lr": 0.0008249200639999997, "train_loss": 0.5321405304253102, "epoch": 16}
{"train_lr": 0.0008749200639999996, "train_loss": 0.5226460194289684, "epoch": 17}
{"train_lr": 0.0009249200639999996, "train_loss": 0.5143405359089375, "epoch": 18}
{"train_lr": 0.0009749200640000003, "train_loss": 0.5078899907290936, "epoch": 19}
{"train_lr": 0.0010249200639999999, "train_loss": 0.5023593332231044, "epoch": 20}
{"train_lr": 0.0010749200640000002, "train_loss": 0.4975539141893387, "epoch": 21}
{"train_lr": 0.0011249200639999997, "train_loss": 0.49327956531047823, "epoch": 22}
{"train_lr": 0.001174920064000001, "train_loss": 0.48933574736714364, "epoch": 23}
{"train_lr": 0.001224920064, "train_loss": 0.4860016059339046, "epoch": 24}
{"train_lr": 0.0012749200639999999, "train_loss": 0.48271030520796776, "epoch": 25}
{"train_lr": 0.0013249200639999996, "train_loss": 0.48013067763447764, "epoch": 26}
{"train_lr": 0.0013749200639999988, "train_loss": 0.47759121404886246, "epoch": 27}
{"train_lr": 0.001424920064, "train_loss": 0.4752511966407299, "epoch": 28}
{"train_lr": 0.0014749200639999995, "train_loss": 0.47316404255628586, "epoch": 29}
{"train_lr": 0.001524920064000001, "train_loss": 0.4711698636054993, "epoch": 30}
{"train_lr": 0.001574920064, "train_loss": 0.4693278255581856, "epoch": 31}
{"train_lr": 0.0016249200640000012, "train_loss": 0.46783283928632735, "epoch": 32}
{"train_lr": 0.0016749200639999998, "train_loss": 0.46624995667934416, "epoch": 33}
{"train_lr": 0.0017249200640000002, "train_loss": 0.46449592822194097, "epoch": 34}
{"train_lr": 0.0017749200639999995, "train_loss": 0.46306066621541975, "epoch": 35}
{"train_lr": 0.0018249200639999994, "train_loss": 0.4618008250772953, "epoch": 36}
{"train_lr": 0.0018749200640000001, "train_loss": 0.46067862812876703, "epoch": 37}
{"train_lr": 0.0019249200639999994, "train_loss": 0.4598328410089016, "epoch": 38}
{"train_lr": 0.001974920064, "train_loss": 0.4584417822599411, "epoch": 39}
{"train_lr": 0.0019999971657724378, "train_loss": 0.4574848892211914, "epoch": 40}
{"train_lr": 0.001999980105982979, "train_loss": 0.45612444841861727, "epoch": 41}
{"train_lr": 0.0019999459593779763, "train_loss": 0.4549763072431087, "epoch": 42}
{"train_lr": 0.001999894726540914, "train_loss": 0.4538106670200825, "epoch": 43}
{"train_lr": 0.00199982640834721, "train_loss": 0.45279076434373855, "epoch": 44}
{"train_lr": 0.0019997410059642406, "train_loss": 0.45213532138466833, "epoch": 45}
{"train_lr": 0.001999638520851299, "train_loss": 0.45124949448108675, "epoch": 46}
{"train_lr": 0.0019995189547595644, "train_loss": 0.45040599479079246, "epoch": 47}
{"train_lr": 0.0019993823097320955, "train_loss": 0.44934970703125, "epoch": 48}
{"train_lr": 0.00199922858810378, "train_loss": 0.44850586191415787, "epoch": 49}
{"train_lr": 0.001999057792501294, "train_loss": 0.44782372673153875, "epoch": 50}
{"train_lr": 0.0019988699258430644, "train_loss": 0.4471781154215336, "epoch": 51}
{"train_lr": 0.001998664991339216, "train_loss": 0.44638750190138815, "epoch": 52}
{"train_lr": 0.001998442992491514, "train_loss": 0.44575022593736646, "epoch": 53}
{"train_lr": 0.001998203933093299, "train_loss": 0.4452553203165531, "epoch": 54}
{"train_lr": 0.0019979478172294477, "train_loss": 0.4447741946578026, "epoch": 55}
{"train_lr": 0.0019976746492762656, "train_loss": 0.4442489013373852, "epoch": 56}
{"train_lr": 0.001997384433901443, "train_loss": 0.4437332093179226, "epoch": 57}
{"train_lr": 0.0019970771760639545, "train_loss": 0.4431314005434513, "epoch": 58}
{"train_lr": 0.001996752881013995, "train_loss": 0.44259421687722206, "epoch": 59}
{"train_lr": 0.0019964115542928738, "train_loss": 0.4422669967353344, "epoch": 60}
{"train_lr": 0.0019960532017329145, "train_loss": 0.4417998247206211, "epoch": 61}
{"train_lr": 0.0019956778294573777, "train_loss": 0.44136346296072004, "epoch": 62}
{"train_lr": 0.0019952854438803442, "train_loss": 0.44111803106069564, "epoch": 63}
{"train_lr": 0.0019948760517065917, "train_loss": 0.44124629287719724, "epoch": 64}
{"train_lr": 0.001994449659931513, "train_loss": 0.44030142896175384, "epoch": 65}
{"train_lr": 0.001994006275840954, "train_loss": 0.4400160102546215, "epoch": 66}
{"train_lr": 0.001993545907011146, "train_loss": 0.4394983403027058, "epoch": 67}
{"train_lr": 0.0019930685613085016, "train_loss": 0.43934193002581595, "epoch": 68}
{"train_lr": 0.001992574246889553, "train_loss": 0.43939045332074167, "epoch": 69}
{"train_lr": 0.0019920629722007623, "train_loss": 0.43876420689821244, "epoch": 70}
{"train_lr": 0.001991534745978413, "train_loss": 0.4383896221101284, "epoch": 71}
{"train_lr": 0.00199098957724843, "train_loss": 0.43805962885022165, "epoch": 72}
{"train_lr": 0.001990427475326234, "train_loss": 0.4378157087266445, "epoch": 73}
{"train_lr": 0.0019898484498166082, "train_loss": 0.4375223469555378, "epoch": 74}
{"train_lr": 0.001989252510613496, "train_loss": 0.4371592809557915, "epoch": 75}
{"train_lr": 0.0019886396678998547, "train_loss": 0.43709583897590637, "epoch": 76}
{"train_lr": 0.001988009932147472, "train_loss": 0.43670710064172746, "epoch": 77}
{"train_lr": 0.0019873633141167983, "train_loss": 0.4365320971310139, "epoch": 78}
{"train_lr": 0.0019866998248567525, "train_loss": 0.4362802542924881, "epoch": 79}
{"train_lr": 0.0019860194757045316, "train_loss": 0.43601478363275525, "epoch": 80}
{"train_lr": 0.001985322278285424, "train_loss": 0.4358106957912445, "epoch": 81}
{"train_lr": 0.001984608244512617, "train_loss": 0.43634837040901187, "epoch": 82}
{"train_lr": 0.0019838773865869753, "train_loss": 0.4354546032965183, "epoch": 83}
{"train_lr": 0.001983129716996845, "train_loss": 0.43514904779195784, "epoch": 84}
{"train_lr": 0.0019823652485178316, "train_loss": 0.4349977902054787, "epoch": 85}
{"train_lr": 0.0019815839942125928, "train_loss": 0.4347984156310558, "epoch": 86}
{"train_lr": 0.001980785967430611, "train_loss": 0.4346069442749023, "epoch": 87}
{"train_lr": 0.001979971181807968, "train_loss": 0.43437728793025016, "epoch": 88}
{"train_lr": 0.0019791396512670954, "train_loss": 0.43415831446647646, "epoch": 89}
{"train_lr": 0.0019782913900165513, "train_loss": 0.43396707623004915, "epoch": 90}
{"train_lr": 0.001977426412550794, "train_loss": 0.43384554549455645, "epoch": 91}
{"train_lr": 0.0019765447336498893, "train_loss": 0.43357861334681513, "epoch": 92}
{"train_lr": 0.0019756463683793042, "train_loss": 0.43340606517791747, "epoch": 93}
{"train_lr": 0.0019747313320896127, "train_loss": 0.43321831868886945, "epoch": 94}
{"train_lr": 0.001973799640416274, "train_loss": 0.43303715973496437, "epoch": 95}
{"train_lr": 0.001972851309279318, "train_loss": 0.4329533623635769, "epoch": 96}
{"train_lr": 0.001971886354883114, "train_loss": 0.4327393824696541, "epoch": 97}
{"train_lr": 0.0019709047937160624, "train_loss": 0.4326424191534519, "epoch": 98}
{"train_lr": 0.00196990664255034, "train_loss": 0.432473964703083, "epoch": 99}
{"train_lr": 0.001968891918441605, "train_loss": 0.4323611004710197, "epoch": 100}
{"train_lr": 0.0019678606387286746, "train_loss": 0.43220903632044794, "epoch": 101}
{"train_lr": 0.0019668128210332835, "train_loss": 0.4320597696781158, "epoch": 102}
{"train_lr": 0.001965748483259745, "train_loss": 0.431807940363884, "epoch": 103}
{"train_lr": 0.0019646676435946544, "train_loss": 0.43166343091726306, "epoch": 104}
{"train_lr": 0.0019635703205065857, "train_loss": 0.43165171412825587, "epoch": 105}
{"train_lr": 0.001962456532745752, "train_loss": 0.4314692829966545, "epoch": 106}
{"train_lr": 0.001961326299343718, "train_loss": 0.43120107041597366, "epoch": 107}
{"train_lr": 0.0019601796396130477, "train_loss": 0.43122232078313827, "epoch": 108}
{"train_lr": 0.001959016573147011, "train_loss": 0.43111382276415827, "epoch": 109}
{"train_lr": 0.001957837119819182, "train_loss": 0.43085430263876917, "epoch": 110}
{"train_lr": 0.0019566412997831803, "train_loss": 0.43075852123498914, "epoch": 111}
{"train_lr": 0.0019554291334722604, "train_loss": 0.4307229078769684, "epoch": 112}
{"train_lr": 0.001954200641599004, "train_loss": 0.43064907240271566, "epoch": 113}
{"train_lr": 0.001952955845154955, "train_loss": 0.4303462516546249, "epoch": 114}
{"train_lr": 0.0019516947654102353, "train_loss": 0.430285882461071, "epoch": 115}
{"train_lr": 0.0019504174239132258, "train_loss": 0.4302071396172047, "epoch": 116}
{"train_lr": 0.0019491238424901728, "train_loss": 0.43007939971089365, "epoch": 117}
{"train_lr": 0.0019478140432448074, "train_loss": 0.42995246585607527, "epoch": 118}
{"train_lr": 0.0019464880485579859, "train_loss": 0.4299236563742161, "epoch": 119}
{"train_lr": 0.0019451458810873046, "train_loss": 0.42975575862526894, "epoch": 120}
{"train_lr": 0.0019437875637666987, "train_loss": 0.4296689044058323, "epoch": 121}
{"train_lr": 0.0019424131198060568, "train_loss": 0.4295571488142014, "epoch": 122}
{"train_lr": 0.001941022572690844, "train_loss": 0.4295304506480694, "epoch": 123}
{"train_lr": 0.0019396159461816677, "train_loss": 0.4295160254955292, "epoch": 124}
{"train_lr": 0.0019381932643138978, "train_loss": 0.4293148836731911, "epoch": 125}
{"train_lr": 0.0019367545513972342, "train_loss": 0.4292679689407349, "epoch": 126}
{"train_lr": 0.0019352998320153279, "train_loss": 0.42902680062055587, "epoch": 127}
{"train_lr": 0.0019338291310252987, "train_loss": 0.4290702934384346, "epoch": 128}
{"train_lr": 0.001932342473557387, "train_loss": 0.4288153325974941, "epoch": 129}
{"train_lr": 0.0019308398850144532, "train_loss": 0.4288082259654999, "epoch": 130}
{"train_lr": 0.0019293213910715973, "train_loss": 0.4287457905650139, "epoch": 131}
{"train_lr": 0.0019277870176756878, "train_loss": 0.42868427852988245, "epoch": 132}
{"train_lr": 0.0019262367910449316, "train_loss": 0.4285197732448578, "epoch": 133}
{"train_lr": 0.0019246707376684355, "train_loss": 0.4284260827243328, "epoch": 134}
{"train_lr": 0.0019230888843057212, "train_loss": 0.42834890897870065, "epoch": 135}
{"train_lr": 0.001921491257986288, "train_loss": 0.42836915620565413, "epoch": 136}
{"train_lr": 0.001919877886009182, "train_loss": 0.4281206827223301, "epoch": 137}
{"train_lr": 0.0019182487959424652, "train_loss": 0.4281239497900009, "epoch": 138}
{"train_lr": 0.0019166040156227992, "train_loss": 0.4281063589513302, "epoch": 139}
{"train_lr": 0.0019149435731549388, "train_loss": 0.42810667996406554, "epoch": 140}
{"train_lr": 0.001913267496911266, "train_loss": 0.42796390196084977, "epoch": 141}
{"train_lr": 0.001911575815531295, "train_loss": 0.4278896269261837, "epoch": 142}
{"train_lr": 0.001909868557921197, "train_loss": 0.42768696791529653, "epoch": 143}
{"train_lr": 0.0019081457532532941, "train_loss": 0.42768659583330154, "epoch": 144}
{"train_lr": 0.0019064074309655585, "train_loss": 0.42750629413723945, "epoch": 145}
{"train_lr": 0.0019046536207611357, "train_loss": 0.42743830469250677, "epoch": 146}
{"train_lr": 0.0019028843526077868, "train_loss": 0.42752327723503114, "epoch": 147}
{"train_lr": 0.0019010996567374366, "train_loss": 0.42736736696958544, "epoch": 148}
{"train_lr": 0.0018992995636456075, "train_loss": 0.4276691595375538, "epoch": 149}
{"train_lr": 0.0018974841040909193, "train_loss": 0.4272169639468193, "epoch": 150}
{"train_lr": 0.0018956533090945722, "train_loss": 0.4271261396050453, "epoch": 151}
{"train_lr": 0.0018938072099398014, "train_loss": 0.42715407326221466, "epoch": 152}
{"train_lr": 0.0018919458381713458, "train_loss": 0.4283799661755562, "epoch": 153}
{"train_lr": 0.0018900692255949196, "train_loss": 0.4275367811322212, "epoch": 154}
{"train_lr": 0.0018881774042766428, "train_loss": 0.42704309683442115, "epoch": 155}
{"train_lr": 0.0018862704065425273, "train_loss": 0.4270126509964466, "epoch": 156}
{"train_lr": 0.0018843482649779047, "train_loss": 0.42692647844552994, "epoch": 157}
{"train_lr": 0.0018824110124268732, "train_loss": 0.42698997198939326, "epoch": 158}
{"train_lr": 0.0018804586819917309, "train_loss": 0.42690860251784324, "epoch": 159}
{"train_lr": 0.0018784913070324137, "train_loss": 0.42671867433190347, "epoch": 160}
{"train_lr": 0.0018765089211659387, "train_loss": 0.4265693518280983, "epoch": 161}
{"train_lr": 0.0018745115582658063, "train_loss": 0.42649883098006247, "epoch": 162}
{"train_lr": 0.0018724992524614336, "train_loss": 0.42644061017632484, "epoch": 163}
{"train_lr": 0.0018704720381375868, "train_loss": 0.42639319202899933, "epoch": 164}
{"train_lr": 0.0018684299499337567, "train_loss": 0.4262290573775768, "epoch": 165}
{"train_lr": 0.0018663730227436023, "train_loss": 0.42622224123477936, "epoch": 166}
{"train_lr": 0.0018643012917143186, "train_loss": 0.4262301009774208, "epoch": 167}
{"train_lr": 0.0018622147922460915, "train_loss": 0.426052722042799, "epoch": 168}
{"train_lr": 0.0018601135599914326, "train_loss": 0.42615303208231925, "epoch": 169}
{"train_lr": 0.0018579976308546009, "train_loss": 0.4259471821427345, "epoch": 170}
{"train_lr": 0.0018558670409909955, "train_loss": 0.42602315420508385, "epoch": 171}
{"train_lr": 0.001853721826806509, "train_loss": 0.4258790579974651, "epoch": 172}
{"train_lr": 0.001851562024956937, "train_loss": 0.4258593296408653, "epoch": 173}
{"train_lr": 0.0018493876723473352, "train_loss": 0.42584737250208854, "epoch": 174}
{"train_lr": 0.0018471988061313895, "train_loss": 0.4257563955247402, "epoch": 175}
{"train_lr": 0.001844995463710784, "train_loss": 0.42564952899217606, "epoch": 176}
{"train_lr": 0.0018427776827345638, "train_loss": 0.425537062728405, "epoch": 177}
{"train_lr": 0.0018405455010984842, "train_loss": 0.42545911307930945, "epoch": 178}
{"train_lr": 0.0018382989569443692, "train_loss": 0.42556525562405584, "epoch": 179}
{"train_lr": 0.0018360380886594638, "train_loss": 0.4254311235845089, "epoch": 180}
{"train_lr": 0.0018337629348757645, "train_loss": 0.4255017030119896, "epoch": 181}
{"train_lr": 0.0018314735344693734, "train_loss": 0.42531982975006105, "epoch": 182}
{"train_lr": 0.0018291699265598315, "train_loss": 0.4253919682562351, "epoch": 183}
{"train_lr": 0.0018268521505094332, "train_loss": 0.42532408665418625, "epoch": 184}
{"train_lr": 0.0018245202459225905, "train_loss": 0.4252872289419174, "epoch": 185}
{"train_lr": 0.0018221742526451034, "train_loss": 0.42515819770097735, "epoch": 186}
{"train_lr": 0.0018198142107635346, "train_loss": 0.4251448391377926, "epoch": 187}
{"train_lr": 0.001817440160604478, "train_loss": 0.4251269141793251, "epoch": 188}
{"train_lr": 0.001815052142733913, "train_loss": 0.42496180029511454, "epoch": 189}
{"train_lr": 0.001812650197956469, "train_loss": 0.4249068469822407, "epoch": 190}
{"train_lr": 0.001810234367314759, "train_loss": 0.4250109994530678, "epoch": 191}
{"train_lr": 0.001807804692088656, "train_loss": 0.424981004846096, "epoch": 192}
{"train_lr": 0.0018053612137946117, "train_loss": 0.4247819488167763, "epoch": 193}
{"train_lr": 0.00180290397418492, "train_loss": 0.4246981884419918, "epoch": 194}
{"train_lr": 0.0018004330152470427, "train_loss": 0.4247443710744381, "epoch": 195}
{"train_lr": 0.001797948379202839, "train_loss": 0.42464397926330566, "epoch": 196}
{"train_lr": 0.001795450108507886, "train_loss": 0.4248728358566761, "epoch": 197}
{"train_lr": 0.0017929382458507345, "train_loss": 0.42464299993515014, "epoch": 198}
{"train_lr": 0.001790412834152188, "train_loss": 0.42458462185263635, "epoch": 199}
{"train_lr": 0.0017878739165645666, "train_loss": 0.4244833302080631, "epoch": 200}
{"train_lr": 0.0017853215364709624, "train_loss": 0.4244596959531307, "epoch": 201}
{"train_lr": 0.001782755737484517, "train_loss": 0.4243732154786587, "epoch": 202}
{"train_lr": 0.0017801765634476482, "train_loss": 0.42429113371372223, "epoch": 203}
{"train_lr": 0.0017775840584313269, "train_loss": 0.4243124633014202, "epoch": 204}
{"train_lr": 0.0017749782667343087, "train_loss": 0.4242242727458477, "epoch": 205}
{"train_lr": 0.0017723592328823872, "train_loss": 0.42419893629550937, "epoch": 206}
{"train_lr": 0.0017697270016276267, "train_loss": 0.424120762860775, "epoch": 207}
{"train_lr": 0.0017670816179475896, "train_loss": 0.4241485097467899, "epoch": 208}
{"train_lr": 0.0017644231270445914, "train_loss": 0.4241050954818726, "epoch": 209}
{"train_lr": 0.0017617515743449002, "train_loss": 0.42401950508356095, "epoch": 210}
{"train_lr": 0.0017590670054979855, "train_loss": 0.4240114216029644, "epoch": 211}
{"train_lr": 0.0017563694663757193, "train_loss": 0.4239511508405209, "epoch": 212}
{"train_lr": 0.001753659003071607, "train_loss": 0.4239001268327236, "epoch": 213}
{"train_lr": 0.0017509356618999798, "train_loss": 0.4238909521043301, "epoch": 214}
{"train_lr": 0.0017481994893952333, "train_loss": 0.42393678986430167, "epoch": 215}
{"train_lr": 0.0017454505323109951, "train_loss": 0.42374238679409026, "epoch": 216}
{"train_lr": 0.0017426888376193663, "train_loss": 0.42381820154190064, "epoch": 217}
{"train_lr": 0.0017399144525100897, "train_loss": 0.423696692097187, "epoch": 218}
{"train_lr": 0.0017371274243897503, "train_loss": 0.4236421609342098, "epoch": 219}
{"train_lr": 0.0017343278008809635, "train_loss": 0.42375850692987443, "epoch": 220}
{"train_lr": 0.0017315156298215765, "train_loss": 0.42361214114427564, "epoch": 221}
{"train_lr": 0.0017286909592638356, "train_loss": 0.423529484629631, "epoch": 222}
{"train_lr": 0.001725853837473557, "train_loss": 0.4241306705236435, "epoch": 223}
{"train_lr": 0.001723004312929336, "train_loss": 0.4236619794726372, "epoch": 224}
{"train_lr": 0.0017201424343216843, "train_loss": 0.423469975990057, "epoch": 225}
{"train_lr": 0.001717268250552199, "train_loss": 0.4235054041683674, "epoch": 226}
{"train_lr": 0.0017143818107327635, "train_loss": 0.4234480388879776, "epoch": 227}
{"train_lr": 0.001711483164184661, "train_loss": 0.42325710557699203, "epoch": 228}
{"train_lr": 0.0017085723604377695, "train_loss": 0.423364332896471, "epoch": 229}
{"train_lr": 0.001705649449229696, "train_loss": 0.4232913333415985, "epoch": 230}
{"train_lr": 0.0017027144805049166, "train_loss": 0.42325079972147944, "epoch": 231}
{"train_lr": 0.0016997675044139638, "train_loss": 0.4232346039891243, "epoch": 232}
{"train_lr": 0.0016968085713125144, "train_loss": 0.42314266840815545, "epoch": 233}
{"train_lr": 0.001693837731760583, "train_loss": 0.4230865432739258, "epoch": 234}
{"train_lr": 0.001690855036521616, "train_loss": 0.42304754146933554, "epoch": 235}
{"train_lr": 0.0016878605365616413, "train_loss": 0.4229908716440201, "epoch": 236}
{"train_lr": 0.0016848542830484078, "train_loss": 0.42301636381149293, "epoch": 237}
{"train_lr": 0.0016818363273504887, "train_loss": 0.4229623642385006, "epoch": 238}
{"train_lr": 0.0016788067210364202, "train_loss": 0.42286261225342753, "epoch": 239}
{"train_lr": 0.0016757655158738203, "train_loss": 0.4231466094911098, "epoch": 240}
{"train_lr": 0.0016727127638284855, "train_loss": 0.4228993058741093, "epoch": 241}
{"train_lr": 0.0016696485170635351, "train_loss": 0.4227703313648701, "epoch": 242}
{"train_lr": 0.001666572827938487, "train_loss": 0.42268667768239976, "epoch": 243}
{"train_lr": 0.0016634857490083828, "train_loss": 0.4226205878555775, "epoch": 244}
{"train_lr": 0.001660387333022884, "train_loss": 0.4228058986365795, "epoch": 245}
{"train_lr": 0.0016572776329253699, "train_loss": 0.4226573086321354, "epoch": 246}
{"train_lr": 0.0016541567018520343, "train_loss": 0.4226382351756096, "epoch": 247}
{"train_lr": 0.0016510245931309836, "train_loss": 0.42262957600951195, "epoch": 248}
{"train_lr": 0.001647881360281309, "train_loss": 0.42256055372953416, "epoch": 249}
{"train_lr": 0.0016447270570121876, "train_loss": 0.42256660661697387, "epoch": 250}
{"train_lr": 0.0016415617372219618, "train_loss": 0.4224966368377209, "epoch": 251}
{"train_lr": 0.001638385454997211, "train_loss": 0.422463566839695, "epoch": 252}
{"train_lr": 0.00163519826461184, "train_loss": 0.42237583945393564, "epoch": 253}
{"train_lr": 0.0016320002205261264, "train_loss": 0.42226354267001154, "epoch": 254}
{"train_lr": 0.0016287913773858353, "train_loss": 0.4222660710632801, "epoch": 255}
{"train_lr": 0.0016255717900212328, "train_loss": 0.4222601546764374, "epoch": 256}
{"train_lr": 0.0016223415134461888, "train_loss": 0.4221981988191605, "epoch": 257}
{"train_lr": 0.0016191006028572102, "train_loss": 0.4222234422802925, "epoch": 258}
{"train_lr": 0.0016158491136325235, "train_loss": 0.42203234511613846, "epoch": 259}
{"train_lr": 0.0016125871013311073, "train_loss": 0.4220574823975563, "epoch": 260}
{"train_lr": 0.0016093146216917486, "train_loss": 0.42207971769571306, "epoch": 261}
{"train_lr": 0.0016060317306321, "train_loss": 0.42206390278339384, "epoch": 262}
{"train_lr": 0.0016027384842477105, "train_loss": 0.4220549532175064, "epoch": 263}
{"train_lr": 0.0015994349388110693, "train_loss": 0.4220111142575741, "epoch": 264}
{"train_lr": 0.001596121150770662, "train_loss": 0.4219424910187721, "epoch": 265}
{"train_lr": 0.0015927971767499772, "train_loss": 0.4220361890375614, "epoch": 266}
{"train_lr": 0.0015894630735465585, "train_loss": 0.4218697710752487, "epoch": 267}
{"train_lr": 0.001586118898131038, "train_loss": 0.42191931760907175, "epoch": 268}
{"train_lr": 0.0015827647076461402, "train_loss": 0.4217308155596256, "epoch": 269}
{"train_lr": 0.0015794005594057226, "train_loss": 0.4218587208151817, "epoch": 270}
{"train_lr": 0.0015760265108938055, "train_loss": 0.4217528022646904, "epoch": 271}
{"train_lr": 0.001572642619763563, "train_loss": 0.421679973757267, "epoch": 272}
{"train_lr": 0.0015692489438363627, "train_loss": 0.4217708421468735, "epoch": 273}
{"train_lr": 0.001565845541100755, "train_loss": 0.4216467033326626, "epoch": 274}
{"train_lr": 0.001562432469711511, "train_loss": 0.42169866006374357, "epoch": 275}
{"train_lr": 0.0015590097879886, "train_loss": 0.42156042192578314, "epoch": 276}
{"train_lr": 0.001555577554416206, "train_loss": 0.42161925470232964, "epoch": 277}
{"train_lr": 0.0015521358276417347, "train_loss": 0.42153908587694167, "epoch": 278}
{"train_lr": 0.0015486846664748033, "train_loss": 0.4215101927101612, "epoch": 279}
{"train_lr": 0.0015452241298862248, "train_loss": 0.4214610160768032, "epoch": 280}
{"train_lr": 0.0015417542770070323, "train_loss": 0.42141325249671935, "epoch": 281}
{"train_lr": 0.0015382751671274308, "train_loss": 0.42136881043314933, "epoch": 282}
{"train_lr": 0.0015347868596958091, "train_loss": 0.42135062956213953, "epoch": 283}
{"train_lr": 0.0015312894143177202, "train_loss": 0.42139784327149393, "epoch": 284}
{"train_lr": 0.0015277828907548521, "train_loss": 0.4214449079275131, "epoch": 285}
{"train_lr": 0.001524267348924025, "train_loss": 0.4213422214746475, "epoch": 286}
{"train_lr": 0.0015207428488961414, "train_loss": 0.42129106523990634, "epoch": 287}
{"train_lr": 0.0015172094508951826, "train_loss": 0.42131546414494514, "epoch": 288}
{"train_lr": 0.0015136672152971753, "train_loss": 0.4212149278342724, "epoch": 289}
{"train_lr": 0.0015101162026291506, "train_loss": 0.42106798495054243, "epoch": 290}
{"train_lr": 0.001506556473568119, "train_loss": 0.42114609475135806, "epoch": 291}
{"train_lr": 0.0015029880889400262, "train_loss": 0.42112620157003405, "epoch": 292}
{"train_lr": 0.001499411109718721, "train_loss": 0.4210899014830589, "epoch": 293}
{"train_lr": 0.001495825597024904, "train_loss": 0.42102030997872353, "epoch": 294}
{"train_lr": 0.0014922316121251074, "train_loss": 0.4210644329071045, "epoch": 295}
{"train_lr": 0.0014886292164306054, "train_loss": 0.42094684926271436, "epoch": 296}
{"train_lr": 0.001485018471496406, "train_loss": 0.420904375231266, "epoch": 297}
{"train_lr": 0.001481399439020176, "train_loss": 0.4209073343873024, "epoch": 298}
{"train_lr": 0.0014777721808411927, "train_loss": 0.4208303572535515, "epoch": 299}
{"train_lr": 0.0014741367589392984, "train_loss": 0.420840155172348, "epoch": 300}
{"train_lr": 0.001470493235433814, "train_loss": 0.42079361829161643, "epoch": 301}
{"train_lr": 0.0014668416725825066, "train_loss": 0.420751271378994, "epoch": 302}
{"train_lr": 0.0014631821327805124, "train_loss": 0.42070620072484016, "epoch": 303}
{"train_lr": 0.0014595146785592672, "train_loss": 0.4206903719842434, "epoch": 304}
{"train_lr": 0.00145583937258545, "train_loss": 0.4207553890287876, "epoch": 305}
{"train_lr": 0.001452156277659891, "train_loss": 0.42065541954040525, "epoch": 306}
{"train_lr": 0.0014484654567165239, "train_loss": 0.4206352675974369, "epoch": 307}
{"train_lr": 0.0014447669728213, "train_loss": 0.420621358191967, "epoch": 308}
{"train_lr": 0.0014410608891710992, "train_loss": 0.42055000742673876, "epoch": 309}
{"train_lr": 0.0014373472690926664, "train_loss": 0.4204847206771374, "epoch": 310}
{"train_lr": 0.0014336261760415228, "train_loss": 0.4204664314568043, "epoch": 311}
{"train_lr": 0.0014298976736008813, "train_loss": 0.42043020857572555, "epoch": 312}
{"train_lr": 0.001426161825480565, "train_loss": 0.42040675433278085, "epoch": 313}
{"train_lr": 0.0014224186955159059, "train_loss": 0.42036361072659495, "epoch": 314}
{"train_lr": 0.001418668347666667, "train_loss": 0.42047722015976907, "epoch": 315}
{"train_lr": 0.001414910846015954, "train_loss": 0.4203856301009655, "epoch": 316}
{"train_lr": 0.0014111462547690917, "train_loss": 0.42029333937168123, "epoch": 317}
{"train_lr": 0.0014073746382525652, "train_loss": 0.4202634672820568, "epoch": 318}
{"train_lr": 0.0014035960609128908, "train_loss": 0.4202524435698986, "epoch": 319}
{"train_lr": 0.0013998105873155328, "train_loss": 0.4202196150660515, "epoch": 320}
{"train_lr": 0.0013960182821437879, "train_loss": 0.4202494762778282, "epoch": 321}
{"train_lr": 0.001392219210197692, "train_loss": 0.42015298603773116, "epoch": 322}
{"train_lr": 0.0013884134363928921, "train_loss": 0.4201268202781677, "epoch": 323}
{"train_lr": 0.001384601025759574, "train_loss": 0.419998131608963, "epoch": 324}
{"train_lr": 0.001380782043441313, "train_loss": 0.42012175452113154, "epoch": 325}
{"train_lr": 0.0013769565546939756, "train_loss": 0.4199835945248604, "epoch": 326}
{"train_lr": 0.001373124624884616, "train_loss": 0.4199679668843746, "epoch": 327}
{"train_lr": 0.0013692863194903408, "train_loss": 0.41995242735147476, "epoch": 328}
{"train_lr": 0.0013654417040971938, "train_loss": 0.419914648014307, "epoch": 329}
{"train_lr": 0.0013615908443990496, "train_loss": 0.420291811478138, "epoch": 330}
{"train_lr": 0.0013577338061964764, "train_loss": 0.42001431497335434, "epoch": 331}
{"train_lr": 0.0013538706553956092, "train_loss": 0.41982507169246674, "epoch": 332}
{"train_lr": 0.0013500014580070398, "train_loss": 0.4198868880212307, "epoch": 333}
{"train_lr": 0.0013461262801446774, "train_loss": 0.41981268939375876, "epoch": 334}
{"train_lr": 0.0013422451880246203, "train_loss": 0.4197859157443047, "epoch": 335}
{"train_lr": 0.0013383582479640172, "train_loss": 0.4197030574500561, "epoch": 336}
{"train_lr": 0.0013344655263799582, "train_loss": 0.41963064196109773, "epoch": 337}
{"train_lr": 0.0013305670897883135, "train_loss": 0.41961017757058144, "epoch": 338}
{"train_lr": 0.0013266630048026041, "train_loss": 0.41970578683018683, "epoch": 339}
{"train_lr": 0.00132275333813287, "train_loss": 0.4195633431851864, "epoch": 340}
{"train_lr": 0.001318838156584536, "train_loss": 0.41961616225242615, "epoch": 341}
{"train_lr": 0.0013149175270572404, "train_loss": 0.419570646417141, "epoch": 342}
{"train_lr": 0.0013109915165437332, "train_loss": 0.41954742604494094, "epoch": 343}
{"train_lr": 0.0013070601921287021, "train_loss": 0.4194275137424469, "epoch": 344}
{"train_lr": 0.001303123620987628, "train_loss": 0.41942608463168146, "epoch": 345}
{"train_lr": 0.0012991818703856554, "train_loss": 0.4194012299001217, "epoch": 346}
{"train_lr": 0.0012952350076764231, "train_loss": 0.41930887975096703, "epoch": 347}
{"train_lr": 0.00129128310030093, "train_loss": 0.4193776847779751, "epoch": 348}
{"train_lr": 0.0012873262157863646, "train_loss": 0.4193605829834938, "epoch": 349}
{"train_lr": 0.0012833644217449664, "train_loss": 0.4192501567542553, "epoch": 350}
{"train_lr": 0.0012793977858728675, "train_loss": 0.4192127873659134, "epoch": 351}
{"train_lr": 0.00127542637594893, "train_loss": 0.4193183109641075, "epoch": 352}
{"train_lr": 0.0012714502598335897, "train_loss": 0.4197004640817642, "epoch": 353}
{"train_lr": 0.0012674695054677005, "train_loss": 0.41917526848316194, "epoch": 354}
{"train_lr": 0.0012634841808713748, "train_loss": 0.41914406824707984, "epoch": 355}
{"train_lr": 0.0012594943541428109, "train_loss": 0.4190760906219482, "epoch": 356}
{"train_lr": 0.0012555000934571397, "train_loss": 0.419058157235384, "epoch": 357}
{"train_lr": 0.0012515014670652586, "train_loss": 0.419025038343668, "epoch": 358}
{"train_lr": 0.0012474985432926558, "train_loss": 0.4189569546878338, "epoch": 359}
{"train_lr": 0.001243491390538254, "train_loss": 0.4190199301660061, "epoch": 360}
{"train_lr": 0.0012394800772732412, "train_loss": 0.4189968164920807, "epoch": 361}
{"train_lr": 0.0012354646720398926, "train_loss": 0.41894257601499557, "epoch": 362}
{"train_lr": 0.001231445243450402, "train_loss": 0.41891998412013054, "epoch": 363}
{"train_lr": 0.0012274218601857198, "train_loss": 0.41875716477632524, "epoch": 364}
{"train_lr": 0.0012233945909943611, "train_loss": 0.4189456850349903, "epoch": 365}
{"train_lr": 0.001219363504691245, "train_loss": 0.41879626615047455, "epoch": 366}
{"train_lr": 0.0012153286701565129, "train_loss": 0.4187718325734138, "epoch": 367}
{"train_lr": 0.0012112901563343563, "train_loss": 0.4186474060893059, "epoch": 368}
{"train_lr": 0.0012072480322318328, "train_loss": 0.4186492353022099, "epoch": 369}
{"train_lr": 0.0012032023669176915, "train_loss": 0.4186739155292511, "epoch": 370}
{"train_lr": 0.0011991532295211936, "train_loss": 0.41872328140735626, "epoch": 371}
{"train_lr": 0.001195100689230918, "train_loss": 0.4187125334382057, "epoch": 372}
{"train_lr": 0.0011910448152936013, "train_loss": 0.4187649071574211, "epoch": 373}
{"train_lr": 0.00118698567701294, "train_loss": 0.41862554777264593, "epoch": 374}
{"train_lr": 0.001182923343748406, "train_loss": 0.418472838807106, "epoch": 375}
{"train_lr": 0.0011788578849140647, "train_loss": 0.4184612022995949, "epoch": 376}
{"train_lr": 0.00117478936997739, "train_loss": 0.418489412689209, "epoch": 377}
{"train_lr": 0.001170717868458082, "train_loss": 0.4183967174947262, "epoch": 378}
{"train_lr": 0.001166643449926863, "train_loss": 0.4184104426383972, "epoch": 379}
{"train_lr": 0.0011625661840043084, "train_loss": 0.41830870187282565, "epoch": 380}
{"train_lr": 0.0011584861403596384, "train_loss": 0.41836045224666596, "epoch": 381}
{"train_lr": 0.0011544033887095435, "train_loss": 0.41827855964899063, "epoch": 382}
{"train_lr": 0.0011503179988169893, "train_loss": 0.41831054545640944, "epoch": 383}
{"train_lr": 0.001146230040490009, "train_loss": 0.41834157658815385, "epoch": 384}
{"train_lr": 0.0011421395835805358, "train_loss": 0.41814741303920744, "epoch": 385}
{"train_lr": 0.0011380466979831925, "train_loss": 0.41818422635793684, "epoch": 386}
{"train_lr": 0.0011339514536341003, "train_loss": 0.418172834277153, "epoch": 387}
{"train_lr": 0.001129853920509686, "train_loss": 0.4181679087162018, "epoch": 388}
{"train_lr": 0.0011257541686254895, "train_loss": 0.4180516511440277, "epoch": 389}
{"train_lr": 0.0011216522680349492, "train_loss": 0.41804933690428736, "epoch": 390}
{"train_lr": 0.0011175482888282399, "train_loss": 0.4180680680811405, "epoch": 391}
{"train_lr": 0.0011134423011310347, "train_loss": 0.4179827343761921, "epoch": 392}
{"train_lr": 0.0011093343751033356, "train_loss": 0.4179728990733623, "epoch": 393}
{"train_lr": 0.0011052245809382672, "train_loss": 0.4179292483329773, "epoch": 394}
{"train_lr": 0.0011011129888608734, "train_loss": 0.41794585397839545, "epoch": 395}
{"train_lr": 0.0010969996691269118, "train_loss": 0.41799348885416987, "epoch": 396}
{"train_lr": 0.0010928846920216773, "train_loss": 0.41798636142015455, "epoch": 397}
{"train_lr": 0.0010887681278587693, "train_loss": 0.4178778306603432, "epoch": 398}
{"train_lr": 0.0010846500469789088, "train_loss": 0.417874898070097, "epoch": 399}
{"train_lr": 0.0010805305197487387, "train_loss": 0.4177279465615749, "epoch": 400}
{"train_lr": 0.001076409616559617, "train_loss": 0.4177750180602074, "epoch": 401}
{"train_lr": 0.001072287407826403, "train_loss": 0.41769819692969323, "epoch": 402}
{"train_lr": 0.0010681639639862738, "train_loss": 0.4177047014296055, "epoch": 403}
{"train_lr": 0.0010640393554975105, "train_loss": 0.41777194578647614, "epoch": 404}
{"train_lr": 0.001059913652838287, "train_loss": 0.4176086929380894, "epoch": 405}
{"train_lr": 0.0010557869265054776, "train_loss": 0.41784522614479064, "epoch": 406}
{"train_lr": 0.0010516592470134524, "train_loss": 0.4175245689034462, "epoch": 407}
{"train_lr": 0.0010475306848928647, "train_loss": 0.41752753249406815, "epoch": 408}
{"train_lr": 0.0010434013106894533, "train_loss": 0.41756826764941213, "epoch": 409}
{"train_lr": 0.0010392711949628248, "train_loss": 0.417456934183836, "epoch": 410}
{"train_lr": 0.00103514040828526, "train_loss": 0.4174256393015385, "epoch": 411}
{"train_lr": 0.001031009021240512, "train_loss": 0.4173729620695114, "epoch": 412}
{"train_lr": 0.0010268771044225837, "train_loss": 0.41735645656585696, "epoch": 413}
{"train_lr": 0.0010227447284345357, "train_loss": 0.4173586934030056, "epoch": 414}
{"train_lr": 0.0010186119638872688, "train_loss": 0.4173215918242931, "epoch": 415}
{"train_lr": 0.001014478881398324, "train_loss": 0.4172305813729763, "epoch": 416}
{"train_lr": 0.0010103455515906839, "train_loss": 0.4172926494061947, "epoch": 417}
{"train_lr": 0.0010062120450915484, "train_loss": 0.41724464458227156, "epoch": 418}
{"train_lr": 0.0010020784325311383, "train_loss": 0.4171691377878189, "epoch": 419}
{"train_lr": 0.0009979447845414845, "train_loss": 0.4171639740407467, "epoch": 420}
{"train_lr": 0.000993811171755231, "train_loss": 0.41711280400156975, "epoch": 421}
{"train_lr": 0.0009896776648044105, "train_loss": 0.4171565491616726, "epoch": 422}
{"train_lr": 0.0009855443343192564, "train_loss": 0.41707179708480835, "epoch": 423}
{"train_lr": 0.0009814112509269812, "train_loss": 0.4170188140451908, "epoch": 424}
{"train_lr": 0.0009772784852505741, "train_loss": 0.4170406273066998, "epoch": 425}
{"train_lr": 0.0009731461079075985, "train_loss": 0.41711612367033957, "epoch": 426}
{"train_lr": 0.0009690141895089831, "train_loss": 0.4170222055196762, "epoch": 427}
{"train_lr": 0.0009648828006578134, "train_loss": 0.41702341947555543, "epoch": 428}
{"train_lr": 0.0009607520119481245, "train_loss": 0.41691789889335634, "epoch": 429}
{"train_lr": 0.0009566218939636999, "train_loss": 0.4168686304748058, "epoch": 430}
{"train_lr": 0.0009524925172768602, "train_loss": 0.41675924023389815, "epoch": 431}
{"train_lr": 0.0009483639524472556, "train_loss": 0.416854871147871, "epoch": 432}
{"train_lr": 0.000944236270020672, "train_loss": 0.4168514198482037, "epoch": 433}
{"train_lr": 0.0009401095405278129, "train_loss": 0.416757233697176, "epoch": 434}
{"train_lr": 0.0009359838344831006, "train_loss": 0.41670299382805825, "epoch": 435}
{"train_lr": 0.0009318592223834629, "train_loss": 0.4166590934753418, "epoch": 436}
{"train_lr": 0.0009277357747071485, "train_loss": 0.41663964110612867, "epoch": 437}
{"train_lr": 0.0009236135619124953, "train_loss": 0.4165965996146202, "epoch": 438}
{"train_lr": 0.0009194926544367453, "train_loss": 0.41651798075437546, "epoch": 439}
{"train_lr": 0.0009153731226948438, "train_loss": 0.4164986294090748, "epoch": 440}
{"train_lr": 0.0009112550370782172, "train_loss": 0.416437136977911, "epoch": 441}
{"train_lr": 0.0009071384679535845, "train_loss": 0.41646568976044657, "epoch": 442}
{"train_lr": 0.0009030234856617595, "train_loss": 0.41643167090415956, "epoch": 443}
{"train_lr": 0.0008989101605164331, "train_loss": 0.41652717319726945, "epoch": 444}
{"train_lr": 0.0008947985628029826, "train_loss": 0.41643864707946776, "epoch": 445}
{"train_lr": 0.000890688762777271, "train_loss": 0.4163997540950775, "epoch": 446}
{"train_lr": 0.000886580830664437, "train_loss": 0.41629073085188867, "epoch": 447}
{"train_lr": 0.000882474836657711, "train_loss": 0.41629329221844674, "epoch": 448}
{"train_lr": 0.0008783708509171996, "train_loss": 0.4162357913553715, "epoch": 449}
{"train_lr": 0.0008742689435686971, "train_loss": 0.41620945250988006, "epoch": 450}
{"train_lr": 0.0008701691847024806, "train_loss": 0.4162765025675297, "epoch": 451}
{"train_lr": 0.0008660716443721178, "train_loss": 0.4162437853038311, "epoch": 452}
{"train_lr": 0.0008619763925932672, "train_loss": 0.4160850357532501, "epoch": 453}
{"train_lr": 0.000857883499342485, "train_loss": 0.41610757068395615, "epoch": 454}
{"train_lr": 0.0008537930345560229, "train_loss": 0.4160928344607353, "epoch": 455}
{"train_lr": 0.0008497050681286344, "train_loss": 0.4160299357116222, "epoch": 456}
{"train_lr": 0.0008456196699123931, "train_loss": 0.4160114522874355, "epoch": 457}
{"train_lr": 0.0008415369097154786, "train_loss": 0.4159763306438923, "epoch": 458}
{"train_lr": 0.0008374568573009967, "train_loss": 0.41603127918839455, "epoch": 459}
{"train_lr": 0.0008333795823857903, "train_loss": 0.41598988704681394, "epoch": 460}
{"train_lr": 0.0008293051546392356, "train_loss": 0.4159310473740101, "epoch": 461}
{"train_lr": 0.0008252336436820601, "train_loss": 0.415981581813097, "epoch": 462}
{"train_lr": 0.0008211651190851549, "train_loss": 0.41578987702727316, "epoch": 463}
{"train_lr": 0.000817099650368378, "train_loss": 0.41580206685066223, "epoch": 464}
{"train_lr": 0.0008130373069993725, "train_loss": 0.41571778808832166, "epoch": 465}
{"train_lr": 0.0008089781583923796, "train_loss": 0.41572712430357933, "epoch": 466}
{"train_lr": 0.0008049222739070492, "train_loss": 0.41574336388111116, "epoch": 467}
{"train_lr": 0.0008008697228472562, "train_loss": 0.4156535137236118, "epoch": 468}
{"train_lr": 0.0007968205744599162, "train_loss": 0.4156419990241528, "epoch": 469}
{"train_lr": 0.0007927748979338039, "train_loss": 0.4155884074151516, "epoch": 470}
{"train_lr": 0.0007887327623983688, "train_loss": 0.4156378916442394, "epoch": 471}
{"train_lr": 0.0007846942369225543, "train_loss": 0.4155085301876068, "epoch": 472}
{"train_lr": 0.0007806593905136176, "train_loss": 0.4155448598384857, "epoch": 473}
{"train_lr": 0.0007766282921159524, "train_loss": 0.4154927032291889, "epoch": 474}
{"train_lr": 0.0007726010106099076, "train_loss": 0.41546733177900314, "epoch": 475}
{"train_lr": 0.0007685776148106116, "train_loss": 0.4154239023923874, "epoch": 476}
{"train_lr": 0.0007645581734668001, "train_loss": 0.41537334437966345, "epoch": 477}
{"train_lr": 0.0007605427552596346, "train_loss": 0.4154018564403057, "epoch": 478}
{"train_lr": 0.0007565314288015307, "train_loss": 0.4154400738298893, "epoch": 479}
{"train_lr": 0.0007525242626349935, "train_loss": 0.41526551213860513, "epoch": 480}
{"train_lr": 0.0007485213252314344, "train_loss": 0.41534639605283735, "epoch": 481}
{"train_lr": 0.0007445226849900115, "train_loss": 0.41517547313570974, "epoch": 482}
{"train_lr": 0.0007405284102364519, "train_loss": 0.41520622568130494, "epoch": 483}
{"train_lr": 0.0007365385692218902, "train_loss": 0.4151805117607117, "epoch": 484}
{"train_lr": 0.0007325532301217024, "train_loss": 0.4151923873543739, "epoch": 485}
{"train_lr": 0.0007285724610343378, "train_loss": 0.415164637196064, "epoch": 486}
{"train_lr": 0.0007245963299801566, "train_loss": 0.41513061105012894, "epoch": 487}
{"train_lr": 0.0007206249049002679, "train_loss": 0.41505594806075097, "epoch": 488}
{"train_lr": 0.000716658253655366, "train_loss": 0.414974316573143, "epoch": 489}
{"train_lr": 0.0007126964440245807, "train_loss": 0.4150249040722847, "epoch": 490}
{"train_lr": 0.0007087395437043058, "train_loss": 0.41488441542983057, "epoch": 491}
{"train_lr": 0.00070478762030705, "train_loss": 0.4148910955309868, "epoch": 492}
{"train_lr": 0.0007008407413602802, "train_loss": 0.41482908695936205, "epoch": 493}
{"train_lr": 0.000696898974305269, "train_loss": 0.4148184060752392, "epoch": 494}
{"train_lr": 0.000692962386495939, "train_loss": 0.4147723206758499, "epoch": 495}
{"train_lr": 0.0006890310451977145, "train_loss": 0.4147319468975067, "epoch": 496}
{"train_lr": 0.0006851050175863707, "train_loss": 0.41478028755784035, "epoch": 497}
{"train_lr": 0.0006811843707468876, "train_loss": 0.41468667683005334, "epoch": 498}
{"train_lr": 0.0006772691716723045, "train_loss": 0.4146990427553654, "epoch": 499}
{"train_lr": 0.0006733594872625652, "train_loss": 0.4146124188661575, "epoch": 500}
{"train_lr": 0.0006694553843233956, "train_loss": 0.41460838395953176, "epoch": 501}
{"train_lr": 0.000665556929565141, "train_loss": 0.4146430678844452, "epoch": 502}
{"train_lr": 0.0006616641896016334, "train_loss": 0.41454836529493333, "epoch": 503}
{"train_lr": 0.0006577772309490656, "train_loss": 0.4145636016011238, "epoch": 504}
{"train_lr": 0.0006538961200248293, "train_loss": 0.4144807538509369, "epoch": 505}
{"train_lr": 0.0006500209231464063, "train_loss": 0.4144996554195881, "epoch": 506}
{"train_lr": 0.0006461517065302167, "train_loss": 0.41448832686543463, "epoch": 507}
{"train_lr": 0.0006422885362904992, "train_loss": 0.41441225247979163, "epoch": 508}
{"train_lr": 0.0006384314784381729, "train_loss": 0.41435343540906905, "epoch": 509}
{"train_lr": 0.000634580598879715, "train_loss": 0.41432497901916504, "epoch": 510}
{"train_lr": 0.0006307359634160299, "train_loss": 0.4141963863253593, "epoch": 511}
{"train_lr": 0.0006268976377413344, "train_loss": 0.414292369222641, "epoch": 512}
{"train_lr": 0.0006230656874420206, "train_loss": 0.41412822899222373, "epoch": 513}
{"train_lr": 0.000619240177995549, "train_loss": 0.41413087169528007, "epoch": 514}
{"train_lr": 0.0006154211747693183, "train_loss": 0.4142154009103775, "epoch": 515}
{"train_lr": 0.0006116087430195577, "train_loss": 0.4141320895433426, "epoch": 516}
{"train_lr": 0.0006078029478902082, "train_loss": 0.41410443152785303, "epoch": 517}
{"train_lr": 0.0006040038544118062, "train_loss": 0.41408611317276955, "epoch": 518}
{"train_lr": 0.0006002115275003778, "train_loss": 0.41404432806372643, "epoch": 519}
{"train_lr": 0.0005964260319563274, "train_loss": 0.41398654327988627, "epoch": 520}
{"train_lr": 0.0005926474324633267, "train_loss": 0.41391335440278054, "epoch": 521}
{"train_lr": 0.0005888757935872201, "train_loss": 0.41387077738046646, "epoch": 522}
{"train_lr": 0.0005851111797749066, "train_loss": 0.41397186594605445, "epoch": 523}
{"train_lr": 0.0005813536553532483, "train_loss": 0.4139413024187088, "epoch": 524}
{"train_lr": 0.0005776032845279719, "train_loss": 0.4138102644562721, "epoch": 525}
{"train_lr": 0.0005738601313825683, "train_loss": 0.4137563929796219, "epoch": 526}
{"train_lr": 0.0005701242598771955, "train_loss": 0.41368419902324677, "epoch": 527}
{"train_lr": 0.0005663957338475891, "train_loss": 0.4137420842349529, "epoch": 528}
{"train_lr": 0.0005626746170039725, "train_loss": 0.41368860872387886, "epoch": 529}
{"train_lr": 0.0005589609729299664, "train_loss": 0.41366335294246676, "epoch": 530}
{"train_lr": 0.0005552548650815012, "train_loss": 0.4136664641916752, "epoch": 531}
{"train_lr": 0.0005515563567857334, "train_loss": 0.41364744307994844, "epoch": 532}
{"train_lr": 0.0005478655112399664, "train_loss": 0.4135095750927925, "epoch": 533}
{"train_lr": 0.0005441823915105678, "train_loss": 0.4134646384775639, "epoch": 534}
{"train_lr": 0.0005405070605318911, "train_loss": 0.4135267463207245, "epoch": 535}
{"train_lr": 0.0005368395811052013, "train_loss": 0.41346614977121354, "epoch": 536}
{"train_lr": 0.000533180015897602, "train_loss": 0.41341310681700705, "epoch": 537}
{"train_lr": 0.0005295284274409709, "train_loss": 0.41329991322159765, "epoch": 538}
{"train_lr": 0.0005258848781308736, "train_loss": 0.41334705371260644, "epoch": 539}
{"train_lr": 0.0005222494302255165, "train_loss": 0.41332384219169616, "epoch": 540}
{"train_lr": 0.0005186221458446746, "train_loss": 0.41331451881527903, "epoch": 541}
{"train_lr": 0.0005150030869686313, "train_loss": 0.4133096279680729, "epoch": 542}
{"train_lr": 0.0005113923154371142, "train_loss": 0.41333488993048667, "epoch": 543}
{"train_lr": 0.0005077898929482494, "train_loss": 0.41325920339226724, "epoch": 544}
{"train_lr": 0.0005041958810574948, "train_loss": 0.41315065550804136, "epoch": 545}
{"train_lr": 0.0005006103411766005, "train_loss": 0.41317506961226463, "epoch": 546}
{"train_lr": 0.0004970333345725481, "train_loss": 0.4131286765635014, "epoch": 547}
{"train_lr": 0.0004934649223665127, "train_loss": 0.41310886276960374, "epoch": 548}
{"train_lr": 0.0004899051655328116, "train_loss": 0.4130334359705448, "epoch": 549}
{"train_lr": 0.0004863541248978668, "train_loss": 0.4128937359213829, "epoch": 550}
{"train_lr": 0.00048281186113916804, "train_loss": 0.413018404263258, "epoch": 551}
{"train_lr": 0.00047927843478422894, "train_loss": 0.4130131136238575, "epoch": 552}
{"train_lr": 0.00047575390620955427, "train_loss": 0.41287013072967527, "epoch": 553}
{"train_lr": 0.00047223833563961505, "train_loss": 0.4128674404680729, "epoch": 554}
{"train_lr": 0.00046873178314581177, "train_loss": 0.41282065522670747, "epoch": 555}
{"train_lr": 0.00046523430864545227, "train_loss": 0.412801239490509, "epoch": 556}
{"train_lr": 0.00046174597190072565, "train_loss": 0.4127468424975872, "epoch": 557}
{"train_lr": 0.0004582668325176823, "train_loss": 0.41264703783988954, "epoch": 558}
{"train_lr": 0.000454796949945214, "train_loss": 0.412723533976078, "epoch": 559}
{"train_lr": 0.0004513363834740404, "train_loss": 0.4126707662463188, "epoch": 560}
{"train_lr": 0.0004478851922356962, "train_loss": 0.4126263898909092, "epoch": 561}
{"train_lr": 0.0004444434352015155, "train_loss": 0.4126412259161472, "epoch": 562}
{"train_lr": 0.0004410111711816321, "train_loss": 0.4125005640268326, "epoch": 563}
{"train_lr": 0.0004375884588239656, "train_loss": 0.41252969363331793, "epoch": 564}
{"train_lr": 0.0004341753566132277, "train_loss": 0.4123950005233288, "epoch": 565}
{"train_lr": 0.0004307719228699184, "train_loss": 0.4124559945344925, "epoch": 566}
{"train_lr": 0.0004273782157493301, "train_loss": 0.41243081186413766, "epoch": 567}
{"train_lr": 0.00042399429324055236, "train_loss": 0.41239919402599334, "epoch": 568}
{"train_lr": 0.0004206202131654863, "train_loss": 0.4123308017849922, "epoch": 569}
{"train_lr": 0.000417256033177851, "train_loss": 0.4123557644248009, "epoch": 570}
{"train_lr": 0.00041390181076219907, "train_loss": 0.41225514442920685, "epoch": 571}
{"train_lr": 0.0004105576032329374, "train_loss": 0.41224638593196866, "epoch": 572}
{"train_lr": 0.0004072234677333462, "train_loss": 0.4121566233634949, "epoch": 573}
{"train_lr": 0.000403899461234601, "train_loss": 0.4122022950172424, "epoch": 574}
{"train_lr": 0.0004005856405348028, "train_loss": 0.4122386267721653, "epoch": 575}
{"train_lr": 0.00039728206225800316, "train_loss": 0.4121166242182255, "epoch": 576}
{"train_lr": 0.0003939887828532405, "train_loss": 0.41211722364425657, "epoch": 577}
{"train_lr": 0.00039070585859357225, "train_loss": 0.41196879163384437, "epoch": 578}
{"train_lr": 0.00038743334557511883, "train_loss": 0.4120268380403519, "epoch": 579}
{"train_lr": 0.00038417129971609465, "train_loss": 0.4120321435570717, "epoch": 580}
{"train_lr": 0.0003809197767558675, "train_loss": 0.4119880166888237, "epoch": 581}
{"train_lr": 0.00037767883225399033, "train_loss": 0.41182354040145874, "epoch": 582}
{"train_lr": 0.00037444852158926347, "train_loss": 0.4119151137650013, "epoch": 583}
{"train_lr": 0.00037122889995878434, "train_loss": 0.41178027091026304, "epoch": 584}
{"train_lr": 0.00036802002237700215, "train_loss": 0.41189671708345416, "epoch": 585}
{"train_lr": 0.0003648219436747815, "train_loss": 0.4118088481903076, "epoch": 586}
{"train_lr": 0.00036163471849846445, "train_loss": 0.41158689913749696, "epoch": 587}
{"train_lr": 0.00035845840130893473, "train_loss": 0.4116609573543072, "epoch": 588}
{"train_lr": 0.00035529304638068815, "train_loss": 0.4116432239770889, "epoch": 589}
{"train_lr": 0.0003521387078009091, "train_loss": 0.4116695198178291, "epoch": 590}
{"train_lr": 0.0003489954394685392, "train_loss": 0.4116169459104538, "epoch": 591}
{"train_lr": 0.000345863295093364, "train_loss": 0.4115727410554886, "epoch": 592}
{"train_lr": 0.0003427423281950851, "train_loss": 0.41158620098233223, "epoch": 593}
{"train_lr": 0.00033963259210241883, "train_loss": 0.41150212720036505, "epoch": 594}
{"train_lr": 0.00033653413995217435, "train_loss": 0.41141462765336034, "epoch": 595}
{"train_lr": 0.00033344702468834903, "train_loss": 0.4113722758948803, "epoch": 596}
{"train_lr": 0.00033037129906122623, "train_loss": 0.41129573442935946, "epoch": 597}
{"train_lr": 0.0003273070156264704, "train_loss": 0.41129547247886655, "epoch": 598}
{"train_lr": 0.0003242542267442306, "train_loss": 0.4113450105786324, "epoch": 599}
{"train_lr": 0.0003212129845782456, "train_loss": 0.411285870462656, "epoch": 600}
{"train_lr": 0.0003181833410949536, "train_loss": 0.41130744271874425, "epoch": 601}
{"train_lr": 0.00031516534806260186, "train_loss": 0.4112095928132534, "epoch": 602}
{"train_lr": 0.00031215905705036536, "train_loss": 0.41113772990703584, "epoch": 603}
{"train_lr": 0.0003091645194274621, "train_loss": 0.41113032053112986, "epoch": 604}
{"train_lr": 0.0003061817863622778, "train_loss": 0.4110891651570797, "epoch": 605}
{"train_lr": 0.00030321090882149234, "train_loss": 0.41110460319519043, "epoch": 606}
{"train_lr": 0.0003002519375692042, "train_loss": 0.41107726674675943, "epoch": 607}
{"train_lr": 0.00029730492316606825, "train_loss": 0.4110739596545696, "epoch": 608}
{"train_lr": 0.0002943699159684297, "train_loss": 0.4109533204615116, "epoch": 609}
{"train_lr": 0.00029144696612746454, "train_loss": 0.41088306730389595, "epoch": 610}
{"train_lr": 0.0002885361235883199, "train_loss": 0.41095819348096846, "epoch": 611}
{"train_lr": 0.0002856374380892637, "train_loss": 0.41093446829319, "epoch": 612}
{"train_lr": 0.00028275095916083335, "train_loss": 0.41092277715802195, "epoch": 613}
{"train_lr": 0.00027987673612499026, "train_loss": 0.41091884284615515, "epoch": 614}
{"train_lr": 0.00027701481809427403, "train_loss": 0.41077308706641197, "epoch": 615}
{"train_lr": 0.0002741652539709704, "train_loss": 0.41076149238944054, "epoch": 616}
{"train_lr": 0.0002713280924462657, "train_loss": 0.41067302731275557, "epoch": 617}
{"train_lr": 0.00026850338199942207, "train_loss": 0.4106996956408024, "epoch": 618}
{"train_lr": 0.0002656911708969498, "train_loss": 0.41060551152825353, "epoch": 619}
{"train_lr": 0.0002628915071917763, "train_loss": 0.41057525554299357, "epoch": 620}
{"train_lr": 0.0002601044387224285, "train_loss": 0.4105493293166161, "epoch": 621}
{"train_lr": 0.0002573300131122188, "train_loss": 0.41071004919409754, "epoch": 622}
{"train_lr": 0.00025456827776842376, "train_loss": 0.41045111640691756, "epoch": 623}
{"train_lr": 0.00025181927988148265, "train_loss": 0.410511493909359, "epoch": 624}
{"train_lr": 0.0002490830664241836, "train_loss": 0.4104461461484432, "epoch": 625}
{"train_lr": 0.0002463596841508659, "train_loss": 0.4104572146654129, "epoch": 626}
{"train_lr": 0.00024364917959661644, "train_loss": 0.41034869700074195, "epoch": 627}
{"train_lr": 0.00024095159907648234, "train_loss": 0.41023331859111783, "epoch": 628}
{"train_lr": 0.0002382669886846699, "train_loss": 0.41035697820782663, "epoch": 629}
{"train_lr": 0.0002355953942937644, "train_loss": 0.4102578080415726, "epoch": 630}
{"train_lr": 0.00023293686155394203, "train_loss": 0.41025401488542557, "epoch": 631}
{"train_lr": 0.00023029143589219285, "train_loss": 0.41027388836741446, "epoch": 632}
{"train_lr": 0.00022765916251154313, "train_loss": 0.4101309650480747, "epoch": 633}
{"train_lr": 0.00022504008639028075, "train_loss": 0.41018197714686394, "epoch": 634}
{"train_lr": 0.00022243425228119063, "train_loss": 0.4102461946487427, "epoch": 635}
{"train_lr": 0.00021984170471078866, "train_loss": 0.41012363595962525, "epoch": 636}
{"train_lr": 0.00021726248797855976, "train_loss": 0.41003916486501696, "epoch": 637}
{"train_lr": 0.0002146966461562013, "train_loss": 0.4100011553347111, "epoch": 638}
{"train_lr": 0.00021214422308687, "train_loss": 0.4099870161771774, "epoch": 639}
{"train_lr": 0.00020960526238443468, "train_loss": 0.409950205296278, "epoch": 640}
{"train_lr": 0.00020707980743272803, "train_loss": 0.40993198407888415, "epoch": 641}
{"train_lr": 0.00020456790138480746, "train_loss": 0.40987456869482997, "epoch": 642}
{"train_lr": 0.00020206958716221631, "train_loss": 0.4099106639921665, "epoch": 643}
{"train_lr": 0.00019958490745425211, "train_loss": 0.40992944944500925, "epoch": 644}
{"train_lr": 0.00019711390471723525, "train_loss": 0.40970903441905976, "epoch": 645}
{"train_lr": 0.00019465662117378513, "train_loss": 0.4097623137831688, "epoch": 646}
{"train_lr": 0.00019221309881209726, "train_loss": 0.4097091728568077, "epoch": 647}
{"train_lr": 0.00018978337938522675, "train_loss": 0.4097723929464817, "epoch": 648}
{"train_lr": 0.00018736750441037523, "train_loss": 0.4096767637908459, "epoch": 649}
{"train_lr": 0.00018496551516817997, "train_loss": 0.4096685712814331, "epoch": 650}
{"train_lr": 0.00018257745270201065, "train_loss": 0.4095007773041725, "epoch": 651}
{"train_lr": 0.00018020335781726479, "train_loss": 0.40950128165483474, "epoch": 652}
{"train_lr": 0.0001778432710806747, "train_loss": 0.4095606074631214, "epoch": 653}
{"train_lr": 0.00017549723281960988, "train_loss": 0.40949765983819963, "epoch": 654}
{"train_lr": 0.00017316528312139175, "train_loss": 0.40952413992881775, "epoch": 655}
{"train_lr": 0.00017084746183260703, "train_loss": 0.4094638512015343, "epoch": 656}
{"train_lr": 0.00016854380855842624, "train_loss": 0.4094694583117962, "epoch": 657}
{"train_lr": 0.00016625436266192763, "train_loss": 0.40931712368130685, "epoch": 658}
{"train_lr": 0.00016397916326342497, "train_loss": 0.4093422090888023, "epoch": 659}
{"train_lr": 0.000161718249239798, "train_loss": 0.4092994294703007, "epoch": 660}
{"train_lr": 0.0001594716592238298, "train_loss": 0.4093663468182087, "epoch": 661}
{"train_lr": 0.00015723943160354516, "train_loss": 0.40929065743684767, "epoch": 662}
{"train_lr": 0.00015502160452155516, "train_loss": 0.4092123525619507, "epoch": 663}
{"train_lr": 0.00015281821587440569, "train_loss": 0.40918805617690085, "epoch": 664}
{"train_lr": 0.00015062930331192866, "train_loss": 0.4091305765867233, "epoch": 665}
{"train_lr": 0.0001484549042366004, "train_loss": 0.40919655148983003, "epoch": 666}
{"train_lr": 0.0001462950558029027, "train_loss": 0.40923569843173024, "epoch": 667}
{"train_lr": 0.0001441497949166853, "train_loss": 0.40912016796469686, "epoch": 668}
{"train_lr": 0.00014201915823453798, "train_loss": 0.4091143898308277, "epoch": 669}
{"train_lr": 0.00013990318216316309, "train_loss": 0.4091158373832703, "epoch": 670}
{"train_lr": 0.00013780190285875329, "train_loss": 0.4089883540272713, "epoch": 671}
{"train_lr": 0.0001357153562263738, "train_loss": 0.40893249164819717, "epoch": 672}
{"train_lr": 0.00013364357791935063, "train_loss": 0.409016412883997, "epoch": 673}
{"train_lr": 0.0001315866033386586, "train_loss": 0.40892095088362695, "epoch": 674}
{"train_lr": 0.00012954446763231708, "train_loss": 0.4089177478671074, "epoch": 675}
{"train_lr": 0.00012751720569479193, "train_loss": 0.4089482992887497, "epoch": 676}
{"train_lr": 0.00012550485216639558, "train_loss": 0.40890288605093955, "epoch": 677}
{"train_lr": 0.0001235074414326978, "train_loss": 0.40893578273653985, "epoch": 678}
{"train_lr": 0.00012152500762393668, "train_loss": 0.40879338170886037, "epoch": 679}
{"train_lr": 0.00011955758461443642, "train_loss": 0.40870585800409315, "epoch": 680}
{"train_lr": 0.0001176052060220283, "train_loss": 0.408755088865757, "epoch": 681}
{"train_lr": 0.00011566790520747518, "train_loss": 0.4087392102777958, "epoch": 682}
{"train_lr": 0.00011374571527390314, "train_loss": 0.40866463065743447, "epoch": 683}
{"train_lr": 0.0001118386690662345, "train_loss": 0.4087050619006157, "epoch": 684}
{"train_lr": 0.00010994679917062744, "train_loss": 0.4086720600247383, "epoch": 685}
{"train_lr": 0.000108070137913918, "train_loss": 0.40857414263486863, "epoch": 686}
{"train_lr": 0.00010620871736307003, "train_loss": 0.40863434770703316, "epoch": 687}
{"train_lr": 0.00010436256932462424, "train_loss": 0.40859491340518, "epoch": 688}
{"train_lr": 0.00010253172534415723, "train_loss": 0.40860966989994046, "epoch": 689}
{"train_lr": 0.00010071621670574097, "train_loss": 0.408625454801321, "epoch": 690}
{"train_lr": 9.891607443140929e-05, "train_loss": 0.40844214201569556, "epoch": 691}
{"train_lr": 9.713132928062657e-05, "train_loss": 0.40843296210169794, "epoch": 692}
{"train_lr": 9.536201174976322e-05, "train_loss": 0.40837096125483513, "epoch": 693}
{"train_lr": 9.360815207157413e-05, "train_loss": 0.4083694005072117, "epoch": 694}
{"train_lr": 9.186978021468215e-05, "train_loss": 0.4084002661764622, "epoch": 695}
{"train_lr": 9.014692588306594e-05, "train_loss": 0.40843813487291336, "epoch": 696}
{"train_lr": 8.84396185155527e-05, "train_loss": 0.40834322509765625, "epoch": 697}
{"train_lr": 8.67478872853143e-05, "train_loss": 0.4083211016476154, "epoch": 698}
{"train_lr": 8.507176109937047e-05, "train_loss": 0.4082286029994488, "epoch": 699}
{"train_lr": 8.341126859809256e-05, "train_loss": 0.40823151443004607, "epoch": 700}
{"train_lr": 8.176643815471623e-05, "train_loss": 0.40823154353499413, "epoch": 701}
{"train_lr": 8.013729787485531e-05, "train_loss": 0.40827645783424377, "epoch": 702}
{"train_lr": 7.852387559602257e-05, "train_loss": 0.40825580505132675, "epoch": 703}
{"train_lr": 7.692619888715302e-05, "train_loss": 0.4081780993103981, "epoch": 704}
{"train_lr": 7.534429504813323e-05, "train_loss": 0.4081855354487896, "epoch": 705}
{"train_lr": 7.377819110933544e-05, "train_loss": 0.4082311128556728, "epoch": 706}
{"train_lr": 7.222791383115492e-05, "train_loss": 0.4081001627087593, "epoch": 707}
{"train_lr": 7.069348970355303e-05, "train_loss": 0.40801326141357425, "epoch": 708}
{"train_lr": 6.917494494560436e-05, "train_loss": 0.40805929116606715, "epoch": 709}
{"train_lr": 6.767230550504895e-05, "train_loss": 0.4080538489818573, "epoch": 710}
{"train_lr": 6.618559705784932e-05, "train_loss": 0.4080111927628517, "epoch": 711}
{"train_lr": 6.471484500775038e-05, "train_loss": 0.40799329899549486, "epoch": 712}
{"train_lr": 6.326007448584706e-05, "train_loss": 0.4080479858994484, "epoch": 713}
{"train_lr": 6.182131035015343e-05, "train_loss": 0.4079994874477387, "epoch": 714}
{"train_lr": 6.0398577185179195e-05, "train_loss": 0.4078952370584011, "epoch": 715}
{"train_lr": 5.8991899301508436e-05, "train_loss": 0.40794192504286764, "epoch": 716}
{"train_lr": 5.7601300735385406e-05, "train_loss": 0.4079172481238842, "epoch": 717}
{"train_lr": 5.62268052483022e-05, "train_loss": 0.4078769870400429, "epoch": 718}
{"train_lr": 5.4868436326594996e-05, "train_loss": 0.40775742872953413, "epoch": 719}
{"train_lr": 5.352621718104013e-05, "train_loss": 0.4078458012342453, "epoch": 720}
{"train_lr": 5.220017074646012e-05, "train_loss": 0.4077809689939022, "epoch": 721}
{"train_lr": 5.089031968132945e-05, "train_loss": 0.40774403147697447, "epoch": 722}
{"train_lr": 4.959668636738903e-05, "train_loss": 0.4077515964627266, "epoch": 723}
{"train_lr": 4.831929290926272e-05, "train_loss": 0.407721921145916, "epoch": 724}
{"train_lr": 4.705816113408049e-05, "train_loss": 0.40768695514798164, "epoch": 725}
{"train_lr": 4.5813312591104704e-05, "train_loss": 0.4076756275653839, "epoch": 726}
{"train_lr": 4.458476855136227e-05, "train_loss": 0.40769834047555925, "epoch": 727}
{"train_lr": 4.3372550007281185e-05, "train_loss": 0.4076857505738735, "epoch": 728}
{"train_lr": 4.217667767233175e-05, "train_loss": 0.4076809181332588, "epoch": 729}
{"train_lr": 4.0997171980672597e-05, "train_loss": 0.4076770887076855, "epoch": 730}
{"train_lr": 3.9834053086801805e-05, "train_loss": 0.4075366601884365, "epoch": 731}
{"train_lr": 3.868734086521197e-05, "train_loss": 0.40765976741313936, "epoch": 732}
{"train_lr": 3.7557054910051054e-05, "train_loss": 0.40767239355444906, "epoch": 733}
{"train_lr": 3.644321453478749e-05, "train_loss": 0.4076313421726227, "epoch": 734}
{"train_lr": 3.5345838771880166e-05, "train_loss": 0.40756957579255104, "epoch": 735}
{"train_lr": 3.4264946372453015e-05, "train_loss": 0.40758756697773935, "epoch": 736}
{"train_lr": 3.3200555805974955e-05, "train_loss": 0.40753637469410897, "epoch": 737}
{"train_lr": 3.215268525994395e-05, "train_loss": 0.40759654030799863, "epoch": 738}
{"train_lr": 3.1121352639576464e-05, "train_loss": 0.4075975024521351, "epoch": 739}
{"train_lr": 3.0106575567501452e-05, "train_loss": 0.4074262948334217, "epoch": 740}
{"train_lr": 2.9108371383459213e-05, "train_loss": 0.4075006844162941, "epoch": 741}
{"train_lr": 2.8126757144005083e-05, "train_loss": 0.4073981125712395, "epoch": 742}
{"train_lr": 2.7161749622217994e-05, "train_loss": 0.40740938003063204, "epoch": 743}
{"train_lr": 2.6213365307414162e-05, "train_loss": 0.4074016982078552, "epoch": 744}
{"train_lr": 2.5281620404864564e-05, "train_loss": 0.4073709517121315, "epoch": 745}
{"train_lr": 2.4366530835519025e-05, "train_loss": 0.40737549446821214, "epoch": 746}
{"train_lr": 2.3468112235733392e-05, "train_loss": 0.4074480685114861, "epoch": 747}
{"train_lr": 2.2586379957002727e-05, "train_loss": 0.407499808126688, "epoch": 748}
{"train_lr": 2.1721349065698846e-05, "train_loss": 0.40737112711071966, "epoch": 749}
{"train_lr": 2.087303434281305e-05, "train_loss": 0.40735656403303144, "epoch": 750}
{"train_lr": 2.0041450283703275e-05, "train_loss": 0.40729228178858756, "epoch": 751}
{"train_lr": 1.9226611097846807e-05, "train_loss": 0.40734857454895973, "epoch": 752}
{"train_lr": 1.842853070859705e-05, "train_loss": 0.407330923384428, "epoch": 753}
{"train_lr": 1.7647222752945838e-05, "train_loss": 0.40724869443178174, "epoch": 754}
{"train_lr": 1.688270058129047e-05, "train_loss": 0.4072960561275482, "epoch": 755}
{"train_lr": 1.6134977257205462e-05, "train_loss": 0.407342313015461, "epoch": 756}
{"train_lr": 1.5404065557219386e-05, "train_loss": 0.40731965934634207, "epoch": 757}
{"train_lr": 1.4689977970596522e-05, "train_loss": 0.40725169029831887, "epoch": 758}
{"train_lr": 1.3992726699123512e-05, "train_loss": 0.4072245597243309, "epoch": 759}
{"train_lr": 1.3312323656900852e-05, "train_loss": 0.40719416123628616, "epoch": 760}
{"train_lr": 1.2648780470139173e-05, "train_loss": 0.4072723692417145, "epoch": 761}
{"train_lr": 1.2002108476960741e-05, "train_loss": 0.4072173948287964, "epoch": 762}
{"train_lr": 1.1372318727205755e-05, "train_loss": 0.40724221390485765, "epoch": 763}
{"train_lr": 1.0759421982243326e-05, "train_loss": 0.40718788425326347, "epoch": 764}
{"train_lr": 1.0163428714787861e-05, "train_loss": 0.40724759435653685, "epoch": 765}
{"train_lr": 9.584349108719813e-06, "train_loss": 0.40717979621887207, "epoch": 766}
{"train_lr": 9.022193058912006e-06, "train_loss": 0.4071979228913784, "epoch": 767}
{"train_lr": 8.476970171060192e-06, "train_loss": 0.40717670152187346, "epoch": 768}
{"train_lr": 7.948689761519278e-06, "train_loss": 0.40705007915496827, "epoch": 769}
{"train_lr": 7.437360857143847e-06, "train_loss": 0.4072156092405319, "epoch": 770}
{"train_lr": 6.942992195134097e-06, "train_loss": 0.4070780915558338, "epoch": 771}
{"train_lr": 6.465592222886441e-06, "train_loss": 0.4070723837614059, "epoch": 772}
{"train_lr": 6.0051690978492155e-06, "train_loss": 0.40715753821730616, "epoch": 773}
{"train_lr": 5.561730687383275e-06, "train_loss": 0.40711742687225344, "epoch": 774}
{"train_lr": 5.135284568627556e-06, "train_loss": 0.407139888215065, "epoch": 775}
{"train_lr": 4.725838028369653e-06, "train_loss": 0.4070862729489803, "epoch": 776}
{"train_lr": 4.333398062921207e-06, "train_loss": 0.40716656067967416, "epoch": 777}
{"train_lr": 3.957971377998454e-06, "train_loss": 0.4070811638891697, "epoch": 778}
{"train_lr": 3.599564388607613e-06, "train_loss": 0.40715316613912583, "epoch": 779}
{"train_lr": 3.258183218935257e-06, "train_loss": 0.4070707754790783, "epoch": 780}
{"train_lr": 2.9338337022436484e-06, "train_loss": 0.407094335603714, "epoch": 781}
{"train_lr": 2.626521380771149e-06, "train_loss": 0.4070680266022682, "epoch": 782}
{"train_lr": 2.3362515056374043e-06, "train_loss": 0.4070445769608021, "epoch": 783}
{"train_lr": 2.0630290367537063e-06, "train_loss": 0.407051396137476, "epoch": 784}
{"train_lr": 1.8068586427382016e-06, "train_loss": 0.4070886338174343, "epoch": 785}
{"train_lr": 1.5677447008361348e-06, "train_loss": 0.4070832368195057, "epoch": 786}
{"train_lr": 1.3456912968450236e-06, "train_loss": 0.4070368420124054, "epoch": 787}
{"train_lr": 1.140702225044881e-06, "train_loss": 0.40696477791666985, "epoch": 788}
{"train_lr": 9.527809881333541e-07, "train_loss": 0.40711091704964636, "epoch": 789}
{"train_lr": 7.819307971659009e-07, "train_loss": 0.40703405417203903, "epoch": 790}
{"train_lr": 6.281545715008838e-07, "train_loss": 0.4070916808605194, "epoch": 791}
{"train_lr": 4.91454938749716e-07, "train_loss": 0.4070300230205059, "epoch": 792}
{"train_lr": 3.7183423473196524e-07, "train_loss": 0.40707525467276573, "epoch": 793}
{"train_lr": 2.6929450343540397e-07, "train_loss": 0.40699523387551306, "epoch": 794}
{"train_lr": 1.8383749698112992e-07, "train_loss": 0.4070662397742271, "epoch": 795}
{"train_lr": 1.1546467559359906e-07, "train_loss": 0.40707216830849646, "epoch": 796}
{"train_lr": 6.417720757569029e-08, "train_loss": 0.4070766533434391, "epoch": 797}
{"train_lr": 2.9975969288707755e-08, "train_loss": 0.4070338776230812, "epoch": 798}
{"train_lr": 1.2861545137461837e-08, "train_loss": 0.4070114720463753, "epoch": 799}