-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathresults 3 (epoch=100).txt
1701 lines (1701 loc) · 110 KB
/
results 3 (epoch=100).txt
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
Epoch: [ 1], step: [10], time: [2.7649], loss: [0.00109137]
Epoch: [ 1], step: [20], time: [5.4004], loss: [0.00080989]
Epoch: [ 1], step: [30], time: [8.0478], loss: [0.00075109]
Epoch: [ 1], step: [40], time: [10.6777], loss: [0.00255918]
Epoch: [ 1], step: [50], time: [13.3149], loss: [0.00096065]
Epoch: [ 1], step: [60], time: [15.9459], loss: [0.00033348]
Epoch: [ 1], step: [70], time: [18.6621], loss: [0.00175625]
Epoch: [ 1], step: [80], time: [21.7127], loss: [0.00027413]
Epoch: [ 1], step: [90], time: [24.9195], loss: [0.00422178]
Epoch: [ 1], step: [100], time: [27.8999], loss: [0.00770430]
Epoch: [ 1], step: [110], time: [30.8688], loss: [0.00030762]
Epoch: [ 1], step: [120], time: [33.6139], loss: [0.00147307]
Epoch: [ 1], step: [130], time: [36.4298], loss: [0.00093158]
Epoch: [ 1], step: [140], time: [39.2302], loss: [0.00035774]
Epoch: [ 1], step: [150], time: [42.5349], loss: [0.00089210]
Epoch: [ 1], step: [160], time: [45.5014], loss: [0.00456960]
Epoch: [ 1], step: [170], time: [48.5560], loss: [0.00040237]
Epoch: [ 2], step: [180], time: [51.8430], loss: [0.00109148]
Epoch: [ 2], step: [190], time: [55.4951], loss: [0.00081008]
Epoch: [ 2], step: [200], time: [58.9257], loss: [0.00075120]
Epoch: [ 2], step: [210], time: [61.6261], loss: [0.00255910]
Epoch: [ 2], step: [220], time: [64.2526], loss: [0.00096062]
Epoch: [ 2], step: [230], time: [67.1055], loss: [0.00033346]
Epoch: [ 2], step: [240], time: [69.8098], loss: [0.00175630]
Epoch: [ 2], step: [250], time: [73.0016], loss: [0.00027418]
Epoch: [ 2], step: [260], time: [76.4548], loss: [0.00422178]
Epoch: [ 2], step: [270], time: [79.4243], loss: [0.00770428]
Epoch: [ 2], step: [280], time: [82.0953], loss: [0.00030762]
Epoch: [ 2], step: [290], time: [84.7557], loss: [0.00147304]
Epoch: [ 2], step: [300], time: [87.4263], loss: [0.00093157]
Epoch: [ 2], step: [310], time: [90.1008], loss: [0.00035775]
Epoch: [ 2], step: [320], time: [92.7657], loss: [0.00089208]
Epoch: [ 2], step: [330], time: [95.4585], loss: [0.00456959]
Epoch: [ 2], step: [340], time: [98.1546], loss: [0.00040236]
Epoch: [ 3], step: [350], time: [100.8540], loss: [0.00109149]
Epoch: [ 3], step: [360], time: [103.5235], loss: [0.00081011]
Epoch: [ 3], step: [370], time: [106.1970], loss: [0.00075121]
Epoch: [ 3], step: [380], time: [108.9454], loss: [0.00255910]
Epoch: [ 3], step: [390], time: [111.5880], loss: [0.00096062]
Epoch: [ 3], step: [400], time: [114.2134], loss: [0.00033346]
Epoch: [ 3], step: [410], time: [116.8719], loss: [0.00175630]
Epoch: [ 3], step: [420], time: [119.5528], loss: [0.00027418]
Epoch: [ 3], step: [430], time: [122.2151], loss: [0.00422178]
Epoch: [ 3], step: [440], time: [125.1980], loss: [0.00770428]
Epoch: [ 3], step: [450], time: [128.5251], loss: [0.00030762]
Epoch: [ 3], step: [460], time: [131.8896], loss: [0.00147303]
Epoch: [ 3], step: [470], time: [135.4302], loss: [0.00093157]
Epoch: [ 3], step: [480], time: [139.2068], loss: [0.00035775]
Epoch: [ 3], step: [490], time: [142.5064], loss: [0.00089208]
Epoch: [ 3], step: [500], time: [146.1528], loss: [0.00456959]
Epoch: [ 3], step: [510], time: [149.6536], loss: [0.00040236]
Epoch: [ 4], step: [520], time: [152.4868], loss: [0.00109149]
Epoch: [ 4], step: [530], time: [155.3962], loss: [0.00081011]
Epoch: [ 4], step: [540], time: [158.8096], loss: [0.00075121]
Epoch: [ 4], step: [550], time: [162.2542], loss: [0.00255909]
Epoch: [ 4], step: [560], time: [165.4258], loss: [0.00096062]
Epoch: [ 4], step: [570], time: [169.1427], loss: [0.00033346]
Epoch: [ 4], step: [580], time: [172.1538], loss: [0.00175631]
Epoch: [ 4], step: [590], time: [175.3960], loss: [0.00027418]
Epoch: [ 4], step: [600], time: [178.5158], loss: [0.00422178]
Epoch: [ 4], step: [610], time: [182.6560], loss: [0.00770428]
Epoch: [ 4], step: [620], time: [186.4074], loss: [0.00030762]
Epoch: [ 4], step: [630], time: [189.9155], loss: [0.00147303]
Epoch: [ 4], step: [640], time: [193.2974], loss: [0.00093157]
Epoch: [ 4], step: [650], time: [196.7142], loss: [0.00035775]
Epoch: [ 4], step: [660], time: [200.1037], loss: [0.00089208]
Epoch: [ 4], step: [670], time: [203.9938], loss: [0.00456958]
Epoch: [ 4], step: [680], time: [207.7282], loss: [0.00040236]
Epoch: [ 5], step: [690], time: [212.5322], loss: [0.00109149]
Epoch: [ 5], step: [700], time: [216.9102], loss: [0.00081011]
Epoch: [ 5], step: [710], time: [220.3600], loss: [0.00075121]
Epoch: [ 5], step: [720], time: [224.0186], loss: [0.00255909]
Epoch: [ 5], step: [730], time: [227.1704], loss: [0.00096062]
Epoch: [ 5], step: [740], time: [229.9177], loss: [0.00033346]
Epoch: [ 5], step: [750], time: [233.3370], loss: [0.00175630]
Epoch: [ 5], step: [760], time: [236.2566], loss: [0.00027418]
Epoch: [ 5], step: [770], time: [238.9471], loss: [0.00422178]
Epoch: [ 5], step: [780], time: [242.3242], loss: [0.00770428]
Epoch: [ 5], step: [790], time: [245.5298], loss: [0.00030762]
Epoch: [ 5], step: [800], time: [248.5705], loss: [0.00147303]
Epoch: [ 5], step: [810], time: [251.4618], loss: [0.00093157]
Epoch: [ 5], step: [820], time: [254.3383], loss: [0.00035775]
Epoch: [ 5], step: [830], time: [257.1574], loss: [0.00089208]
Epoch: [ 5], step: [840], time: [260.1834], loss: [0.00456958]
Epoch: [ 5], step: [850], time: [263.3498], loss: [0.00040236]
Epoch: [ 6], step: [860], time: [266.6986], loss: [0.00109149]
Epoch: [ 6], step: [870], time: [270.1559], loss: [0.00081011]
Epoch: [ 6], step: [880], time: [272.8742], loss: [0.00075121]
Epoch: [ 6], step: [890], time: [275.9882], loss: [0.00255909]
Epoch: [ 6], step: [900], time: [279.4545], loss: [0.00096062]
Epoch: [ 6], step: [910], time: [283.0311], loss: [0.00033346]
Epoch: [ 6], step: [920], time: [286.8621], loss: [0.00175630]
Epoch: [ 6], step: [930], time: [289.6779], loss: [0.00027418]
Epoch: [ 6], step: [940], time: [292.4391], loss: [0.00422178]
Epoch: [ 6], step: [950], time: [295.6385], loss: [0.00770428]
Epoch: [ 6], step: [960], time: [299.0157], loss: [0.00030762]
Epoch: [ 6], step: [970], time: [301.7116], loss: [0.00147303]
Epoch: [ 6], step: [980], time: [304.3404], loss: [0.00093157]
Epoch: [ 6], step: [990], time: [307.2321], loss: [0.00035775]
Epoch: [ 6], step: [1000], time: [310.2067], loss: [0.00089208]
Epoch: [ 6], step: [1010], time: [313.2307], loss: [0.00456958]
Epoch: [ 6], step: [1020], time: [315.9500], loss: [0.00040236]
Epoch: [ 7], step: [1030], time: [318.7064], loss: [0.00109149]
Epoch: [ 7], step: [1040], time: [321.3944], loss: [0.00081011]
Epoch: [ 7], step: [1050], time: [324.1113], loss: [0.00075121]
Epoch: [ 7], step: [1060], time: [326.8342], loss: [0.00255909]
Epoch: [ 7], step: [1070], time: [329.8699], loss: [0.00096062]
Epoch: [ 7], step: [1080], time: [333.2227], loss: [0.00033346]
Epoch: [ 7], step: [1090], time: [336.7691], loss: [0.00175630]
Epoch: [ 7], step: [1100], time: [339.5250], loss: [0.00027418]
Epoch: [ 7], step: [1110], time: [342.2874], loss: [0.00422178]
Epoch: [ 7], step: [1120], time: [345.2596], loss: [0.00770428]
Epoch: [ 7], step: [1130], time: [348.0093], loss: [0.00030762]
Epoch: [ 7], step: [1140], time: [350.9188], loss: [0.00147303]
Epoch: [ 7], step: [1150], time: [353.6518], loss: [0.00093157]
Epoch: [ 7], step: [1160], time: [356.4463], loss: [0.00035775]
Epoch: [ 7], step: [1170], time: [359.1171], loss: [0.00089208]
Epoch: [ 7], step: [1180], time: [361.9808], loss: [0.00456958]
Epoch: [ 7], step: [1190], time: [364.8063], loss: [0.00040236]
Epoch: [ 8], step: [1200], time: [367.9861], loss: [0.00109149]
Epoch: [ 8], step: [1210], time: [371.2301], loss: [0.00081011]
Epoch: [ 8], step: [1220], time: [374.4329], loss: [0.00075121]
Epoch: [ 8], step: [1230], time: [377.2222], loss: [0.00255909]
Epoch: [ 8], step: [1240], time: [379.9472], loss: [0.00096062]
Epoch: [ 8], step: [1250], time: [382.6565], loss: [0.00033346]
Epoch: [ 8], step: [1260], time: [385.4930], loss: [0.00175630]
Epoch: [ 8], step: [1270], time: [388.2900], loss: [0.00027418]
Epoch: [ 8], step: [1280], time: [391.2438], loss: [0.00422178]
Epoch: [ 8], step: [1290], time: [393.9481], loss: [0.00770428]
Epoch: [ 8], step: [1300], time: [396.7192], loss: [0.00030762]
Epoch: [ 8], step: [1310], time: [399.4867], loss: [0.00147303]
Epoch: [ 8], step: [1320], time: [402.1058], loss: [0.00093157]
Epoch: [ 8], step: [1330], time: [404.7219], loss: [0.00035775]
Epoch: [ 8], step: [1340], time: [407.4092], loss: [0.00089208]
Epoch: [ 8], step: [1350], time: [410.0744], loss: [0.00456958]
Epoch: [ 8], step: [1360], time: [412.8516], loss: [0.00040236]
Epoch: [ 9], step: [1370], time: [416.3582], loss: [0.00109149]
Epoch: [ 9], step: [1380], time: [419.1324], loss: [0.00081011]
Epoch: [ 9], step: [1390], time: [421.9267], loss: [0.00075121]
Epoch: [ 9], step: [1400], time: [424.9457], loss: [0.00255909]
Epoch: [ 9], step: [1410], time: [427.6884], loss: [0.00096062]
Epoch: [ 9], step: [1420], time: [430.3333], loss: [0.00033346]
Epoch: [ 9], step: [1430], time: [433.3037], loss: [0.00175630]
Epoch: [ 9], step: [1440], time: [436.0107], loss: [0.00027418]
Epoch: [ 9], step: [1450], time: [438.9159], loss: [0.00422178]
Epoch: [ 9], step: [1460], time: [442.0330], loss: [0.00770428]
Epoch: [ 9], step: [1470], time: [444.8770], loss: [0.00030762]
Epoch: [ 9], step: [1480], time: [447.7595], loss: [0.00147303]
Epoch: [ 9], step: [1490], time: [450.5213], loss: [0.00093157]
Epoch: [ 9], step: [1500], time: [453.2845], loss: [0.00035775]
Epoch: [ 9], step: [1510], time: [456.4421], loss: [0.00089208]
Epoch: [ 9], step: [1520], time: [459.5848], loss: [0.00456958]
Epoch: [ 9], step: [1530], time: [462.4031], loss: [0.00040236]
Epoch: [10], step: [1540], time: [465.2110], loss: [0.00109149]
Epoch: [10], step: [1550], time: [467.8536], loss: [0.00081011]
Epoch: [10], step: [1560], time: [470.4920], loss: [0.00075121]
Epoch: [10], step: [1570], time: [473.2834], loss: [0.00255909]
Epoch: [10], step: [1580], time: [476.2685], loss: [0.00096062]
Epoch: [10], step: [1590], time: [479.1697], loss: [0.00033346]
Epoch: [10], step: [1600], time: [482.0981], loss: [0.00175630]
Epoch: [10], step: [1610], time: [484.8788], loss: [0.00027418]
Epoch: [10], step: [1620], time: [487.7385], loss: [0.00422178]
Epoch: [10], step: [1630], time: [490.4743], loss: [0.00770428]
Epoch: [10], step: [1640], time: [493.4746], loss: [0.00030762]
Epoch: [10], step: [1650], time: [496.3667], loss: [0.00147303]
Epoch: [10], step: [1660], time: [499.3600], loss: [0.00093157]
Epoch: [10], step: [1670], time: [502.1838], loss: [0.00035775]
Epoch: [10], step: [1680], time: [505.2022], loss: [0.00089208]
Epoch: [10], step: [1690], time: [508.3976], loss: [0.00456958]
Epoch: [10], step: [1700], time: [511.0931], loss: [0.00040236]
Epoch: [11], step: [1710], time: [513.8642], loss: [0.00109149]
Epoch: [11], step: [1720], time: [516.8661], loss: [0.00081011]
Epoch: [11], step: [1730], time: [520.4322], loss: [0.00075121]
Epoch: [11], step: [1740], time: [523.4970], loss: [0.00255909]
Epoch: [11], step: [1750], time: [527.4039], loss: [0.00096062]
Epoch: [11], step: [1760], time: [530.7298], loss: [0.00033346]
Epoch: [11], step: [1770], time: [533.8662], loss: [0.00175630]
Epoch: [11], step: [1780], time: [537.0409], loss: [0.00027418]
Epoch: [11], step: [1790], time: [539.9836], loss: [0.00422178]
Epoch: [11], step: [1800], time: [543.0593], loss: [0.00770428]
Epoch: [11], step: [1810], time: [545.9762], loss: [0.00030762]
Epoch: [11], step: [1820], time: [549.1060], loss: [0.00147303]
Epoch: [11], step: [1830], time: [551.7393], loss: [0.00093157]
Epoch: [11], step: [1840], time: [554.3753], loss: [0.00035775]
Epoch: [11], step: [1850], time: [557.0148], loss: [0.00089208]
Epoch: [11], step: [1860], time: [559.6319], loss: [0.00456958]
Epoch: [11], step: [1870], time: [562.2670], loss: [0.00040236]
Epoch: [12], step: [1880], time: [565.2308], loss: [0.00109149]
Epoch: [12], step: [1890], time: [568.5754], loss: [0.00081011]
Epoch: [12], step: [1900], time: [571.8611], loss: [0.00075121]
Epoch: [12], step: [1910], time: [575.1447], loss: [0.00255909]
Epoch: [12], step: [1920], time: [577.7877], loss: [0.00096062]
Epoch: [12], step: [1930], time: [580.4350], loss: [0.00033346]
Epoch: [12], step: [1940], time: [583.0791], loss: [0.00175630]
Epoch: [12], step: [1950], time: [585.7517], loss: [0.00027418]
Epoch: [12], step: [1960], time: [588.4303], loss: [0.00422178]
Epoch: [12], step: [1970], time: [591.1489], loss: [0.00770428]
Epoch: [12], step: [1980], time: [593.9313], loss: [0.00030762]
Epoch: [12], step: [1990], time: [597.2377], loss: [0.00147303]
Epoch: [12], step: [2000], time: [600.3770], loss: [0.00093157]
Epoch: [12], step: [2010], time: [604.2091], loss: [0.00035775]
Epoch: [12], step: [2020], time: [607.5267], loss: [0.00089208]
Epoch: [12], step: [2030], time: [610.7220], loss: [0.00456957]
Epoch: [12], step: [2040], time: [613.7110], loss: [0.00040236]
Epoch: [13], step: [2050], time: [616.7396], loss: [0.00109149]
Epoch: [13], step: [2060], time: [619.4905], loss: [0.00081011]
Epoch: [13], step: [2070], time: [622.3849], loss: [0.00075121]
Epoch: [13], step: [2080], time: [625.3801], loss: [0.00255909]
Epoch: [13], step: [2090], time: [628.1675], loss: [0.00096062]
Epoch: [13], step: [2100], time: [630.9234], loss: [0.00033346]
Epoch: [13], step: [2110], time: [633.6131], loss: [0.00175630]
Epoch: [13], step: [2120], time: [636.3115], loss: [0.00027418]
Epoch: [13], step: [2130], time: [639.0731], loss: [0.00422178]
Epoch: [13], step: [2140], time: [641.8143], loss: [0.00770428]
Epoch: [13], step: [2150], time: [644.6361], loss: [0.00030762]
Epoch: [13], step: [2160], time: [647.4542], loss: [0.00147303]
Epoch: [13], step: [2170], time: [650.1461], loss: [0.00093157]
Epoch: [13], step: [2180], time: [652.8786], loss: [0.00035775]
Epoch: [13], step: [2190], time: [655.5092], loss: [0.00089208]
Epoch: [13], step: [2200], time: [658.5861], loss: [0.00456957]
Epoch: [13], step: [2210], time: [661.6142], loss: [0.00040236]
Epoch: [14], step: [2220], time: [664.4436], loss: [0.00109149]
Epoch: [14], step: [2230], time: [667.1330], loss: [0.00081011]
Epoch: [14], step: [2240], time: [669.8032], loss: [0.00075121]
Epoch: [14], step: [2250], time: [672.4454], loss: [0.00255909]
Epoch: [14], step: [2260], time: [675.1623], loss: [0.00096062]
Epoch: [14], step: [2270], time: [677.8467], loss: [0.00033346]
Epoch: [14], step: [2280], time: [680.5660], loss: [0.00175630]
Epoch: [14], step: [2290], time: [683.3064], loss: [0.00027418]
Epoch: [14], step: [2300], time: [686.3021], loss: [0.00422178]
Epoch: [14], step: [2310], time: [689.0452], loss: [0.00770428]
Epoch: [14], step: [2320], time: [691.8669], loss: [0.00030762]
Epoch: [14], step: [2330], time: [694.7238], loss: [0.00147303]
Epoch: [14], step: [2340], time: [697.4295], loss: [0.00093157]
Epoch: [14], step: [2350], time: [700.3288], loss: [0.00035775]
Epoch: [14], step: [2360], time: [703.1498], loss: [0.00089208]
Epoch: [14], step: [2370], time: [706.0670], loss: [0.00456957]
Epoch: [14], step: [2380], time: [709.0064], loss: [0.00040236]
Epoch: [15], step: [2390], time: [711.8551], loss: [0.00109149]
Epoch: [15], step: [2400], time: [714.6035], loss: [0.00081011]
Epoch: [15], step: [2410], time: [717.3136], loss: [0.00075121]
Epoch: [15], step: [2420], time: [720.2313], loss: [0.00255909]
Epoch: [15], step: [2430], time: [723.0566], loss: [0.00096062]
Epoch: [15], step: [2440], time: [725.9864], loss: [0.00033346]
Epoch: [15], step: [2450], time: [728.8612], loss: [0.00175630]
Epoch: [15], step: [2460], time: [731.7488], loss: [0.00027418]
Epoch: [15], step: [2470], time: [734.6644], loss: [0.00422178]
Epoch: [15], step: [2480], time: [737.5399], loss: [0.00770428]
Epoch: [15], step: [2490], time: [740.7650], loss: [0.00030762]
Epoch: [15], step: [2500], time: [743.8847], loss: [0.00147303]
Epoch: [15], step: [2510], time: [747.2571], loss: [0.00093157]
Epoch: [15], step: [2520], time: [750.4376], loss: [0.00035775]
Epoch: [15], step: [2530], time: [753.4975], loss: [0.00089208]
Epoch: [15], step: [2540], time: [756.5680], loss: [0.00456957]
Epoch: [15], step: [2550], time: [759.4560], loss: [0.00040236]
Epoch: [16], step: [2560], time: [762.3374], loss: [0.00109149]
Epoch: [16], step: [2570], time: [765.1146], loss: [0.00081011]
Epoch: [16], step: [2580], time: [767.7800], loss: [0.00075121]
Epoch: [16], step: [2590], time: [770.4619], loss: [0.00255909]
Epoch: [16], step: [2600], time: [773.1673], loss: [0.00096062]
Epoch: [16], step: [2610], time: [776.0169], loss: [0.00033346]
Epoch: [16], step: [2620], time: [778.9848], loss: [0.00175630]
Epoch: [16], step: [2630], time: [782.3043], loss: [0.00027418]
Epoch: [16], step: [2640], time: [785.2068], loss: [0.00422177]
Epoch: [16], step: [2650], time: [787.9635], loss: [0.00770428]
Epoch: [16], step: [2660], time: [790.6431], loss: [0.00030762]
Epoch: [16], step: [2670], time: [793.3546], loss: [0.00147303]
Epoch: [16], step: [2680], time: [796.0370], loss: [0.00093157]
Epoch: [16], step: [2690], time: [798.7691], loss: [0.00035775]
Epoch: [16], step: [2700], time: [801.4346], loss: [0.00089208]
Epoch: [16], step: [2710], time: [804.0750], loss: [0.00456957]
Epoch: [16], step: [2720], time: [806.7332], loss: [0.00040236]
Epoch: [17], step: [2730], time: [809.4292], loss: [0.00109149]
Epoch: [17], step: [2740], time: [812.0751], loss: [0.00081011]
Epoch: [17], step: [2750], time: [814.8052], loss: [0.00075121]
Epoch: [17], step: [2760], time: [817.5415], loss: [0.00255909]
Epoch: [17], step: [2770], time: [820.2712], loss: [0.00096062]
Epoch: [17], step: [2780], time: [822.9955], loss: [0.00033346]
Epoch: [17], step: [2790], time: [825.7401], loss: [0.00175629]
Epoch: [17], step: [2800], time: [828.4152], loss: [0.00027418]
Epoch: [17], step: [2810], time: [831.0661], loss: [0.00422177]
Epoch: [17], step: [2820], time: [833.7592], loss: [0.00770428]
Epoch: [17], step: [2830], time: [836.4296], loss: [0.00030762]
Epoch: [17], step: [2840], time: [839.2962], loss: [0.00147303]
Epoch: [17], step: [2850], time: [842.1238], loss: [0.00093157]
Epoch: [17], step: [2860], time: [844.9269], loss: [0.00035775]
Epoch: [17], step: [2870], time: [847.6538], loss: [0.00089208]
Epoch: [17], step: [2880], time: [850.3922], loss: [0.00456957]
Epoch: [17], step: [2890], time: [853.4113], loss: [0.00040236]
Epoch: [18], step: [2900], time: [856.5898], loss: [0.00109149]
Epoch: [18], step: [2910], time: [859.2245], loss: [0.00081011]
Epoch: [18], step: [2920], time: [861.9928], loss: [0.00075121]
Epoch: [18], step: [2930], time: [864.6675], loss: [0.00255909]
Epoch: [18], step: [2940], time: [867.5550], loss: [0.00096062]
Epoch: [18], step: [2950], time: [870.5803], loss: [0.00033346]
Epoch: [18], step: [2960], time: [873.3660], loss: [0.00175629]
Epoch: [18], step: [2970], time: [876.2787], loss: [0.00027418]
Epoch: [18], step: [2980], time: [879.2254], loss: [0.00422177]
Epoch: [18], step: [2990], time: [882.2941], loss: [0.00770428]
Epoch: [18], step: [3000], time: [885.0249], loss: [0.00030762]
Epoch: [18], step: [3010], time: [888.0413], loss: [0.00147303]
Epoch: [18], step: [3020], time: [890.9957], loss: [0.00093157]
Epoch: [18], step: [3030], time: [893.7808], loss: [0.00035774]
Epoch: [18], step: [3040], time: [896.6443], loss: [0.00089208]
Epoch: [18], step: [3050], time: [900.1350], loss: [0.00456957]
Epoch: [18], step: [3060], time: [903.4700], loss: [0.00040236]
Epoch: [19], step: [3070], time: [906.2657], loss: [0.00109149]
Epoch: [19], step: [3080], time: [908.9396], loss: [0.00081011]
Epoch: [19], step: [3090], time: [911.6160], loss: [0.00075121]
Epoch: [19], step: [3100], time: [914.2540], loss: [0.00255909]
Epoch: [19], step: [3110], time: [917.3895], loss: [0.00096062]
Epoch: [19], step: [3120], time: [920.0008], loss: [0.00033346]
Epoch: [19], step: [3130], time: [922.8497], loss: [0.00175629]
Epoch: [19], step: [3140], time: [925.4887], loss: [0.00027418]
Epoch: [19], step: [3150], time: [928.1587], loss: [0.00422177]
Epoch: [19], step: [3160], time: [931.0457], loss: [0.00770428]
Epoch: [19], step: [3170], time: [933.7804], loss: [0.00030762]
Epoch: [19], step: [3180], time: [936.4415], loss: [0.00147303]
Epoch: [19], step: [3190], time: [939.1969], loss: [0.00093157]
Epoch: [19], step: [3200], time: [941.8435], loss: [0.00035774]
Epoch: [19], step: [3210], time: [944.5541], loss: [0.00089207]
Epoch: [19], step: [3220], time: [947.4425], loss: [0.00456957]
Epoch: [19], step: [3230], time: [950.3957], loss: [0.00040236]
Epoch: [20], step: [3240], time: [953.5488], loss: [0.00109149]
Epoch: [20], step: [3250], time: [956.4131], loss: [0.00081011]
Epoch: [20], step: [3260], time: [959.3673], loss: [0.00075121]
Epoch: [20], step: [3270], time: [962.2746], loss: [0.00255909]
Epoch: [20], step: [3280], time: [965.5865], loss: [0.00096062]
Epoch: [20], step: [3290], time: [968.6575], loss: [0.00033346]
Epoch: [20], step: [3300], time: [971.9265], loss: [0.00175629]
Epoch: [20], step: [3310], time: [974.6110], loss: [0.00027418]
Epoch: [20], step: [3320], time: [977.2863], loss: [0.00422177]
Epoch: [20], step: [3330], time: [979.9512], loss: [0.00770428]
Epoch: [20], step: [3340], time: [982.6368], loss: [0.00030762]
Epoch: [20], step: [3350], time: [985.3023], loss: [0.00147303]
Epoch: [20], step: [3360], time: [988.0343], loss: [0.00093157]
Epoch: [20], step: [3370], time: [990.8053], loss: [0.00035774]
Epoch: [20], step: [3380], time: [993.4939], loss: [0.00089207]
Epoch: [20], step: [3390], time: [996.2068], loss: [0.00456957]
Epoch: [20], step: [3400], time: [998.8787], loss: [0.00040236]
Epoch: [21], step: [3410], time: [1001.5493], loss: [0.00109149]
Epoch: [21], step: [3420], time: [1004.2012], loss: [0.00081011]
Epoch: [21], step: [3430], time: [1006.8513], loss: [0.00075121]
Epoch: [21], step: [3440], time: [1009.5248], loss: [0.00255909]
Epoch: [21], step: [3450], time: [1012.1812], loss: [0.00096062]
Epoch: [21], step: [3460], time: [1014.8598], loss: [0.00033346]
Epoch: [21], step: [3470], time: [1017.5138], loss: [0.00175629]
Epoch: [21], step: [3480], time: [1020.2334], loss: [0.00027418]
Epoch: [21], step: [3490], time: [1022.9588], loss: [0.00422177]
Epoch: [21], step: [3500], time: [1025.6195], loss: [0.00770428]
Epoch: [21], step: [3510], time: [1028.5374], loss: [0.00030762]
Epoch: [21], step: [3520], time: [1031.2010], loss: [0.00147303]
Epoch: [21], step: [3530], time: [1033.9935], loss: [0.00093157]
Epoch: [21], step: [3540], time: [1036.7240], loss: [0.00035774]
Epoch: [21], step: [3550], time: [1039.4339], loss: [0.00089207]
Epoch: [21], step: [3560], time: [1042.1773], loss: [0.00456956]
Epoch: [21], step: [3570], time: [1044.8982], loss: [0.00040236]
Epoch: [22], step: [3580], time: [1047.5681], loss: [0.00109149]
Epoch: [22], step: [3590], time: [1050.2481], loss: [0.00081011]
Epoch: [22], step: [3600], time: [1052.9127], loss: [0.00075121]
Epoch: [22], step: [3610], time: [1055.5513], loss: [0.00255909]
Epoch: [22], step: [3620], time: [1058.2068], loss: [0.00096061]
Epoch: [22], step: [3630], time: [1060.8545], loss: [0.00033346]
Epoch: [22], step: [3640], time: [1063.5289], loss: [0.00175629]
Epoch: [22], step: [3650], time: [1066.2088], loss: [0.00027418]
Epoch: [22], step: [3660], time: [1068.8364], loss: [0.00422177]
Epoch: [22], step: [3670], time: [1071.5235], loss: [0.00770428]
Epoch: [22], step: [3680], time: [1074.1875], loss: [0.00030762]
Epoch: [22], step: [3690], time: [1076.8360], loss: [0.00147303]
Epoch: [22], step: [3700], time: [1079.4872], loss: [0.00093157]
Epoch: [22], step: [3710], time: [1082.1913], loss: [0.00035774]
Epoch: [22], step: [3720], time: [1084.8956], loss: [0.00089207]
Epoch: [22], step: [3730], time: [1087.6438], loss: [0.00456956]
Epoch: [22], step: [3740], time: [1090.3281], loss: [0.00040236]
Epoch: [23], step: [3750], time: [1092.9832], loss: [0.00109149]
Epoch: [23], step: [3760], time: [1095.6733], loss: [0.00081011]
Epoch: [23], step: [3770], time: [1098.3642], loss: [0.00075121]
Epoch: [23], step: [3780], time: [1101.0460], loss: [0.00255909]
Epoch: [23], step: [3790], time: [1103.8604], loss: [0.00096061]
Epoch: [23], step: [3800], time: [1106.5498], loss: [0.00033346]
Epoch: [23], step: [3810], time: [1109.2755], loss: [0.00175629]
Epoch: [23], step: [3820], time: [1111.9967], loss: [0.00027418]
Epoch: [23], step: [3830], time: [1114.6325], loss: [0.00422177]
Epoch: [23], step: [3840], time: [1117.2798], loss: [0.00770428]
Epoch: [23], step: [3850], time: [1119.9399], loss: [0.00030762]
Epoch: [23], step: [3860], time: [1122.6133], loss: [0.00147303]
Epoch: [23], step: [3870], time: [1125.2670], loss: [0.00093157]
Epoch: [23], step: [3880], time: [1127.9246], loss: [0.00035774]
Epoch: [23], step: [3890], time: [1130.6066], loss: [0.00089207]
Epoch: [23], step: [3900], time: [1133.2789], loss: [0.00456956]
Epoch: [23], step: [3910], time: [1135.9522], loss: [0.00040236]
Epoch: [24], step: [3920], time: [1138.7150], loss: [0.00109149]
Epoch: [24], step: [3930], time: [1141.3645], loss: [0.00081011]
Epoch: [24], step: [3940], time: [1144.0160], loss: [0.00075121]
Epoch: [24], step: [3950], time: [1146.6875], loss: [0.00255908]
Epoch: [24], step: [3960], time: [1149.4166], loss: [0.00096061]
Epoch: [24], step: [3970], time: [1152.0854], loss: [0.00033346]
Epoch: [24], step: [3980], time: [1154.7286], loss: [0.00175629]
Epoch: [24], step: [3990], time: [1157.3740], loss: [0.00027418]
Epoch: [24], step: [4000], time: [1160.0288], loss: [0.00422177]
Epoch: [24], step: [4010], time: [1162.8457], loss: [0.00770428]
Epoch: [24], step: [4020], time: [1165.4858], loss: [0.00030762]
Epoch: [24], step: [4030], time: [1168.1399], loss: [0.00147303]
Epoch: [24], step: [4040], time: [1170.8114], loss: [0.00093156]
Epoch: [24], step: [4050], time: [1173.4886], loss: [0.00035774]
Epoch: [24], step: [4060], time: [1176.1456], loss: [0.00089207]
Epoch: [24], step: [4070], time: [1178.7977], loss: [0.00456956]
Epoch: [24], step: [4080], time: [1181.4188], loss: [0.00040236]
Epoch: [25], step: [4090], time: [1184.1914], loss: [0.00109149]
Epoch: [25], step: [4100], time: [1186.9536], loss: [0.00081011]
Epoch: [25], step: [4110], time: [1189.6135], loss: [0.00075121]
Epoch: [25], step: [4120], time: [1192.3285], loss: [0.00255908]
Epoch: [25], step: [4130], time: [1194.9950], loss: [0.00096061]
Epoch: [25], step: [4140], time: [1197.6590], loss: [0.00033346]
Epoch: [25], step: [4150], time: [1200.3275], loss: [0.00175629]
Epoch: [25], step: [4160], time: [1202.9685], loss: [0.00027418]
Epoch: [25], step: [4170], time: [1205.6336], loss: [0.00422177]
Epoch: [25], step: [4180], time: [1208.3078], loss: [0.00770428]
Epoch: [25], step: [4190], time: [1211.0306], loss: [0.00030762]
Epoch: [25], step: [4200], time: [1213.8104], loss: [0.00147303]
Epoch: [25], step: [4210], time: [1216.5999], loss: [0.00093156]
Epoch: [25], step: [4220], time: [1219.3835], loss: [0.00035774]
Epoch: [25], step: [4230], time: [1222.1583], loss: [0.00089207]
Epoch: [25], step: [4240], time: [1224.9636], loss: [0.00456956]
Epoch: [25], step: [4250], time: [1227.6670], loss: [0.00040236]
Epoch: [26], step: [4260], time: [1230.3810], loss: [0.00109149]
Epoch: [26], step: [4270], time: [1233.0595], loss: [0.00081011]
Epoch: [26], step: [4280], time: [1235.7178], loss: [0.00075121]
Epoch: [26], step: [4290], time: [1238.3813], loss: [0.00255908]
Epoch: [26], step: [4300], time: [1241.0687], loss: [0.00096061]
Epoch: [26], step: [4310], time: [1243.7586], loss: [0.00033346]
Epoch: [26], step: [4320], time: [1246.4254], loss: [0.00175629]
Epoch: [26], step: [4330], time: [1249.2864], loss: [0.00027418]
Epoch: [26], step: [4340], time: [1251.9908], loss: [0.00422177]
Epoch: [26], step: [4350], time: [1254.6778], loss: [0.00770428]
Epoch: [26], step: [4360], time: [1257.4108], loss: [0.00030762]
Epoch: [26], step: [4370], time: [1260.1515], loss: [0.00147303]
Epoch: [26], step: [4380], time: [1262.8969], loss: [0.00093156]
Epoch: [26], step: [4390], time: [1265.5508], loss: [0.00035774]
Epoch: [26], step: [4400], time: [1268.1945], loss: [0.00089207]
Epoch: [26], step: [4410], time: [1270.9162], loss: [0.00456956]
Epoch: [26], step: [4420], time: [1273.5858], loss: [0.00040236]
Epoch: [27], step: [4430], time: [1276.2557], loss: [0.00109149]
Epoch: [27], step: [4440], time: [1278.9405], loss: [0.00081011]
Epoch: [27], step: [4450], time: [1281.6135], loss: [0.00075121]
Epoch: [27], step: [4460], time: [1284.4302], loss: [0.00255908]
Epoch: [27], step: [4470], time: [1287.1669], loss: [0.00096061]
Epoch: [27], step: [4480], time: [1289.9630], loss: [0.00033346]
Epoch: [27], step: [4490], time: [1292.7416], loss: [0.00175629]
Epoch: [27], step: [4500], time: [1295.3894], loss: [0.00027418]
Epoch: [27], step: [4510], time: [1298.4353], loss: [0.00422177]
Epoch: [27], step: [4520], time: [1301.0828], loss: [0.00770428]
Epoch: [27], step: [4530], time: [1303.7238], loss: [0.00030762]
Epoch: [27], step: [4540], time: [1306.3777], loss: [0.00147303]
Epoch: [27], step: [4550], time: [1309.0257], loss: [0.00093156]
Epoch: [27], step: [4560], time: [1311.6692], loss: [0.00035774]
Epoch: [27], step: [4570], time: [1314.3184], loss: [0.00089207]
Epoch: [27], step: [4580], time: [1316.9812], loss: [0.00456956]
Epoch: [27], step: [4590], time: [1319.6295], loss: [0.00040236]
Epoch: [28], step: [4600], time: [1322.4569], loss: [0.00109149]
Epoch: [28], step: [4610], time: [1325.2112], loss: [0.00081011]
Epoch: [28], step: [4620], time: [1327.8708], loss: [0.00075121]
Epoch: [28], step: [4630], time: [1330.5277], loss: [0.00255908]
Epoch: [28], step: [4640], time: [1333.3393], loss: [0.00096061]
Epoch: [28], step: [4650], time: [1336.0405], loss: [0.00033346]
Epoch: [28], step: [4660], time: [1338.7293], loss: [0.00175628]
Epoch: [28], step: [4670], time: [1341.6025], loss: [0.00027418]
Epoch: [28], step: [4680], time: [1344.3654], loss: [0.00422177]
Epoch: [28], step: [4690], time: [1347.0923], loss: [0.00770427]
Epoch: [28], step: [4700], time: [1349.7956], loss: [0.00030762]
Epoch: [28], step: [4710], time: [1352.4644], loss: [0.00147302]
Epoch: [28], step: [4720], time: [1355.1114], loss: [0.00093156]
Epoch: [28], step: [4730], time: [1357.7950], loss: [0.00035774]
Epoch: [28], step: [4740], time: [1360.4236], loss: [0.00089207]
Epoch: [28], step: [4750], time: [1363.0488], loss: [0.00456956]
Epoch: [28], step: [4760], time: [1365.6928], loss: [0.00040236]
Epoch: [29], step: [4770], time: [1368.3410], loss: [0.00109149]
Epoch: [29], step: [4780], time: [1371.0162], loss: [0.00081011]
Epoch: [29], step: [4790], time: [1373.6824], loss: [0.00075121]
Epoch: [29], step: [4800], time: [1376.3064], loss: [0.00255908]
Epoch: [29], step: [4810], time: [1378.9565], loss: [0.00096061]
Epoch: [29], step: [4820], time: [1381.6336], loss: [0.00033346]
Epoch: [29], step: [4830], time: [1384.3287], loss: [0.00175628]
Epoch: [29], step: [4840], time: [1386.9726], loss: [0.00027418]
Epoch: [29], step: [4850], time: [1389.6312], loss: [0.00422177]
Epoch: [29], step: [4860], time: [1392.3306], loss: [0.00770428]
Epoch: [29], step: [4870], time: [1395.0092], loss: [0.00030762]
Epoch: [29], step: [4880], time: [1397.6533], loss: [0.00147302]
Epoch: [29], step: [4890], time: [1400.2968], loss: [0.00093156]
Epoch: [29], step: [4900], time: [1402.9356], loss: [0.00035774]
Epoch: [29], step: [4910], time: [1405.6013], loss: [0.00089207]
Epoch: [29], step: [4920], time: [1408.2493], loss: [0.00456956]
Epoch: [29], step: [4930], time: [1410.9192], loss: [0.00040236]
Epoch: [30], step: [4940], time: [1413.6737], loss: [0.00109149]
Epoch: [30], step: [4950], time: [1416.3770], loss: [0.00081011]
Epoch: [30], step: [4960], time: [1419.0663], loss: [0.00075121]
Epoch: [30], step: [4970], time: [1421.7531], loss: [0.00255908]
Epoch: [30], step: [4980], time: [1424.3916], loss: [0.00096061]
Epoch: [30], step: [4990], time: [1427.0468], loss: [0.00033346]
Epoch: [30], step: [5000], time: [1429.6953], loss: [0.00175628]
Epoch: [30], step: [5010], time: [1432.5806], loss: [0.00027418]
Epoch: [30], step: [5020], time: [1435.2254], loss: [0.00422177]
Epoch: [30], step: [5030], time: [1437.8526], loss: [0.00770427]
Epoch: [30], step: [5040], time: [1440.5233], loss: [0.00030762]
Epoch: [30], step: [5050], time: [1443.1778], loss: [0.00147302]
Epoch: [30], step: [5060], time: [1445.8427], loss: [0.00093156]
Epoch: [30], step: [5070], time: [1448.4848], loss: [0.00035774]
Epoch: [30], step: [5080], time: [1451.1264], loss: [0.00089207]
Epoch: [30], step: [5090], time: [1453.8660], loss: [0.00456955]
Epoch: [30], step: [5100], time: [1456.5206], loss: [0.00040236]
Epoch: [31], step: [5110], time: [1459.1686], loss: [0.00109149]
Epoch: [31], step: [5120], time: [1461.9395], loss: [0.00081011]
Epoch: [31], step: [5130], time: [1464.6734], loss: [0.00075121]
Epoch: [31], step: [5140], time: [1467.3464], loss: [0.00255908]
Epoch: [31], step: [5150], time: [1470.0832], loss: [0.00096061]
Epoch: [31], step: [5160], time: [1472.7682], loss: [0.00033346]
Epoch: [31], step: [5170], time: [1475.4351], loss: [0.00175628]
Epoch: [31], step: [5180], time: [1478.0957], loss: [0.00027418]
Epoch: [31], step: [5190], time: [1480.8035], loss: [0.00422177]
Epoch: [31], step: [5200], time: [1483.6389], loss: [0.00770427]
Epoch: [31], step: [5210], time: [1486.6538], loss: [0.00030762]
Epoch: [31], step: [5220], time: [1489.5847], loss: [0.00147302]
Epoch: [31], step: [5230], time: [1492.3736], loss: [0.00093156]
Epoch: [31], step: [5240], time: [1495.1450], loss: [0.00035774]
Epoch: [31], step: [5250], time: [1497.9077], loss: [0.00089207]
Epoch: [31], step: [5260], time: [1500.6695], loss: [0.00456955]
Epoch: [31], step: [5270], time: [1503.4673], loss: [0.00040236]
Epoch: [32], step: [5280], time: [1506.2490], loss: [0.00109149]
Epoch: [32], step: [5290], time: [1508.9878], loss: [0.00081011]
Epoch: [32], step: [5300], time: [1511.6867], loss: [0.00075121]
Epoch: [32], step: [5310], time: [1514.4968], loss: [0.00255908]
Epoch: [32], step: [5320], time: [1517.2714], loss: [0.00096061]
Epoch: [32], step: [5330], time: [1520.0109], loss: [0.00033346]
Epoch: [32], step: [5340], time: [1522.7721], loss: [0.00175628]
Epoch: [32], step: [5350], time: [1525.6206], loss: [0.00027418]
Epoch: [32], step: [5360], time: [1528.3006], loss: [0.00422177]
Epoch: [32], step: [5370], time: [1530.9846], loss: [0.00770427]
Epoch: [32], step: [5380], time: [1533.6937], loss: [0.00030762]
Epoch: [32], step: [5390], time: [1536.3612], loss: [0.00147302]
Epoch: [32], step: [5400], time: [1539.0182], loss: [0.00093156]
Epoch: [32], step: [5410], time: [1541.6745], loss: [0.00035774]
Epoch: [32], step: [5420], time: [1544.3300], loss: [0.00089207]
Epoch: [32], step: [5430], time: [1547.0000], loss: [0.00456955]
Epoch: [32], step: [5440], time: [1549.6789], loss: [0.00040236]
Epoch: [33], step: [5450], time: [1552.3883], loss: [0.00109149]
Epoch: [33], step: [5460], time: [1555.0536], loss: [0.00081011]
Epoch: [33], step: [5470], time: [1557.7311], loss: [0.00075121]
Epoch: [33], step: [5480], time: [1560.3901], loss: [0.00255908]
Epoch: [33], step: [5490], time: [1563.0497], loss: [0.00096061]
Epoch: [33], step: [5500], time: [1565.7063], loss: [0.00033346]
Epoch: [33], step: [5510], time: [1568.5477], loss: [0.00175628]
Epoch: [33], step: [5520], time: [1571.2048], loss: [0.00027418]
Epoch: [33], step: [5530], time: [1573.8602], loss: [0.00422177]
Epoch: [33], step: [5540], time: [1576.6128], loss: [0.00770427]
Epoch: [33], step: [5550], time: [1579.2633], loss: [0.00030762]
Epoch: [33], step: [5560], time: [1581.9176], loss: [0.00147302]
Epoch: [33], step: [5570], time: [1584.5691], loss: [0.00093156]
Epoch: [33], step: [5580], time: [1587.2451], loss: [0.00035774]
Epoch: [33], step: [5590], time: [1589.9131], loss: [0.00089207]
Epoch: [33], step: [5600], time: [1592.5719], loss: [0.00456955]
Epoch: [33], step: [5610], time: [1595.2218], loss: [0.00040236]
Epoch: [34], step: [5620], time: [1597.9811], loss: [0.00109149]
Epoch: [34], step: [5630], time: [1600.6630], loss: [0.00081011]
Epoch: [34], step: [5640], time: [1603.3220], loss: [0.00075121]
Epoch: [34], step: [5650], time: [1605.9945], loss: [0.00255908]
Epoch: [34], step: [5660], time: [1608.6522], loss: [0.00096061]
Epoch: [34], step: [5670], time: [1611.2932], loss: [0.00033346]
Epoch: [34], step: [5680], time: [1613.9472], loss: [0.00175628]
Epoch: [34], step: [5690], time: [1616.5907], loss: [0.00027418]
Epoch: [34], step: [5700], time: [1619.2083], loss: [0.00422177]
Epoch: [34], step: [5710], time: [1621.8544], loss: [0.00770427]
Epoch: [34], step: [5720], time: [1624.5192], loss: [0.00030762]
Epoch: [34], step: [5730], time: [1627.1842], loss: [0.00147302]
Epoch: [34], step: [5740], time: [1629.8238], loss: [0.00093156]
Epoch: [34], step: [5750], time: [1632.4442], loss: [0.00035774]
Epoch: [34], step: [5760], time: [1635.2890], loss: [0.00089207]
Epoch: [34], step: [5770], time: [1638.2684], loss: [0.00456955]
Epoch: [34], step: [5780], time: [1641.1722], loss: [0.00040236]
Epoch: [35], step: [5790], time: [1644.1807], loss: [0.00109149]
Epoch: [35], step: [5800], time: [1646.8764], loss: [0.00081011]
Epoch: [35], step: [5810], time: [1649.6223], loss: [0.00075121]
Epoch: [35], step: [5820], time: [1652.3255], loss: [0.00255908]
Epoch: [35], step: [5830], time: [1655.0133], loss: [0.00096061]
Epoch: [35], step: [5840], time: [1657.6528], loss: [0.00033346]
Epoch: [35], step: [5850], time: [1660.4080], loss: [0.00175628]
Epoch: [35], step: [5860], time: [1663.0974], loss: [0.00027418]
Epoch: [35], step: [5870], time: [1665.7998], loss: [0.00422177]
Epoch: [35], step: [5880], time: [1668.5023], loss: [0.00770427]
Epoch: [35], step: [5890], time: [1671.1999], loss: [0.00030762]
Epoch: [35], step: [5900], time: [1673.8791], loss: [0.00147302]
Epoch: [35], step: [5910], time: [1676.5236], loss: [0.00093156]
Epoch: [35], step: [5920], time: [1679.2046], loss: [0.00035774]
Epoch: [35], step: [5930], time: [1681.8772], loss: [0.00089207]
Epoch: [35], step: [5940], time: [1684.6086], loss: [0.00456955]
Epoch: [35], step: [5950], time: [1687.2957], loss: [0.00040236]
Epoch: [36], step: [5960], time: [1689.9432], loss: [0.00109149]
Epoch: [36], step: [5970], time: [1692.5937], loss: [0.00081011]
Epoch: [36], step: [5980], time: [1695.2498], loss: [0.00075121]
Epoch: [36], step: [5990], time: [1697.9935], loss: [0.00255908]
Epoch: [36], step: [6000], time: [1700.6388], loss: [0.00096061]
Epoch: [36], step: [6010], time: [1703.6807], loss: [0.00033346]
Epoch: [36], step: [6020], time: [1706.3193], loss: [0.00175628]
Epoch: [36], step: [6030], time: [1708.9859], loss: [0.00027418]
Epoch: [36], step: [6040], time: [1711.6484], loss: [0.00422177]
Epoch: [36], step: [6050], time: [1714.2825], loss: [0.00770427]
Epoch: [36], step: [6060], time: [1716.9787], loss: [0.00030762]
Epoch: [36], step: [6070], time: [1719.6213], loss: [0.00147302]
Epoch: [36], step: [6080], time: [1722.2808], loss: [0.00093156]
Epoch: [36], step: [6090], time: [1724.9556], loss: [0.00035774]
Epoch: [36], step: [6100], time: [1727.6521], loss: [0.00089207]
Epoch: [36], step: [6110], time: [1730.4847], loss: [0.00456955]
Epoch: [36], step: [6120], time: [1733.1840], loss: [0.00040236]
Epoch: [37], step: [6130], time: [1735.8726], loss: [0.00109149]
Epoch: [37], step: [6140], time: [1738.5465], loss: [0.00081011]
Epoch: [37], step: [6150], time: [1741.2259], loss: [0.00075121]
Epoch: [37], step: [6160], time: [1743.9126], loss: [0.00255908]
Epoch: [37], step: [6170], time: [1746.5496], loss: [0.00096061]
Epoch: [37], step: [6180], time: [1749.2062], loss: [0.00033346]
Epoch: [37], step: [6190], time: [1751.8569], loss: [0.00175628]
Epoch: [37], step: [6200], time: [1754.5060], loss: [0.00027418]
Epoch: [37], step: [6210], time: [1757.1780], loss: [0.00422177]
Epoch: [37], step: [6220], time: [1759.9051], loss: [0.00770427]
Epoch: [37], step: [6230], time: [1762.5486], loss: [0.00030762]
Epoch: [37], step: [6240], time: [1765.1877], loss: [0.00147302]
Epoch: [37], step: [6250], time: [1767.8417], loss: [0.00093156]
Epoch: [37], step: [6260], time: [1770.4887], loss: [0.00035774]
Epoch: [37], step: [6270], time: [1773.1341], loss: [0.00089207]
Epoch: [37], step: [6280], time: [1775.7757], loss: [0.00456955]
Epoch: [37], step: [6290], time: [1778.4004], loss: [0.00040236]
Epoch: [38], step: [6300], time: [1781.0429], loss: [0.00109149]
Epoch: [38], step: [6310], time: [1783.7154], loss: [0.00081011]
Epoch: [38], step: [6320], time: [1786.3699], loss: [0.00075121]
Epoch: [38], step: [6330], time: [1789.0237], loss: [0.00255908]
Epoch: [38], step: [6340], time: [1791.6518], loss: [0.00096061]
Epoch: [38], step: [6350], time: [1794.3309], loss: [0.00033346]
Epoch: [38], step: [6360], time: [1796.9681], loss: [0.00175628]
Epoch: [38], step: [6370], time: [1799.6426], loss: [0.00027418]
Epoch: [38], step: [6380], time: [1802.3151], loss: [0.00422177]
Epoch: [38], step: [6390], time: [1804.9956], loss: [0.00770427]
Epoch: [38], step: [6400], time: [1807.6519], loss: [0.00030762]
Epoch: [38], step: [6410], time: [1810.3233], loss: [0.00147302]
Epoch: [38], step: [6420], time: [1813.0130], loss: [0.00093156]
Epoch: [38], step: [6430], time: [1815.6919], loss: [0.00035774]
Epoch: [38], step: [6440], time: [1818.3209], loss: [0.00089207]
Epoch: [38], step: [6450], time: [1821.0850], loss: [0.00456955]
Epoch: [38], step: [6460], time: [1823.7686], loss: [0.00040236]
Epoch: [39], step: [6470], time: [1826.3942], loss: [0.00109149]
Epoch: [39], step: [6480], time: [1829.0529], loss: [0.00081011]
Epoch: [39], step: [6490], time: [1831.7353], loss: [0.00075121]
Epoch: [39], step: [6500], time: [1834.4237], loss: [0.00255908]
Epoch: [39], step: [6510], time: [1837.4524], loss: [0.00096061]
Epoch: [39], step: [6520], time: [1840.1189], loss: [0.00033346]
Epoch: [39], step: [6530], time: [1842.7624], loss: [0.00175628]
Epoch: [39], step: [6540], time: [1845.4165], loss: [0.00027418]
Epoch: [39], step: [6550], time: [1848.0649], loss: [0.00422177]
Epoch: [39], step: [6560], time: [1850.7164], loss: [0.00770427]
Epoch: [39], step: [6570], time: [1853.3654], loss: [0.00030762]
Epoch: [39], step: [6580], time: [1856.0431], loss: [0.00147302]
Epoch: [39], step: [6590], time: [1858.6896], loss: [0.00093156]
Epoch: [39], step: [6600], time: [1861.3451], loss: [0.00035774]
Epoch: [39], step: [6610], time: [1863.9817], loss: [0.00089207]
Epoch: [39], step: [6620], time: [1866.6310], loss: [0.00456954]
Epoch: [39], step: [6630], time: [1869.3140], loss: [0.00040236]
Epoch: [40], step: [6640], time: [1871.9830], loss: [0.00109148]
Epoch: [40], step: [6650], time: [1874.6994], loss: [0.00081011]
Epoch: [40], step: [6660], time: [1877.3623], loss: [0.00075121]
Epoch: [40], step: [6670], time: [1880.0708], loss: [0.00255908]
Epoch: [40], step: [6680], time: [1882.8105], loss: [0.00096061]
Epoch: [40], step: [6690], time: [1885.5228], loss: [0.00033346]
Epoch: [40], step: [6700], time: [1888.1918], loss: [0.00175627]
Epoch: [40], step: [6710], time: [1890.8522], loss: [0.00027418]
Epoch: [40], step: [6720], time: [1893.4902], loss: [0.00422176]
Epoch: [40], step: [6730], time: [1896.1407], loss: [0.00770427]
Epoch: [40], step: [6740], time: [1898.7752], loss: [0.00030762]
Epoch: [40], step: [6750], time: [1901.4292], loss: [0.00147302]
Epoch: [40], step: [6760], time: [1904.0859], loss: [0.00093156]
Epoch: [40], step: [6770], time: [1906.7370], loss: [0.00035774]
Epoch: [40], step: [6780], time: [1909.4071], loss: [0.00089207]
Epoch: [40], step: [6790], time: [1912.0531], loss: [0.00456954]
Epoch: [40], step: [6800], time: [1914.7211], loss: [0.00040236]
Epoch: [41], step: [6810], time: [1917.3788], loss: [0.00109148]
Epoch: [41], step: [6820], time: [1920.0607], loss: [0.00081011]
Epoch: [41], step: [6830], time: [1922.7167], loss: [0.00075121]
Epoch: [41], step: [6840], time: [1925.3745], loss: [0.00255908]
Epoch: [41], step: [6850], time: [1928.0046], loss: [0.00096061]
Epoch: [41], step: [6860], time: [1930.6615], loss: [0.00033346]
Epoch: [41], step: [6870], time: [1933.3227], loss: [0.00175627]
Epoch: [41], step: [6880], time: [1936.0354], loss: [0.00027418]
Epoch: [41], step: [6890], time: [1938.6966], loss: [0.00422176]
Epoch: [41], step: [6900], time: [1941.4886], loss: [0.00770427]
Epoch: [41], step: [6910], time: [1944.1620], loss: [0.00030762]
Epoch: [41], step: [6920], time: [1946.8506], loss: [0.00147302]
Epoch: [41], step: [6930], time: [1949.5442], loss: [0.00093156]
Epoch: [41], step: [6940], time: [1952.2026], loss: [0.00035774]
Epoch: [41], step: [6950], time: [1954.9658], loss: [0.00089207]
Epoch: [41], step: [6960], time: [1957.6350], loss: [0.00456954]
Epoch: [41], step: [6970], time: [1960.3140], loss: [0.00040236]
Epoch: [42], step: [6980], time: [1962.9712], loss: [0.00109148]
Epoch: [42], step: [6990], time: [1965.6272], loss: [0.00081011]
Epoch: [42], step: [7000], time: [1968.3306], loss: [0.00075121]
Epoch: [42], step: [7010], time: [1971.4350], loss: [0.00255908]
Epoch: [42], step: [7020], time: [1974.1198], loss: [0.00096061]
Epoch: [42], step: [7030], time: [1976.7806], loss: [0.00033346]
Epoch: [42], step: [7040], time: [1979.4425], loss: [0.00175627]
Epoch: [42], step: [7050], time: [1982.1288], loss: [0.00027418]
Epoch: [42], step: [7060], time: [1984.7938], loss: [0.00422176]
Epoch: [42], step: [7070], time: [1987.4768], loss: [0.00770427]
Epoch: [42], step: [7080], time: [1990.1494], loss: [0.00030762]
Epoch: [42], step: [7090], time: [1992.8253], loss: [0.00147302]
Epoch: [42], step: [7100], time: [1995.5144], loss: [0.00093156]
Epoch: [42], step: [7110], time: [1998.1960], loss: [0.00035774]
Epoch: [42], step: [7120], time: [2000.8670], loss: [0.00089207]
Epoch: [42], step: [7130], time: [2003.6407], loss: [0.00456954]
Epoch: [42], step: [7140], time: [2006.3011], loss: [0.00040236]
Epoch: [43], step: [7150], time: [2008.9834], loss: [0.00109148]
Epoch: [43], step: [7160], time: [2011.7136], loss: [0.00081011]
Epoch: [43], step: [7170], time: [2014.4116], loss: [0.00075121]
Epoch: [43], step: [7180], time: [2017.1244], loss: [0.00255908]
Epoch: [43], step: [7190], time: [2019.8145], loss: [0.00096061]
Epoch: [43], step: [7200], time: [2022.4969], loss: [0.00033346]
Epoch: [43], step: [7210], time: [2025.1810], loss: [0.00175627]
Epoch: [43], step: [7220], time: [2027.8544], loss: [0.00027418]
Epoch: [43], step: [7230], time: [2030.5463], loss: [0.00422176]
Epoch: [43], step: [7240], time: [2033.2248], loss: [0.00770427]
Epoch: [43], step: [7250], time: [2035.9393], loss: [0.00030762]
Epoch: [43], step: [7260], time: [2038.6228], loss: [0.00147302]
Epoch: [43], step: [7270], time: [2041.3142], loss: [0.00093156]
Epoch: [43], step: [7280], time: [2043.9876], loss: [0.00035774]
Epoch: [43], step: [7290], time: [2046.6813], loss: [0.00089207]
Epoch: [43], step: [7300], time: [2049.3459], loss: [0.00456954]
Epoch: [43], step: [7310], time: [2052.0093], loss: [0.00040236]
Epoch: [44], step: [7320], time: [2054.6991], loss: [0.00109148]
Epoch: [44], step: [7330], time: [2057.3647], loss: [0.00081011]
Epoch: [44], step: [7340], time: [2060.0358], loss: [0.00075121]
Epoch: [44], step: [7350], time: [2062.7310], loss: [0.00255908]
Epoch: [44], step: [7360], time: [2065.4672], loss: [0.00096061]
Epoch: [44], step: [7370], time: [2068.1064], loss: [0.00033346]
Epoch: [44], step: [7380], time: [2070.7838], loss: [0.00175627]
Epoch: [44], step: [7390], time: [2073.4626], loss: [0.00027418]
Epoch: [44], step: [7400], time: [2076.1031], loss: [0.00422176]
Epoch: [44], step: [7410], time: [2078.7582], loss: [0.00770427]
Epoch: [44], step: [7420], time: [2081.4279], loss: [0.00030762]
Epoch: [44], step: [7430], time: [2084.1628], loss: [0.00147302]
Epoch: [44], step: [7440], time: [2086.8493], loss: [0.00093156]
Epoch: [44], step: [7450], time: [2089.5624], loss: [0.00035774]
Epoch: [44], step: [7460], time: [2092.2579], loss: [0.00089207]
Epoch: [44], step: [7470], time: [2094.9275], loss: [0.00456954]
Epoch: [44], step: [7480], time: [2097.5928], loss: [0.00040236]
Epoch: [45], step: [7490], time: [2100.2641], loss: [0.00109148]
Epoch: [45], step: [7500], time: [2102.9566], loss: [0.00081010]
Epoch: [45], step: [7510], time: [2106.0063], loss: [0.00075121]
Epoch: [45], step: [7520], time: [2108.7008], loss: [0.00255908]
Epoch: [45], step: [7530], time: [2111.3745], loss: [0.00096061]
Epoch: [45], step: [7540], time: [2114.0554], loss: [0.00033346]
Epoch: [45], step: [7550], time: [2116.7196], loss: [0.00175627]
Epoch: [45], step: [7560], time: [2119.3718], loss: [0.00027418]
Epoch: [45], step: [7570], time: [2122.0597], loss: [0.00422176]
Epoch: [45], step: [7580], time: [2124.8025], loss: [0.00770427]
Epoch: [45], step: [7590], time: [2127.4605], loss: [0.00030762]
Epoch: [45], step: [7600], time: [2130.1205], loss: [0.00147302]
Epoch: [45], step: [7610], time: [2132.7738], loss: [0.00093156]
Epoch: [45], step: [7620], time: [2135.4157], loss: [0.00035774]
Epoch: [45], step: [7630], time: [2138.0597], loss: [0.00089207]
Epoch: [45], step: [7640], time: [2140.7371], loss: [0.00456954]
Epoch: [45], step: [7650], time: [2143.4022], loss: [0.00040236]
Epoch: [46], step: [7660], time: [2146.0479], loss: [0.00109148]
Epoch: [46], step: [7670], time: [2148.7134], loss: [0.00081010]
Epoch: [46], step: [7680], time: [2151.3928], loss: [0.00075121]
Epoch: [46], step: [7690], time: [2154.0869], loss: [0.00255908]
Epoch: [46], step: [7700], time: [2156.7889], loss: [0.00096061]
Epoch: [46], step: [7710], time: [2159.4822], loss: [0.00033346]
Epoch: [46], step: [7720], time: [2162.1547], loss: [0.00175627]
Epoch: [46], step: [7730], time: [2164.9184], loss: [0.00027418]
Epoch: [46], step: [7740], time: [2167.6574], loss: [0.00422176]
Epoch: [46], step: [7750], time: [2170.3391], loss: [0.00770427]
Epoch: [46], step: [7760], time: [2173.0062], loss: [0.00030762]
Epoch: [46], step: [7770], time: [2175.6619], loss: [0.00147302]
Epoch: [46], step: [7780], time: [2178.3130], loss: [0.00093156]
Epoch: [46], step: [7790], time: [2180.9693], loss: [0.00035774]
Epoch: [46], step: [7800], time: [2183.6251], loss: [0.00089207]
Epoch: [46], step: [7810], time: [2186.3549], loss: [0.00456954]
Epoch: [46], step: [7820], time: [2189.0272], loss: [0.00040236]
Epoch: [47], step: [7830], time: [2191.6616], loss: [0.00109148]
Epoch: [47], step: [7840], time: [2194.3311], loss: [0.00081010]
Epoch: [47], step: [7850], time: [2196.9742], loss: [0.00075121]
Epoch: [47], step: [7860], time: [2199.6296], loss: [0.00255907]
Epoch: [47], step: [7870], time: [2202.3607], loss: [0.00096061]
Epoch: [47], step: [7880], time: [2205.0463], loss: [0.00033346]
Epoch: [47], step: [7890], time: [2207.7035], loss: [0.00175627]
Epoch: [47], step: [7900], time: [2210.3808], loss: [0.00027418]
Epoch: [47], step: [7910], time: [2213.0423], loss: [0.00422176]
Epoch: [47], step: [7920], time: [2215.7172], loss: [0.00770427]
Epoch: [47], step: [7930], time: [2218.3787], loss: [0.00030762]
Epoch: [47], step: [7940], time: [2221.0404], loss: [0.00147302]
Epoch: [47], step: [7950], time: [2223.7075], loss: [0.00093156]
Epoch: [47], step: [7960], time: [2226.4233], loss: [0.00035774]
Epoch: [47], step: [7970], time: [2229.1210], loss: [0.00089207]
Epoch: [47], step: [7980], time: [2231.7919], loss: [0.00456954]
Epoch: [47], step: [7990], time: [2234.4354], loss: [0.00040236]
Epoch: [48], step: [8000], time: [2237.1000], loss: [0.00109148]
Epoch: [48], step: [8010], time: [2240.1602], loss: [0.00081010]
Epoch: [48], step: [8020], time: [2242.8083], loss: [0.00075121]
Epoch: [48], step: [8030], time: [2245.4654], loss: [0.00255907]
Epoch: [48], step: [8040], time: [2248.2045], loss: [0.00096061]
Epoch: [48], step: [8050], time: [2250.8579], loss: [0.00033346]
Epoch: [48], step: [8060], time: [2253.5164], loss: [0.00175627]
Epoch: [48], step: [8070], time: [2256.1548], loss: [0.00027418]
Epoch: [48], step: [8080], time: [2258.8113], loss: [0.00422176]
Epoch: [48], step: [8090], time: [2261.4568], loss: [0.00770427]
Epoch: [48], step: [8100], time: [2264.1187], loss: [0.00030762]
Epoch: [48], step: [8110], time: [2266.7790], loss: [0.00147302]
Epoch: [48], step: [8120], time: [2269.4884], loss: [0.00093156]
Epoch: [48], step: [8130], time: [2272.1803], loss: [0.00035774]
Epoch: [48], step: [8140], time: [2274.8434], loss: [0.00089207]
Epoch: [48], step: [8150], time: [2277.5188], loss: [0.00456953]
Epoch: [48], step: [8160], time: [2280.1708], loss: [0.00040236]
Epoch: [49], step: [8170], time: [2282.8427], loss: [0.00109148]
Epoch: [49], step: [8180], time: [2285.4892], loss: [0.00081010]
Epoch: [49], step: [8190], time: [2288.1158], loss: [0.00075121]
Epoch: [49], step: [8200], time: [2290.7877], loss: [0.00255907]
Epoch: [49], step: [8210], time: [2293.4331], loss: [0.00096061]
Epoch: [49], step: [8220], time: [2296.1434], loss: [0.00033346]
Epoch: [49], step: [8230], time: [2298.8330], loss: [0.00175627]
Epoch: [49], step: [8240], time: [2301.4921], loss: [0.00027418]
Epoch: [49], step: [8250], time: [2304.1632], loss: [0.00422176]
Epoch: [49], step: [8260], time: [2306.8042], loss: [0.00770427]
Epoch: [49], step: [8270], time: [2309.5515], loss: [0.00030762]
Epoch: [49], step: [8280], time: [2312.2173], loss: [0.00147302]
Epoch: [49], step: [8290], time: [2314.8701], loss: [0.00093156]
Epoch: [49], step: [8300], time: [2317.5410], loss: [0.00035774]
Epoch: [49], step: [8310], time: [2320.2063], loss: [0.00089207]
Epoch: [49], step: [8320], time: [2322.8732], loss: [0.00456953]
Epoch: [49], step: [8330], time: [2325.5383], loss: [0.00040236]
Epoch: [50], step: [8340], time: [2328.1933], loss: [0.00109148]
Epoch: [50], step: [8350], time: [2330.8538], loss: [0.00081010]
Epoch: [50], step: [8360], time: [2333.5013], loss: [0.00075121]
Epoch: [50], step: [8370], time: [2336.1642], loss: [0.00255907]
Epoch: [50], step: [8380], time: [2338.8351], loss: [0.00096061]
Epoch: [50], step: [8390], time: [2341.5145], loss: [0.00033346]
Epoch: [50], step: [8400], time: [2344.1740], loss: [0.00175627]
Epoch: [50], step: [8410], time: [2346.8071], loss: [0.00027418]
Epoch: [50], step: [8420], time: [2349.4568], loss: [0.00422176]
Epoch: [50], step: [8430], time: [2352.1243], loss: [0.00770427]
Epoch: [50], step: [8440], time: [2354.7714], loss: [0.00030762]
Epoch: [50], step: [8450], time: [2357.4484], loss: [0.00147302]
Epoch: [50], step: [8460], time: [2360.1037], loss: [0.00093156]
Epoch: [50], step: [8470], time: [2362.7644], loss: [0.00035774]
Epoch: [50], step: [8480], time: [2365.4204], loss: [0.00089207]
Epoch: [50], step: [8490], time: [2368.1391], loss: [0.00456953]
Epoch: [50], step: [8500], time: [2370.9118], loss: [0.00040236]
Epoch: [51], step: [8510], time: [2373.7315], loss: [0.00109148]
Epoch: [51], step: [8520], time: [2376.4056], loss: [0.00081010]
Epoch: [51], step: [8530], time: [2379.0523], loss: [0.00075121]
Epoch: [51], step: [8540], time: [2381.6965], loss: [0.00255907]
Epoch: [51], step: [8550], time: [2384.3540], loss: [0.00096061]
Epoch: [51], step: [8560], time: [2387.0314], loss: [0.00033346]
Epoch: [51], step: [8570], time: [2389.6955], loss: [0.00175627]
Epoch: [51], step: [8580], time: [2392.3510], loss: [0.00027418]
Epoch: [51], step: [8590], time: [2395.0021], loss: [0.00422176]
Epoch: [51], step: [8600], time: [2397.6577], loss: [0.00770427]
Epoch: [51], step: [8610], time: [2400.3257], loss: [0.00030762]
Epoch: [51], step: [8620], time: [2402.9852], loss: [0.00147302]
Epoch: [51], step: [8630], time: [2405.6627], loss: [0.00093156]
Epoch: [51], step: [8640], time: [2408.3151], loss: [0.00035774]
Epoch: [51], step: [8650], time: [2410.9929], loss: [0.00089207]
Epoch: [51], step: [8660], time: [2413.6580], loss: [0.00456953]
Epoch: [51], step: [8670], time: [2416.3274], loss: [0.00040236]
Epoch: [52], step: [8680], time: [2418.9924], loss: [0.00109148]
Epoch: [52], step: [8690], time: [2421.6634], loss: [0.00081010]
Epoch: [52], step: [8700], time: [2424.3200], loss: [0.00075121]
Epoch: [52], step: [8710], time: [2426.9648], loss: [0.00255907]
Epoch: [52], step: [8720], time: [2429.7101], loss: [0.00096061]
Epoch: [52], step: [8730], time: [2432.3789], loss: [0.00033346]
Epoch: [52], step: [8740], time: [2435.0452], loss: [0.00175626]
Epoch: [52], step: [8750], time: [2437.7312], loss: [0.00027418]
Epoch: [52], step: [8760], time: [2440.4571], loss: [0.00422176]
Epoch: [52], step: [8770], time: [2443.1973], loss: [0.00770427]
Epoch: [52], step: [8780], time: [2445.9220], loss: [0.00030762]
Epoch: [52], step: [8790], time: [2448.6041], loss: [0.00147302]
Epoch: [52], step: [8800], time: [2451.2540], loss: [0.00093156]
Epoch: [52], step: [8810], time: [2453.9177], loss: [0.00035774]
Epoch: [52], step: [8820], time: [2456.6047], loss: [0.00089207]
Epoch: [52], step: [8830], time: [2459.2742], loss: [0.00456953]
Epoch: [52], step: [8840], time: [2461.9517], loss: [0.00040236]
Epoch: [53], step: [8850], time: [2464.6312], loss: [0.00109148]
Epoch: [53], step: [8860], time: [2467.3111], loss: [0.00081010]
Epoch: [53], step: [8870], time: [2469.9750], loss: [0.00075121]
Epoch: [53], step: [8880], time: [2472.6196], loss: [0.00255907]
Epoch: [53], step: [8890], time: [2475.2511], loss: [0.00096061]
Epoch: [53], step: [8900], time: [2477.8899], loss: [0.00033346]
Epoch: [53], step: [8910], time: [2480.5748], loss: [0.00175626]
Epoch: [53], step: [8920], time: [2483.2324], loss: [0.00027418]
Epoch: [53], step: [8930], time: [2485.9055], loss: [0.00422176]
Epoch: [53], step: [8940], time: [2488.5420], loss: [0.00770427]
Epoch: [53], step: [8950], time: [2491.2867], loss: [0.00030762]
Epoch: [53], step: [8960], time: [2493.9531], loss: [0.00147302]
Epoch: [53], step: [8970], time: [2496.6411], loss: [0.00093156]
Epoch: [53], step: [8980], time: [2499.2966], loss: [0.00035774]
Epoch: [53], step: [8990], time: [2501.9502], loss: [0.00089207]
Epoch: [53], step: [9000], time: [2504.6042], loss: [0.00456953]
Epoch: [53], step: [9010], time: [2507.7166], loss: [0.00040236]
Epoch: [54], step: [9020], time: [2510.4201], loss: [0.00109148]
Epoch: [54], step: [9030], time: [2513.0932], loss: [0.00081010]
Epoch: [54], step: [9040], time: [2515.7752], loss: [0.00075121]
Epoch: [54], step: [9050], time: [2518.4646], loss: [0.00255907]
Epoch: [54], step: [9060], time: [2521.0997], loss: [0.00096061]
Epoch: [54], step: [9070], time: [2523.7643], loss: [0.00033346]
Epoch: [54], step: [9080], time: [2526.4230], loss: [0.00175626]
Epoch: [54], step: [9090], time: [2529.0918], loss: [0.00027418]
Epoch: [54], step: [9100], time: [2531.7609], loss: [0.00422176]
Epoch: [54], step: [9110], time: [2534.4146], loss: [0.00770427]
Epoch: [54], step: [9120], time: [2537.0624], loss: [0.00030762]
Epoch: [54], step: [9130], time: [2539.7174], loss: [0.00147302]
Epoch: [54], step: [9140], time: [2542.3709], loss: [0.00093156]
Epoch: [54], step: [9150], time: [2545.0189], loss: [0.00035774]
Epoch: [54], step: [9160], time: [2547.6805], loss: [0.00089207]
Epoch: [54], step: [9170], time: [2550.3510], loss: [0.00456953]
Epoch: [54], step: [9180], time: [2553.0821], loss: [0.00040236]
Epoch: [55], step: [9190], time: [2555.7381], loss: [0.00109148]
Epoch: [55], step: [9200], time: [2558.3941], loss: [0.00081010]
Epoch: [55], step: [9210], time: [2561.0629], loss: [0.00075121]
Epoch: [55], step: [9220], time: [2563.7169], loss: [0.00255907]
Epoch: [55], step: [9230], time: [2566.3766], loss: [0.00096061]
Epoch: [55], step: [9240], time: [2569.0463], loss: [0.00033346]
Epoch: [55], step: [9250], time: [2571.7056], loss: [0.00175626]
Epoch: [55], step: [9260], time: [2574.3516], loss: [0.00027418]
Epoch: [55], step: [9270], time: [2577.0321], loss: [0.00422176]
Epoch: [55], step: [9280], time: [2579.7281], loss: [0.00770427]
Epoch: [55], step: [9290], time: [2582.4030], loss: [0.00030762]
Epoch: [55], step: [9300], time: [2585.1054], loss: [0.00147302]
Epoch: [55], step: [9310], time: [2587.7928], loss: [0.00093156]
Epoch: [55], step: [9320], time: [2590.4716], loss: [0.00035774]
Epoch: [55], step: [9330], time: [2593.1402], loss: [0.00089207]
Epoch: [55], step: [9340], time: [2595.8094], loss: [0.00456953]
Epoch: [55], step: [9350], time: [2598.4700], loss: [0.00040236]
Epoch: [56], step: [9360], time: [2601.1125], loss: [0.00109148]
Epoch: [56], step: [9370], time: [2603.7814], loss: [0.00081010]
Epoch: [56], step: [9380], time: [2606.4488], loss: [0.00075121]
Epoch: [56], step: [9390], time: [2609.1188], loss: [0.00255907]
Epoch: [56], step: [9400], time: [2611.7733], loss: [0.00096061]
Epoch: [56], step: [9410], time: [2614.5520], loss: [0.00033346]
Epoch: [56], step: [9420], time: [2617.2129], loss: [0.00175626]
Epoch: [56], step: [9430], time: [2619.8738], loss: [0.00027418]
Epoch: [56], step: [9440], time: [2622.5297], loss: [0.00422176]
Epoch: [56], step: [9450], time: [2625.1783], loss: [0.00770427]
Epoch: [56], step: [9460], time: [2627.8641], loss: [0.00030762]
Epoch: [56], step: [9470], time: [2630.5146], loss: [0.00147301]
Epoch: [56], step: [9480], time: [2633.1654], loss: [0.00093156]
Epoch: [56], step: [9490], time: [2635.8333], loss: [0.00035774]
Epoch: [56], step: [9500], time: [2638.5231], loss: [0.00089207]
Epoch: [56], step: [9510], time: [2641.5962], loss: [0.00456952]
Epoch: [56], step: [9520], time: [2644.2604], loss: [0.00040236]
Epoch: [57], step: [9530], time: [2646.9219], loss: [0.00109148]
Epoch: [57], step: [9540], time: [2649.6117], loss: [0.00081010]
Epoch: [57], step: [9550], time: [2652.2973], loss: [0.00075121]
Epoch: [57], step: [9560], time: [2654.9737], loss: [0.00255907]
Epoch: [57], step: [9570], time: [2657.6399], loss: [0.00096061]
Epoch: [57], step: [9580], time: [2660.3003], loss: [0.00033346]
Epoch: [57], step: [9590], time: [2663.0122], loss: [0.00175626]
Epoch: [57], step: [9600], time: [2665.6642], loss: [0.00027418]
Epoch: [57], step: [9610], time: [2668.3376], loss: [0.00422176]
Epoch: [57], step: [9620], time: [2671.0117], loss: [0.00770427]
Epoch: [57], step: [9630], time: [2673.7188], loss: [0.00030762]
Epoch: [57], step: [9640], time: [2676.4172], loss: [0.00147301]
Epoch: [57], step: [9650], time: [2679.0926], loss: [0.00093156]
Epoch: [57], step: [9660], time: [2681.7399], loss: [0.00035774]
Epoch: [57], step: [9670], time: [2684.4139], loss: [0.00089206]
Epoch: [57], step: [9680], time: [2687.0756], loss: [0.00456952]
Epoch: [57], step: [9690], time: [2689.7218], loss: [0.00040236]
Epoch: [58], step: [9700], time: [2692.3802], loss: [0.00109148]
Epoch: [58], step: [9710], time: [2695.0472], loss: [0.00081010]
Epoch: [58], step: [9720], time: [2697.7222], loss: [0.00075121]
Epoch: [58], step: [9730], time: [2700.3767], loss: [0.00255907]
Epoch: [58], step: [9740], time: [2703.0417], loss: [0.00096061]
Epoch: [58], step: [9750], time: [2705.7158], loss: [0.00033346]
Epoch: [58], step: [9760], time: [2708.3699], loss: [0.00175626]
Epoch: [58], step: [9770], time: [2711.0378], loss: [0.00027418]
Epoch: [58], step: [9780], time: [2713.6894], loss: [0.00422176]
Epoch: [58], step: [9790], time: [2716.3534], loss: [0.00770427]
Epoch: [58], step: [9800], time: [2719.0570], loss: [0.00030762]
Epoch: [58], step: [9810], time: [2721.7788], loss: [0.00147301]
Epoch: [58], step: [9820], time: [2724.4613], loss: [0.00093156]
Epoch: [58], step: [9830], time: [2727.1407], loss: [0.00035774]
Epoch: [58], step: [9840], time: [2729.8710], loss: [0.00089206]
Epoch: [58], step: [9850], time: [2732.5505], loss: [0.00456952]
Epoch: [58], step: [9860], time: [2735.2878], loss: [0.00040236]
Epoch: [59], step: [9870], time: [2737.9572], loss: [0.00109148]
Epoch: [59], step: [9880], time: [2740.5971], loss: [0.00081010]
Epoch: [59], step: [9890], time: [2743.2527], loss: [0.00075121]
Epoch: [59], step: [9900], time: [2745.9052], loss: [0.00255907]
Epoch: [59], step: [9910], time: [2748.5751], loss: [0.00096061]
Epoch: [59], step: [9920], time: [2751.2252], loss: [0.00033346]
Epoch: [59], step: [9930], time: [2753.8573], loss: [0.00175626]
Epoch: [59], step: [9940], time: [2756.5079], loss: [0.00027418]
Epoch: [59], step: [9950], time: [2759.1748], loss: [0.00422176]
Epoch: [59], step: [9960], time: [2761.8313], loss: [0.00770427]
Epoch: [59], step: [9970], time: [2764.4770], loss: [0.00030762]
Epoch: [59], step: [9980], time: [2767.1381], loss: [0.00147301]
Epoch: [59], step: [9990], time: [2769.7977], loss: [0.00093156]
Epoch: [59], step: [10000], time: [2772.4687], loss: [0.00035774]