-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathtry1.rtf
11432 lines (11431 loc) · 221 KB
/
try1.rtf
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
{\rtf1\ansi\ansicpg936\cocoartf2636
\cocoatextscaling0\cocoaplatform0{\fonttbl\f0\fnil\fcharset0 HelveticaNeue;\f1\fnil\fcharset134 PingFangSC-Regular;}
{\colortbl;\red255\green255\blue255;\red255\green255\blue255;\red0\green0\blue0;}
{\*\expandedcolortbl;;\cssrgb\c100000\c100000\c100000;\cssrgb\c0\c0\c0;}
\paperw11900\paperh16840\margl1440\margr1440\vieww11520\viewh8400\viewkind0
\deftab720
\pard\pardeftab720\partightenfactor0
\f0\fs28 \cf0 \cb2 \expnd0\expndtw0\kerning0
\outl0\strokewidth0 \strokec3 Epoch:
\f1 [
\f0 1
\f1 ][
\f0 0/2860
\f1 ]
\f0 Elapsed 0m 2s (remain 98m 10s) Loss: 0.6108(0.6108) Grad: inf LR: 0.00002000 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 10/2860
\f1 ]
\f0 Elapsed 0m 10s (remain 43m 34s) Loss: 0.0913(0.3740) Grad: 1953.4050 LR: 0.00002000 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 20/2860
\f1 ]
\f0 Elapsed 0m 18s (remain 41m 27s) Loss: 0.0386(0.2278) Grad: 717.4629 LR: 0.00002000 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 30/2860
\f1 ]
\f0 Elapsed 0m 26s (remain 40m 30s) Loss: 0.0744(0.1779) Grad: 2012.9658 LR: 0.00002000 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 40/2860
\f1 ]
\f0 Elapsed 0m 34s (remain 39m 54s) Loss: 0.0391(0.1488) Grad: 3234.1128 LR: 0.00002000 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 50/2860
\f1 ]
\f0 Elapsed 0m 43s (remain 39m 30s) Loss: 0.0970(0.1268) Grad: 4354.9707 LR: 0.00002000 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 60/2860
\f1 ]
\f0 Elapsed 0m 51s (remain 39m 16s) Loss: 0.0063(0.1119) Grad: 743.3780 LR: 0.00002000 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 70/2860
\f1 ]
\f0 Elapsed 0m 59s (remain 39m 0s) Loss: 0.1378(0.1030) Grad: 6307.5220 LR: 0.00002000 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 80/2860
\f1 ]
\f0 Elapsed 1m 7s (remain 38m 45s) Loss: 0.0121(0.0949) Grad: 1953.7349 LR: 0.00002000 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 90/2860
\f1 ]
\f0 Elapsed 1m 16s (remain 38m 32s) Loss: 0.0179(0.0874) Grad: 4272.2188 LR: 0.00002000 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 100/2860
\f1 ]
\f0 Elapsed 1m 24s (remain 38m 23s) Loss: 0.0359(0.0818) Grad: 1267.7244 LR: 0.00002000 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 110/2860
\f1 ]
\f0 Elapsed 1m 32s (remain 38m 11s) Loss: 0.0354(0.0796) Grad: 8002.2876 LR: 0.00002000 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 120/2860
\f1 ]
\f0 Elapsed 1m 40s (remain 38m 0s) Loss: 0.0486(0.0775) Grad: 3616.9944 LR: 0.00002000 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 130/2860
\f1 ]
\f0 Elapsed 1m 48s (remain 37m 49s) Loss: 0.0577(0.0740) Grad: 29742.5234 LR: 0.00002000 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 140/2860
\f1 ]
\f0 Elapsed 1m 57s (remain 37m 40s) Loss: 0.0072(0.0709) Grad: 962.4625 LR: 0.00002000 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 150/2860
\f1 ]
\f0 Elapsed 2m 5s (remain 37m 30s) Loss: 0.0319(0.0692) Grad: 1483.0662 LR: 0.00001999 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 160/2860
\f1 ]
\f0 Elapsed 2m 13s (remain 37m 20s) Loss: 0.0194(0.0674) Grad: 1716.7446 LR: 0.00001999 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 170/2860
\f1 ]
\f0 Elapsed 2m 21s (remain 37m 10s) Loss: 0.0101(0.0650) Grad: 1321.3226 LR: 0.00001999 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 180/2860
\f1 ]
\f0 Elapsed 2m 30s (remain 37m 2s) Loss: 0.0127(0.0642) Grad: 1682.9147 LR: 0.00001999 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 190/2860
\f1 ]
\f0 Elapsed 2m 38s (remain 36m 52s) Loss: 0.0258(0.0632) Grad: 2915.6426 LR: 0.00001999 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 200/2860
\f1 ]
\f0 Elapsed 2m 46s (remain 36m 43s) Loss: 0.0031(0.0611) Grad: 524.8220 LR: 0.00001999 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 210/2860
\f1 ]
\f0 Elapsed 2m 54s (remain 36m 34s) Loss: 0.0209(0.0596) Grad: 5533.0649 LR: 0.00001999 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 220/2860
\f1 ]
\f0 Elapsed 3m 3s (remain 36m 25s) Loss: 0.0138(0.0581) Grad: 1845.1012 LR: 0.00001999 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 230/2860
\f1 ]
\f0 Elapsed 3m 11s (remain 36m 16s) Loss: 0.0153(0.0568) Grad: 1827.6858 LR: 0.00001999 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 240/2860
\f1 ]
\f0 Elapsed 3m 19s (remain 36m 7s) Loss: 0.0278(0.0554) Grad: 6372.4619 LR: 0.00001999 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 250/2860
\f1 ]
\f0 Elapsed 3m 27s (remain 35m 58s) Loss: 0.0173(0.0543) Grad: 3333.4895 LR: 0.00001998 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 260/2860
\f1 ]
\f0 Elapsed 3m 35s (remain 35m 50s) Loss: 0.0303(0.0543) Grad: 2552.7419 LR: 0.00001998 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 270/2860
\f1 ]
\f0 Elapsed 3m 44s (remain 35m 41s) Loss: 0.0285(0.0532) Grad: 4873.1392 LR: 0.00001998 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 280/2860
\f1 ]
\f0 Elapsed 3m 52s (remain 35m 32s) Loss: 0.0538(0.0526) Grad: 3953.9246 LR: 0.00001998 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 290/2860
\f1 ]
\f0 Elapsed 4m 0s (remain 35m 23s) Loss: 0.0212(0.0515) Grad: 2318.3091 LR: 0.00001998 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 300/2860
\f1 ]
\f0 Elapsed 4m 8s (remain 35m 15s) Loss: 0.0078(0.0505) Grad: 1034.7826 LR: 0.00001998 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 310/2860
\f1 ]
\f0 Elapsed 4m 17s (remain 35m 6s) Loss: 0.0179(0.0494) Grad: 2621.5688 LR: 0.00001998 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 320/2860
\f1 ]
\f0 Elapsed 4m 25s (remain 34m 57s) Loss: 0.0355(0.0490) Grad: 15161.8555 LR: 0.00001998 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 330/2860
\f1 ]
\f0 Elapsed 4m 33s (remain 34m 49s) Loss: 0.0130(0.0482) Grad: 1883.4728 LR: 0.00001997 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 340/2860
\f1 ]
\f0 Elapsed 4m 41s (remain 34m 40s) Loss: 0.0034(0.0472) Grad: 559.2449 LR: 0.00001997 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 350/2860
\f1 ]
\f0 Elapsed 4m 49s (remain 34m 32s) Loss: 0.0212(0.0469) Grad: 4445.6372 LR: 0.00001997 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 360/2860
\f1 ]
\f0 Elapsed 4m 58s (remain 34m 23s) Loss: 0.0320(0.0466) Grad: 3716.6516 LR: 0.00001997 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 370/2860
\f1 ]
\f0 Elapsed 5m 6s (remain 34m 15s) Loss: 0.1024(0.0463) Grad: 8502.2168 LR: 0.00001997 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 380/2860
\f1 ]
\f0 Elapsed 5m 14s (remain 34m 7s) Loss: 0.0023(0.0455) Grad: 658.9265 LR: 0.00001996 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 390/2860
\f1 ]
\f0 Elapsed 5m 22s (remain 33m 58s) Loss: 0.0079(0.0449) Grad: 513.9031 LR: 0.00001996 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 400/2860
\f1 ]
\f0 Elapsed 5m 31s (remain 33m 49s) Loss: 0.0150(0.0442) Grad: 2149.3130 LR: 0.00001996 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 410/2860
\f1 ]
\f0 Elapsed 5m 39s (remain 33m 41s) Loss: 0.0170(0.0436) Grad: 1606.3003 LR: 0.00001996 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 420/2860
\f1 ]
\f0 Elapsed 5m 47s (remain 33m 32s) Loss: 0.0106(0.0429) Grad: 2211.8186 LR: 0.00001996 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 430/2860
\f1 ]
\f0 Elapsed 5m 55s (remain 33m 24s) Loss: 0.0380(0.0426) Grad: 2610.4500 LR: 0.00001996 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 440/2860
\f1 ]
\f0 Elapsed 6m 3s (remain 33m 15s) Loss: 0.0129(0.0419) Grad: 2109.6521 LR: 0.00001995 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 450/2860
\f1 ]
\f0 Elapsed 6m 12s (remain 33m 7s) Loss: 0.0172(0.0415) Grad: 1686.4252 LR: 0.00001995 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 460/2860
\f1 ]
\f0 Elapsed 6m 20s (remain 32m 59s) Loss: 0.0128(0.0412) Grad: 2220.1482 LR: 0.00001995 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 470/2860
\f1 ]
\f0 Elapsed 6m 28s (remain 32m 50s) Loss: 0.0103(0.0407) Grad: 4506.2886 LR: 0.00001995 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 480/2860
\f1 ]
\f0 Elapsed 6m 36s (remain 32m 42s) Loss: 0.0290(0.0402) Grad: 3401.6304 LR: 0.00001994 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 490/2860
\f1 ]
\f0 Elapsed 6m 44s (remain 32m 33s) Loss: 0.0301(0.0401) Grad: 3654.3191 LR: 0.00001994 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 500/2860
\f1 ]
\f0 Elapsed 6m 53s (remain 32m 25s) Loss: 0.0392(0.0397) Grad: 5773.6265 LR: 0.00001994 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 510/2860
\f1 ]
\f0 Elapsed 7m 1s (remain 32m 16s) Loss: 0.0084(0.0392) Grad: 1069.5203 LR: 0.00001994 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 520/2860
\f1 ]
\f0 Elapsed 7m 9s (remain 32m 8s) Loss: 0.0087(0.0391) Grad: 2918.5266 LR: 0.00001993 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 530/2860
\f1 ]
\f0 Elapsed 7m 17s (remain 31m 59s) Loss: 0.0047(0.0386) Grad: 1480.8824 LR: 0.00001993 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 540/2860
\f1 ]
\f0 Elapsed 7m 25s (remain 31m 51s) Loss: 0.0028(0.0382) Grad: 992.0798 LR: 0.00001993 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 550/2860
\f1 ]
\f0 Elapsed 7m 34s (remain 31m 43s) Loss: 0.0009(0.0379) Grad: 239.5064 LR: 0.00001993 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 560/2860
\f1 ]
\f0 Elapsed 7m 42s (remain 31m 34s) Loss: 0.0424(0.0376) Grad: 4803.5566 LR: 0.00001992 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 570/2860
\f1 ]
\f0 Elapsed 7m 50s (remain 31m 26s) Loss: 0.0045(0.0376) Grad: 467.7649 LR: 0.00001992 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 580/2860
\f1 ]
\f0 Elapsed 7m 58s (remain 31m 18s) Loss: 0.0068(0.0373) Grad: 1227.2766 LR: 0.00001992 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 590/2860
\f1 ]
\f0 Elapsed 8m 6s (remain 31m 9s) Loss: 0.1785(0.0372) Grad: 4308.8389 LR: 0.00001992 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 600/2860
\f1 ]
\f0 Elapsed 8m 15s (remain 31m 1s) Loss: 0.0249(0.0368) Grad: 1280.4293 LR: 0.00001991 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 610/2860
\f1 ]
\f0 Elapsed 8m 23s (remain 30m 52s) Loss: 0.0028(0.0367) Grad: 442.7398 LR: 0.00001991 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 620/2860
\f1 ]
\f0 Elapsed 8m 31s (remain 30m 44s) Loss: 0.0065(0.0365) Grad: 2247.6897 LR: 0.00001991 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 630/2860
\f1 ]
\f0 Elapsed 8m 39s (remain 30m 36s) Loss: 0.0032(0.0363) Grad: 367.5108 LR: 0.00001990 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 640/2860
\f1 ]
\f0 Elapsed 8m 48s (remain 30m 28s) Loss: 0.0469(0.0362) Grad: 2204.7693 LR: 0.00001990 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 650/2860
\f1 ]
\f0 Elapsed 8m 56s (remain 30m 19s) Loss: 0.0120(0.0359) Grad: 2449.3621 LR: 0.00001990 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 660/2860
\f1 ]
\f0 Elapsed 9m 4s (remain 30m 11s) Loss: 0.0012(0.0355) Grad: 144.1304 LR: 0.00001989 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 670/2860
\f1 ]
\f0 Elapsed 9m 12s (remain 30m 3s) Loss: 0.0340(0.0352) Grad: 2512.0864 LR: 0.00001989 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 680/2860
\f1 ]
\f0 Elapsed 9m 20s (remain 29m 54s) Loss: 0.0069(0.0351) Grad: 1396.6794 LR: 0.00001989 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 690/2860
\f1 ]
\f0 Elapsed 9m 29s (remain 29m 46s) Loss: 0.0035(0.0350) Grad: 533.8792 LR: 0.00001988 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 700/2860
\f1 ]
\f0 Elapsed 9m 37s (remain 29m 38s) Loss: 0.0029(0.0347) Grad: 985.9089 LR: 0.00001988 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 710/2860
\f1 ]
\f0 Elapsed 9m 45s (remain 29m 29s) Loss: 0.0073(0.0344) Grad: 1609.0620 LR: 0.00001988 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 720/2860
\f1 ]
\f0 Elapsed 9m 53s (remain 29m 21s) Loss: 0.0134(0.0342) Grad: 2848.2502 LR: 0.00001987 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 730/2860
\f1 ]
\f0 Elapsed 10m 1s (remain 29m 13s) Loss: 0.0287(0.0338) Grad: 4409.4678 LR: 0.00001987 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 740/2860
\f1 ]
\f0 Elapsed 10m 10s (remain 29m 5s) Loss: 0.1185(0.0337) Grad: 11977.6562 LR: 0.00001987 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 750/2860
\f1 ]
\f0 Elapsed 10m 18s (remain 28m 56s) Loss: 0.0058(0.0334) Grad: 1422.9092 LR: 0.00001986 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 760/2860
\f1 ]
\f0 Elapsed 10m 26s (remain 28m 48s) Loss: 0.0165(0.0332) Grad: 4086.7908 LR: 0.00001986 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 770/2860
\f1 ]
\f0 Elapsed 10m 34s (remain 28m 40s) Loss: 0.0894(0.0330) Grad: 17464.1582 LR: 0.00001986 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 780/2860
\f1 ]
\f0 Elapsed 10m 43s (remain 28m 31s) Loss: 0.0009(0.0327) Grad: 329.0542 LR: 0.00001985 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 790/2860
\f1 ]
\f0 Elapsed 10m 51s (remain 28m 23s) Loss: 0.0114(0.0327) Grad: 923.8387 LR: 0.00001985 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 800/2860
\f1 ]
\f0 Elapsed 10m 59s (remain 28m 15s) Loss: 0.0036(0.0325) Grad: 455.6085 LR: 0.00001985 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 810/2860
\f1 ]
\f0 Elapsed 11m 7s (remain 28m 6s) Loss: 0.0046(0.0324) Grad: 503.9062 LR: 0.00001984 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 820/2860
\f1 ]
\f0 Elapsed 11m 15s (remain 27m 58s) Loss: 0.0028(0.0324) Grad: 337.9487 LR: 0.00001984 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 830/2860
\f1 ]
\f0 Elapsed 11m 24s (remain 27m 50s) Loss: 0.0130(0.0322) Grad: 1441.8400 LR: 0.00001983 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 840/2860
\f1 ]
\f0 Elapsed 11m 32s (remain 27m 42s) Loss: 0.0029(0.0321) Grad: 3393.6799 LR: 0.00001983 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 850/2860
\f1 ]
\f0 Elapsed 11m 40s (remain 27m 33s) Loss: 0.0506(0.0321) Grad: 4324.2124 LR: 0.00001983 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 860/2860
\f1 ]
\f0 Elapsed 11m 48s (remain 27m 25s) Loss: 0.0078(0.0318) Grad: 803.2009 LR: 0.00001982 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 870/2860
\f1 ]
\f0 Elapsed 11m 57s (remain 27m 17s) Loss: 0.0453(0.0316) Grad: 8595.1201 LR: 0.00001982 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 880/2860
\f1 ]
\f0 Elapsed 12m 5s (remain 27m 9s) Loss: 0.0259(0.0314) Grad: 840.5153 LR: 0.00001981 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 890/2860
\f1 ]
\f0 Elapsed 12m 13s (remain 27m 0s) Loss: 0.0277(0.0314) Grad: 3066.1685 LR: 0.00001981 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 900/2860
\f1 ]
\f0 Elapsed 12m 21s (remain 26m 52s) Loss: 0.0013(0.0313) Grad: 293.5524 LR: 0.00001980 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 910/2860
\f1 ]
\f0 Elapsed 12m 29s (remain 26m 44s) Loss: 0.0053(0.0311) Grad: 587.1148 LR: 0.00001980 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 920/2860
\f1 ]
\f0 Elapsed 12m 38s (remain 26m 35s) Loss: 0.0158(0.0311) Grad: 1723.9363 LR: 0.00001980 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 930/2860
\f1 ]
\f0 Elapsed 12m 46s (remain 26m 27s) Loss: 0.0006(0.0310) Grad: 92.0069 LR: 0.00001979 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 940/2860
\f1 ]
\f0 Elapsed 12m 54s (remain 26m 19s) Loss: 0.0114(0.0308) Grad: 1010.4116 LR: 0.00001979 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 950/2860
\f1 ]
\f0 Elapsed 13m 2s (remain 26m 11s) Loss: 0.0070(0.0307) Grad: 3127.9939 LR: 0.00001978 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 960/2860
\f1 ]
\f0 Elapsed 13m 10s (remain 26m 2s) Loss: 0.0107(0.0305) Grad: 1645.5048 LR: 0.00001978 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 970/2860
\f1 ]
\f0 Elapsed 13m 19s (remain 25m 54s) Loss: 0.0754(0.0304) Grad: 2343.7942 LR: 0.00001977 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 980/2860
\f1 ]
\f0 Elapsed 13m 27s (remain 25m 46s) Loss: 0.0076(0.0304) Grad: 615.5984 LR: 0.00001977 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 990/2860
\f1 ]
\f0 Elapsed 13m 35s (remain 25m 38s) Loss: 0.0597(0.0303) Grad: 4912.3364 LR: 0.00001976 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1000/2860
\f1 ]
\f0 Elapsed 13m 43s (remain 25m 29s) Loss: 0.0270(0.0302) Grad: 1651.0914 LR: 0.00001976 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1010/2860
\f1 ]
\f0 Elapsed 13m 52s (remain 25m 21s) Loss: 0.0276(0.0300) Grad: 3186.9771 LR: 0.00001975 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1020/2860
\f1 ]
\f0 Elapsed 14m 0s (remain 25m 13s) Loss: 0.1851(0.0303) Grad: 9821.4199 LR: 0.00001975 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1030/2860
\f1 ]
\f0 Elapsed 14m 8s (remain 25m 5s) Loss: 0.0341(0.0301) Grad: 2006.6206 LR: 0.00001974 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1040/2860
\f1 ]
\f0 Elapsed 14m 16s (remain 24m 56s) Loss: 0.0111(0.0300) Grad: 3040.7998 LR: 0.00001974 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1050/2860
\f1 ]
\f0 Elapsed 14m 24s (remain 24m 48s) Loss: 0.0131(0.0298) Grad: 1372.5095 LR: 0.00001973 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1060/2860
\f1 ]
\f0 Elapsed 14m 33s (remain 24m 40s) Loss: 0.0034(0.0296) Grad: 695.5359 LR: 0.00001973 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1070/2860
\f1 ]
\f0 Elapsed 14m 41s (remain 24m 32s) Loss: 0.0154(0.0295) Grad: 3165.1919 LR: 0.00001972 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1080/2860
\f1 ]
\f0 Elapsed 14m 49s (remain 24m 23s) Loss: 0.0008(0.0296) Grad: 88.8649 LR: 0.00001972 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1090/2860
\f1 ]
\f0 Elapsed 14m 57s (remain 24m 15s) Loss: 0.0477(0.0295) Grad: 1907.8783 LR: 0.00001971 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1100/2860
\f1 ]
\f0 Elapsed 15m 5s (remain 24m 7s) Loss: 0.0055(0.0293) Grad: 939.3925 LR: 0.00001971 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1110/2860
\f1 ]
\f0 Elapsed 15m 14s (remain 23m 59s) Loss: 0.0058(0.0294) Grad: 1977.2729 LR: 0.00001970 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1120/2860
\f1 ]
\f0 Elapsed 15m 22s (remain 23m 50s) Loss: 0.0055(0.0293) Grad: 2691.3228 LR: 0.00001970 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1130/2860
\f1 ]
\f0 Elapsed 15m 30s (remain 23m 42s) Loss: 0.0563(0.0292) Grad: 5906.4097 LR: 0.00001969 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1140/2860
\f1 ]
\f0 Elapsed 15m 38s (remain 23m 34s) Loss: 0.0094(0.0291) Grad: 831.8715 LR: 0.00001969 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1150/2860
\f1 ]
\f0 Elapsed 15m 47s (remain 23m 26s) Loss: 0.0067(0.0290) Grad: 973.6745 LR: 0.00001968 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1160/2860
\f1 ]
\f0 Elapsed 15m 55s (remain 23m 17s) Loss: 0.0006(0.0288) Grad: 385.2322 LR: 0.00001968 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1170/2860
\f1 ]
\f0 Elapsed 16m 3s (remain 23m 9s) Loss: 0.0570(0.0287) Grad: 1406.4912 LR: 0.00001967 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1180/2860
\f1 ]
\f0 Elapsed 16m 11s (remain 23m 1s) Loss: 0.0117(0.0287) Grad: 979.5421 LR: 0.00001967 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1190/2860
\f1 ]
\f0 Elapsed 16m 19s (remain 22m 53s) Loss: 0.0185(0.0286) Grad: 4003.3977 LR: 0.00001966 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1200/2860
\f1 ]
\f0 Elapsed 16m 28s (remain 22m 44s) Loss: 0.0005(0.0285) Grad: 101.4013 LR: 0.00001965 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1210/2860
\f1 ]
\f0 Elapsed 16m 36s (remain 22m 36s) Loss: 0.0055(0.0284) Grad: 771.5208 LR: 0.00001965 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1220/2860
\f1 ]
\f0 Elapsed 16m 44s (remain 22m 28s) Loss: 0.0226(0.0282) Grad: 1794.1139 LR: 0.00001964 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1230/2860
\f1 ]
\f0 Elapsed 16m 52s (remain 22m 20s) Loss: 0.0079(0.0281) Grad: 1655.1674 LR: 0.00001964 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1240/2860
\f1 ]
\f0 Elapsed 17m 0s (remain 22m 11s) Loss: 0.0226(0.0280) Grad: 1514.9624 LR: 0.00001963 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1260/2860
\f1 ]
\f0 Elapsed 17m 17s (remain 21m 55s) Loss: 0.0089(0.0279) Grad: 1242.8691 LR: 0.00001962 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1270/2860
\f1 ]
\f0 Elapsed 17m 25s (remain 21m 47s) Loss: 0.0054(0.0280) Grad: 914.6548 LR: 0.00001961 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1280/2860
\f1 ]
\f0 Elapsed 17m 33s (remain 21m 39s) Loss: 0.0609(0.0279) Grad: 4280.1626 LR: 0.00001961 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1290/2860
\f1 ]
\f0 Elapsed 17m 42s (remain 21m 30s) Loss: 0.0059(0.0279) Grad: 663.1463 LR: 0.00001960 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1300/2860
\f1 ]
\f0 Elapsed 17m 50s (remain 21m 22s) Loss: 0.0029(0.0278) Grad: 1852.0331 LR: 0.00001959 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1310/2860
\f1 ]
\f0 Elapsed 17m 58s (remain 21m 14s) Loss: 0.0043(0.0277) Grad: 2112.5723 LR: 0.00001959 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1330/2860
\f1 ]
\f0 Elapsed 18m 14s (remain 20m 57s) Loss: 0.0115(0.0275) Grad: 692.4731 LR: 0.00001958 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1340/2860
\f1 ]
\f0 Elapsed 18m 23s (remain 20m 49s) Loss: 0.0108(0.0275) Grad: 973.9722 LR: 0.00001957 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1350/2860
\f1 ]
\f0 Elapsed 18m 31s (remain 20m 41s) Loss: 0.0058(0.0274) Grad: 970.1072 LR: 0.00001956 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1360/2860
\f1 ]
\f0 Elapsed 18m 39s (remain 20m 33s) Loss: 0.0267(0.0274) Grad: 2706.7607 LR: 0.00001956 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1370/2860
\f1 ]
\f0 Elapsed 18m 47s (remain 20m 24s) Loss: 0.0036(0.0272) Grad: 736.9479 LR: 0.00001955 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1380/2860
\f1 ]
\f0 Elapsed 18m 55s (remain 20m 16s) Loss: 0.1394(0.0274) Grad: 6614.6201 LR: 0.00001954 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1390/2860
\f1 ]
\f0 Elapsed 19m 4s (remain 20m 8s) Loss: 0.0017(0.0272) Grad: 460.9350 LR: 0.00001954 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1400/2860
\f1 ]
\f0 Elapsed 19m 12s (remain 19m 59s) Loss: 0.0710(0.0271) Grad: 2077.4055 LR: 0.00001953 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1410/2860
\f1 ]
\f0 Elapsed 19m 20s (remain 19m 51s) Loss: 0.0051(0.0271) Grad: 1014.3798 LR: 0.00001952 \
Epoch:
\f1 [
\f0 1
\f1 ][
\f0 1420/2860
\f1 ]
\f0 Elapsed 19m 28s (remain 19m 43s) Loss: 0.0247(0.0270) Grad: 1742.2474 LR: 0.00001952 \
Epoch:
\f1 [
\f0 1
\f1 ][