diff --git "a/training.log" "b/training.log" --- "a/training.log" +++ "b/training.log" @@ -1,2170 +1,2188 @@ -2019-08-08 15:20:41,997 ---------------------------------------------------------------------------------------------------- -2019-08-08 15:20:41,998 Model: "SequenceTagger( +2023-04-05 22:30:15,038 ---------------------------------------------------------------------------------------------------- +2023-04-05 22:30:15,038 Model: "SequenceTagger( (embeddings): StackedEmbeddings( - (list_embedding_0): WordEmbeddings('en-crawl') + (list_embedding_0): WordEmbeddings( + 'en-crawl' + (embedding): Embedding(1000001, 300) + ) (list_embedding_1): FlairEmbeddings( (lm): LanguageModel( - (drop): Dropout(p=0.05) + (drop): Dropout(p=0.05, inplace=False) (encoder): Embedding(300, 100) (rnn): LSTM(100, 2048) - (decoder): Linear(in_features=2048, out_features=300, bias=True) ) ) (list_embedding_2): FlairEmbeddings( (lm): LanguageModel( - (drop): Dropout(p=0.05) + (drop): Dropout(p=0.05, inplace=False) (encoder): Embedding(300, 100) (rnn): LSTM(100, 2048) - (decoder): Linear(in_features=2048, out_features=300, bias=True) ) ) ) (word_dropout): WordDropout(p=0.05) (locked_dropout): LockedDropout(p=0.5) (embedding2nn): Linear(in_features=4396, out_features=4396, bias=True) - (rnn): LSTM(4396, 256, bidirectional=True) - (linear): Linear(in_features=512, out_features=76, bias=True) + (rnn): LSTM(4396, 256, batch_first=True, bidirectional=True) + (linear): Linear(in_features=512, out_features=75, bias=True) + (loss_function): ViterbiLoss() + (crf): CRF() )" -2019-08-08 15:20:42,001 ---------------------------------------------------------------------------------------------------- -2019-08-08 15:20:42,001 Corpus: "Corpus: 75187 train + 9603 dev + 9479 test sentences" -2019-08-08 15:20:42,001 ---------------------------------------------------------------------------------------------------- -2019-08-08 15:20:42,001 Parameters: -2019-08-08 15:20:42,002 - learning_rate: "0.1" -2019-08-08 15:20:42,002 - mini_batch_size: "32" -2019-08-08 15:20:42,002 - patience: "3" -2019-08-08 15:20:42,002 - anneal_factor: "0.5" -2019-08-08 15:20:42,003 - max_epochs: "150" -2019-08-08 15:20:42,003 - shuffle: "True" -2019-08-08 15:20:42,003 - train_with_dev: "True" -2019-08-08 15:20:42,003 ---------------------------------------------------------------------------------------------------- -2019-08-08 15:20:42,003 Model training base path: "resources/taggers/release-ner-ontonotes-0" -2019-08-08 15:20:42,004 ---------------------------------------------------------------------------------------------------- -2019-08-08 15:20:42,004 Device: cuda:0 -2019-08-08 15:20:42,004 ---------------------------------------------------------------------------------------------------- -2019-08-08 15:20:42,004 Embeddings storage mode: cpu -2019-08-08 15:20:42,006 ---------------------------------------------------------------------------------------------------- -2019-08-08 15:20:42,706 epoch 1 - iter 0/2650 - loss 90.75070953 throughput (samples/sec): 12245.95 -2019-08-08 15:25:11,326 epoch 1 - iter 265/2650 - loss 8.05192522 throughput (samples/sec): 31.58 -2019-08-08 15:28:29,918 epoch 1 - iter 530/2650 - loss 5.74790360 throughput (samples/sec): 42.71 -2019-08-08 15:30:53,752 epoch 1 - iter 795/2650 - loss 4.73484335 throughput (samples/sec): 58.98 -2019-08-08 15:33:12,907 epoch 1 - iter 1060/2650 - loss 4.16465857 throughput (samples/sec): 60.96 -2019-08-08 15:35:42,668 epoch 1 - iter 1325/2650 - loss 3.75189948 throughput (samples/sec): 56.64 -2019-08-08 15:38:05,267 epoch 1 - iter 1590/2650 - loss 3.48626362 throughput (samples/sec): 59.49 -2019-08-08 15:41:12,107 epoch 1 - iter 1855/2650 - loss 3.25458774 throughput (samples/sec): 45.40 -2019-08-08 15:45:10,586 epoch 1 - iter 2120/2650 - loss 3.08264929 throughput (samples/sec): 35.57 -2019-08-08 15:47:42,241 epoch 1 - iter 2385/2650 - loss 2.93271476 throughput (samples/sec): 55.93 -2019-08-08 15:49:53,578 ---------------------------------------------------------------------------------------------------- -2019-08-08 15:49:53,578 EPOCH 1 done: loss 2.8082 - lr 0.1000 -2019-08-08 15:49:53,578 BAD EPOCHS (no improvement): 0 -2019-08-08 15:49:53,579 ---------------------------------------------------------------------------------------------------- -2019-08-08 15:49:54,027 epoch 2 - iter 0/2650 - loss 1.08342016 throughput (samples/sec): 19119.22 -2019-08-08 15:51:19,359 epoch 2 - iter 265/2650 - loss 1.54061787 throughput (samples/sec): 99.43 -2019-08-08 15:53:07,575 epoch 2 - iter 530/2650 - loss 1.53140490 throughput (samples/sec): 78.39 -2019-08-08 15:54:51,548 epoch 2 - iter 795/2650 - loss 1.51926253 throughput (samples/sec): 81.59 -2019-08-08 15:56:38,658 epoch 2 - iter 1060/2650 - loss 1.49826083 throughput (samples/sec): 79.20 -2019-08-08 15:58:25,200 epoch 2 - iter 1325/2650 - loss 1.48544577 throughput (samples/sec): 79.63 -2019-08-08 16:00:11,584 epoch 2 - iter 1590/2650 - loss 1.46933582 throughput (samples/sec): 79.74 -2019-08-08 16:01:55,473 epoch 2 - iter 1855/2650 - loss 1.45738936 throughput (samples/sec): 81.66 -2019-08-08 16:03:44,081 epoch 2 - iter 2120/2650 - loss 1.43893822 throughput (samples/sec): 78.11 -2019-08-08 16:05:30,366 epoch 2 - iter 2385/2650 - loss 1.42155793 throughput (samples/sec): 79.82 -2019-08-08 16:07:19,187 ---------------------------------------------------------------------------------------------------- -2019-08-08 16:07:19,187 EPOCH 2 done: loss 1.4068 - lr 0.1000 -2019-08-08 16:07:19,187 BAD EPOCHS (no improvement): 0 -2019-08-08 16:07:19,188 ---------------------------------------------------------------------------------------------------- -2019-08-08 16:07:19,618 epoch 3 - iter 0/2650 - loss 1.58778930 throughput (samples/sec): 19865.91 -2019-08-08 16:09:06,986 epoch 3 - iter 265/2650 - loss 1.16421955 throughput (samples/sec): 79.05 -2019-08-08 16:10:53,634 epoch 3 - iter 530/2650 - loss 1.20188002 throughput (samples/sec): 79.55 -2019-08-08 16:12:41,733 epoch 3 - iter 795/2650 - loss 1.19425702 throughput (samples/sec): 78.48 -2019-08-08 16:14:24,681 epoch 3 - iter 1060/2650 - loss 1.17431878 throughput (samples/sec): 82.40 -2019-08-08 16:16:11,359 epoch 3 - iter 1325/2650 - loss 1.17960944 throughput (samples/sec): 79.52 -2019-08-08 16:17:56,526 epoch 3 - iter 1590/2650 - loss 1.17908100 throughput (samples/sec): 80.67 -2019-08-08 16:19:44,104 epoch 3 - iter 1855/2650 - loss 1.17739159 throughput (samples/sec): 78.86 -2019-08-08 16:21:33,279 epoch 3 - iter 2120/2650 - loss 1.17726247 throughput (samples/sec): 77.70 -2019-08-08 16:23:24,344 epoch 3 - iter 2385/2650 - loss 1.16852081 throughput (samples/sec): 76.38 -2019-08-08 16:25:11,423 ---------------------------------------------------------------------------------------------------- -2019-08-08 16:25:11,423 EPOCH 3 done: loss 1.1575 - lr 0.1000 -2019-08-08 16:25:11,423 BAD EPOCHS (no improvement): 0 -2019-08-08 16:25:11,423 ---------------------------------------------------------------------------------------------------- -2019-08-08 16:25:11,766 epoch 4 - iter 0/2650 - loss 1.14999568 throughput (samples/sec): 25005.62 -2019-08-08 16:26:57,835 epoch 4 - iter 265/2650 - loss 1.04068717 throughput (samples/sec): 79.98 -2019-08-08 16:28:27,757 epoch 4 - iter 530/2650 - loss 1.04265378 throughput (samples/sec): 94.35 -2019-08-08 16:29:52,409 epoch 4 - iter 795/2650 - loss 1.04839287 throughput (samples/sec): 100.22 -2019-08-08 16:31:15,713 epoch 4 - iter 1060/2650 - loss 1.04304986 throughput (samples/sec): 101.85 -2019-08-08 16:32:41,178 epoch 4 - iter 1325/2650 - loss 1.04820806 throughput (samples/sec): 99.27 -2019-08-08 16:34:05,352 epoch 4 - iter 1590/2650 - loss 1.03913764 throughput (samples/sec): 100.80 -2019-08-08 16:35:29,522 epoch 4 - iter 1855/2650 - loss 1.04166087 throughput (samples/sec): 100.80 -2019-08-08 16:36:52,045 epoch 4 - iter 2120/2650 - loss 1.03833859 throughput (samples/sec): 102.81 -2019-08-08 16:38:14,724 epoch 4 - iter 2385/2650 - loss 1.03699822 throughput (samples/sec): 102.62 -2019-08-08 16:39:39,284 ---------------------------------------------------------------------------------------------------- -2019-08-08 16:39:39,284 EPOCH 4 done: loss 1.0290 - lr 0.1000 -2019-08-08 16:39:39,284 BAD EPOCHS (no improvement): 0 -2019-08-08 16:39:39,284 ---------------------------------------------------------------------------------------------------- -2019-08-08 16:39:39,669 epoch 5 - iter 0/2650 - loss 0.53899717 throughput (samples/sec): 22252.70 -2019-08-08 16:41:04,512 epoch 5 - iter 265/2650 - loss 0.92754135 throughput (samples/sec): 100.00 -2019-08-08 16:42:28,941 epoch 5 - iter 530/2650 - loss 0.93655912 throughput (samples/sec): 100.49 -2019-08-08 16:43:52,096 epoch 5 - iter 795/2650 - loss 0.94548098 throughput (samples/sec): 102.03 -2019-08-08 16:45:14,291 epoch 5 - iter 1060/2650 - loss 0.93975989 throughput (samples/sec): 103.22 -2019-08-08 16:46:36,004 epoch 5 - iter 1325/2650 - loss 0.93974178 throughput (samples/sec): 103.83 -2019-08-08 16:48:00,623 epoch 5 - iter 1590/2650 - loss 0.93978730 throughput (samples/sec): 100.27 -2019-08-08 16:49:24,752 epoch 5 - iter 1855/2650 - loss 0.94068006 throughput (samples/sec): 100.85 -2019-08-08 16:50:46,786 epoch 5 - iter 2120/2650 - loss 0.93627722 throughput (samples/sec): 103.43 -2019-08-08 16:52:10,457 epoch 5 - iter 2385/2650 - loss 0.93997815 throughput (samples/sec): 101.40 -2019-08-08 16:53:34,212 ---------------------------------------------------------------------------------------------------- -2019-08-08 16:53:34,212 EPOCH 5 done: loss 0.9425 - lr 0.1000 -2019-08-08 16:53:34,212 BAD EPOCHS (no improvement): 0 -2019-08-08 16:53:34,212 ---------------------------------------------------------------------------------------------------- -2019-08-08 16:53:34,567 epoch 6 - iter 0/2650 - loss 0.71811497 throughput (samples/sec): 24176.83 -2019-08-08 16:54:58,173 epoch 6 - iter 265/2650 - loss 0.91425702 throughput (samples/sec): 101.48 -2019-08-08 16:56:22,916 epoch 6 - iter 530/2650 - loss 0.89681687 throughput (samples/sec): 100.12 -2019-08-08 16:57:46,952 epoch 6 - iter 795/2650 - loss 0.90082930 throughput (samples/sec): 100.96 -2019-08-08 16:59:10,108 epoch 6 - iter 1060/2650 - loss 0.89114065 throughput (samples/sec): 102.03 -2019-08-08 17:00:32,215 epoch 6 - iter 1325/2650 - loss 0.88763672 throughput (samples/sec): 103.33 -2019-08-08 17:01:54,837 epoch 6 - iter 1590/2650 - loss 0.88353599 throughput (samples/sec): 102.69 -2019-08-08 17:03:18,944 epoch 6 - iter 1855/2650 - loss 0.88240916 throughput (samples/sec): 100.88 -2019-08-08 17:04:41,109 epoch 6 - iter 2120/2650 - loss 0.87991433 throughput (samples/sec): 103.26 -2019-08-08 17:06:01,921 epoch 6 - iter 2385/2650 - loss 0.88353759 throughput (samples/sec): 104.99 -2019-08-08 17:07:24,814 ---------------------------------------------------------------------------------------------------- -2019-08-08 17:07:24,814 EPOCH 6 done: loss 0.8817 - lr 0.1000 -2019-08-08 17:07:24,814 BAD EPOCHS (no improvement): 0 -2019-08-08 17:07:24,814 ---------------------------------------------------------------------------------------------------- -2019-08-08 17:07:25,046 epoch 7 - iter 0/2650 - loss 0.52113622 throughput (samples/sec): 37246.04 -2019-08-08 17:08:47,879 epoch 7 - iter 265/2650 - loss 0.82532514 throughput (samples/sec): 102.43 -2019-08-08 17:10:11,039 epoch 7 - iter 530/2650 - loss 0.83438101 throughput (samples/sec): 102.02 -2019-08-08 17:11:35,673 epoch 7 - iter 795/2650 - loss 0.84165589 throughput (samples/sec): 100.25 -2019-08-08 17:12:57,606 epoch 7 - iter 1060/2650 - loss 0.84357283 throughput (samples/sec): 103.55 -2019-08-08 17:14:19,312 epoch 7 - iter 1325/2650 - loss 0.84310125 throughput (samples/sec): 103.84 -2019-08-08 17:15:40,079 epoch 7 - iter 1590/2650 - loss 0.84222415 throughput (samples/sec): 105.05 -2019-08-08 17:17:03,390 epoch 7 - iter 1855/2650 - loss 0.83522148 throughput (samples/sec): 101.84 -2019-08-08 17:18:22,478 epoch 7 - iter 2120/2650 - loss 0.83452025 throughput (samples/sec): 107.28 -2019-08-08 17:19:44,394 epoch 7 - iter 2385/2650 - loss 0.83712000 throughput (samples/sec): 103.57 -2019-08-08 17:21:06,164 ---------------------------------------------------------------------------------------------------- -2019-08-08 17:21:06,164 EPOCH 7 done: loss 0.8362 - lr 0.1000 -2019-08-08 17:21:06,164 BAD EPOCHS (no improvement): 0 -2019-08-08 17:21:06,164 ---------------------------------------------------------------------------------------------------- -2019-08-08 17:21:06,447 epoch 8 - iter 0/2650 - loss 0.31120512 throughput (samples/sec): 30380.53 -2019-08-08 17:22:28,405 epoch 8 - iter 265/2650 - loss 0.79242385 throughput (samples/sec): 103.52 -2019-08-08 17:23:49,783 epoch 8 - iter 530/2650 - loss 0.79098483 throughput (samples/sec): 104.26 -2019-08-08 17:25:11,511 epoch 8 - iter 795/2650 - loss 0.79566310 throughput (samples/sec): 103.81 -2019-08-08 17:26:32,413 epoch 8 - iter 1060/2650 - loss 0.80065974 throughput (samples/sec): 104.87 -2019-08-08 17:27:55,300 epoch 8 - iter 1325/2650 - loss 0.79848518 throughput (samples/sec): 102.36 -2019-08-08 17:29:15,589 epoch 8 - iter 1590/2650 - loss 0.79980795 throughput (samples/sec): 105.67 -2019-08-08 17:30:37,982 epoch 8 - iter 1855/2650 - loss 0.79944622 throughput (samples/sec): 102.97 -2019-08-08 17:31:59,100 epoch 8 - iter 2120/2650 - loss 0.79601046 throughput (samples/sec): 104.59 -2019-08-08 17:33:21,722 epoch 8 - iter 2385/2650 - loss 0.79566301 throughput (samples/sec): 102.69 -2019-08-08 17:34:44,425 ---------------------------------------------------------------------------------------------------- -2019-08-08 17:34:44,425 EPOCH 8 done: loss 0.7956 - lr 0.1000 -2019-08-08 17:34:44,425 BAD EPOCHS (no improvement): 0 -2019-08-08 17:34:44,426 ---------------------------------------------------------------------------------------------------- -2019-08-08 17:34:44,700 epoch 9 - iter 0/2650 - loss 0.33114570 throughput (samples/sec): 31325.23 -2019-08-08 17:36:09,149 epoch 9 - iter 265/2650 - loss 0.71138384 throughput (samples/sec): 100.46 -2019-08-08 17:37:32,791 epoch 9 - iter 530/2650 - loss 0.73561072 throughput (samples/sec): 101.43 -2019-08-08 17:38:54,948 epoch 9 - iter 795/2650 - loss 0.73038753 throughput (samples/sec): 103.27 -2019-08-08 17:40:16,011 epoch 9 - iter 1060/2650 - loss 0.73531846 throughput (samples/sec): 104.66 -2019-08-08 17:41:39,428 epoch 9 - iter 1325/2650 - loss 0.74376542 throughput (samples/sec): 101.71 -2019-08-08 17:43:00,699 epoch 9 - iter 1590/2650 - loss 0.74233462 throughput (samples/sec): 104.39 -2019-08-08 17:44:24,255 epoch 9 - iter 1855/2650 - loss 0.74873773 throughput (samples/sec): 101.54 -2019-08-08 17:45:47,199 epoch 9 - iter 2120/2650 - loss 0.75418378 throughput (samples/sec): 102.29 -2019-08-08 17:47:08,345 epoch 9 - iter 2385/2650 - loss 0.75580455 throughput (samples/sec): 104.56 -2019-08-08 17:48:29,880 ---------------------------------------------------------------------------------------------------- -2019-08-08 17:48:29,881 EPOCH 9 done: loss 0.7541 - lr 0.1000 -2019-08-08 17:48:29,881 BAD EPOCHS (no improvement): 0 -2019-08-08 17:48:29,881 ---------------------------------------------------------------------------------------------------- -2019-08-08 17:48:30,227 epoch 10 - iter 0/2650 - loss 0.20781451 throughput (samples/sec): 24735.71 -2019-08-08 17:49:51,205 epoch 10 - iter 265/2650 - loss 0.73816882 throughput (samples/sec): 104.77 -2019-08-08 17:51:13,388 epoch 10 - iter 530/2650 - loss 0.73724366 throughput (samples/sec): 103.23 -2019-08-08 17:52:36,441 epoch 10 - iter 795/2650 - loss 0.72408397 throughput (samples/sec): 102.16 -2019-08-08 17:53:59,285 epoch 10 - iter 1060/2650 - loss 0.72510667 throughput (samples/sec): 102.41 -2019-08-08 17:55:23,175 epoch 10 - iter 1325/2650 - loss 0.72550675 throughput (samples/sec): 101.13 -2019-08-08 17:56:46,986 epoch 10 - iter 1590/2650 - loss 0.73064532 throughput (samples/sec): 101.23 -2019-08-08 17:58:09,420 epoch 10 - iter 1855/2650 - loss 0.73039080 throughput (samples/sec): 102.92 -2019-08-08 17:59:31,340 epoch 10 - iter 2120/2650 - loss 0.72694734 throughput (samples/sec): 103.57 -2019-08-08 18:00:56,907 epoch 10 - iter 2385/2650 - loss 0.72787513 throughput (samples/sec): 99.15 -2019-08-08 18:02:20,192 ---------------------------------------------------------------------------------------------------- -2019-08-08 18:02:20,192 EPOCH 10 done: loss 0.7291 - lr 0.1000 -2019-08-08 18:02:20,193 BAD EPOCHS (no improvement): 0 -2019-08-08 18:02:20,193 ---------------------------------------------------------------------------------------------------- -2019-08-08 18:02:20,500 epoch 11 - iter 0/2650 - loss 0.50029397 throughput (samples/sec): 27882.19 -2019-08-08 18:03:43,197 epoch 11 - iter 265/2650 - loss 0.70863046 throughput (samples/sec): 102.59 -2019-08-08 18:05:05,954 epoch 11 - iter 530/2650 - loss 0.70211022 throughput (samples/sec): 102.52 -2019-08-08 18:06:29,170 epoch 11 - iter 795/2650 - loss 0.68860873 throughput (samples/sec): 101.95 -2019-08-08 18:07:52,774 epoch 11 - iter 1060/2650 - loss 0.69494610 throughput (samples/sec): 101.48 -2019-08-08 18:09:18,384 epoch 11 - iter 1325/2650 - loss 0.70142607 throughput (samples/sec): 99.10 -2019-08-08 18:10:40,366 epoch 11 - iter 1590/2650 - loss 0.69582252 throughput (samples/sec): 103.49 -2019-08-08 18:12:02,130 epoch 11 - iter 1855/2650 - loss 0.69249461 throughput (samples/sec): 103.77 -2019-08-08 18:13:24,837 epoch 11 - iter 2120/2650 - loss 0.69641427 throughput (samples/sec): 102.58 -2019-08-08 18:14:48,451 epoch 11 - iter 2385/2650 - loss 0.69899453 throughput (samples/sec): 101.47 -2019-08-08 18:16:09,719 ---------------------------------------------------------------------------------------------------- -2019-08-08 18:16:09,719 EPOCH 11 done: loss 0.6970 - lr 0.1000 -2019-08-08 18:16:09,719 BAD EPOCHS (no improvement): 0 -2019-08-08 18:16:09,719 ---------------------------------------------------------------------------------------------------- -2019-08-08 18:16:10,031 epoch 12 - iter 0/2650 - loss 0.40702319 throughput (samples/sec): 27493.26 -2019-08-08 18:17:31,000 epoch 12 - iter 265/2650 - loss 0.66587432 throughput (samples/sec): 104.79 -2019-08-08 18:18:54,045 epoch 12 - iter 530/2650 - loss 0.67297174 throughput (samples/sec): 102.16 -2019-08-08 18:20:15,252 epoch 12 - iter 795/2650 - loss 0.67509741 throughput (samples/sec): 104.48 -2019-08-08 18:21:35,678 epoch 12 - iter 1060/2650 - loss 0.67343907 throughput (samples/sec): 105.49 -2019-08-08 18:22:55,758 epoch 12 - iter 1325/2650 - loss 0.66840702 throughput (samples/sec): 105.95 -2019-08-08 18:24:20,514 epoch 12 - iter 1590/2650 - loss 0.67305647 throughput (samples/sec): 100.10 -2019-08-08 18:25:47,346 epoch 12 - iter 1855/2650 - loss 0.66909806 throughput (samples/sec): 97.71 -2019-08-08 18:27:13,284 epoch 12 - iter 2120/2650 - loss 0.67391500 throughput (samples/sec): 98.73 -2019-08-08 18:28:39,079 epoch 12 - iter 2385/2650 - loss 0.67661136 throughput (samples/sec): 98.89 -2019-08-08 18:30:03,504 ---------------------------------------------------------------------------------------------------- -2019-08-08 18:30:03,504 EPOCH 12 done: loss 0.6815 - lr 0.1000 -2019-08-08 18:30:03,504 BAD EPOCHS (no improvement): 0 -2019-08-08 18:30:03,505 ---------------------------------------------------------------------------------------------------- -2019-08-08 18:30:03,773 epoch 13 - iter 0/2650 - loss 1.33587968 throughput (samples/sec): 31980.08 -2019-08-08 18:31:26,119 epoch 13 - iter 265/2650 - loss 0.64723022 throughput (samples/sec): 103.04 -2019-08-08 18:32:48,942 epoch 13 - iter 530/2650 - loss 0.65080629 throughput (samples/sec): 102.44 -2019-08-08 18:34:12,033 epoch 13 - iter 795/2650 - loss 0.65294088 throughput (samples/sec): 102.11 -2019-08-08 18:35:34,691 epoch 13 - iter 1060/2650 - loss 0.66003400 throughput (samples/sec): 102.64 -2019-08-08 18:36:59,007 epoch 13 - iter 1325/2650 - loss 0.65143917 throughput (samples/sec): 100.62 -2019-08-08 18:38:24,455 epoch 13 - iter 1590/2650 - loss 0.65682313 throughput (samples/sec): 99.29 -2019-08-08 18:39:49,205 epoch 13 - iter 1855/2650 - loss 0.65919649 throughput (samples/sec): 100.11 -2019-08-08 18:41:13,874 epoch 13 - iter 2120/2650 - loss 0.66327202 throughput (samples/sec): 100.20 -2019-08-08 18:42:38,562 epoch 13 - iter 2385/2650 - loss 0.65944174 throughput (samples/sec): 100.18 -2019-08-08 18:44:02,715 ---------------------------------------------------------------------------------------------------- -2019-08-08 18:44:02,715 EPOCH 13 done: loss 0.6653 - lr 0.1000 -2019-08-08 18:44:02,715 BAD EPOCHS (no improvement): 0 -2019-08-08 18:44:02,716 ---------------------------------------------------------------------------------------------------- -2019-08-08 18:44:02,955 epoch 14 - iter 0/2650 - loss 0.18008149 throughput (samples/sec): 36013.00 -2019-08-08 18:45:27,337 epoch 14 - iter 265/2650 - loss 0.61258302 throughput (samples/sec): 100.55 -2019-08-08 18:46:51,051 epoch 14 - iter 530/2650 - loss 0.61261081 throughput (samples/sec): 101.35 -2019-08-08 18:48:15,450 epoch 14 - iter 795/2650 - loss 0.60901396 throughput (samples/sec): 100.52 -2019-08-08 18:49:41,790 epoch 14 - iter 1060/2650 - loss 0.61372813 throughput (samples/sec): 98.26 -2019-08-08 18:51:06,087 epoch 14 - iter 1325/2650 - loss 0.62606423 throughput (samples/sec): 100.65 -2019-08-08 18:52:31,940 epoch 14 - iter 1590/2650 - loss 0.63438289 throughput (samples/sec): 98.82 -2019-08-08 18:53:57,262 epoch 14 - iter 1855/2650 - loss 0.63373499 throughput (samples/sec): 99.44 -2019-08-08 18:55:21,506 epoch 14 - iter 2120/2650 - loss 0.63583586 throughput (samples/sec): 100.71 -2019-08-08 18:56:45,860 epoch 14 - iter 2385/2650 - loss 0.63567055 throughput (samples/sec): 100.58 -2019-08-08 18:58:08,636 ---------------------------------------------------------------------------------------------------- -2019-08-08 18:58:08,637 EPOCH 14 done: loss 0.6391 - lr 0.1000 -2019-08-08 18:58:08,637 BAD EPOCHS (no improvement): 0 -2019-08-08 18:58:08,637 ---------------------------------------------------------------------------------------------------- -2019-08-08 18:58:08,956 epoch 15 - iter 0/2650 - loss 0.60840911 throughput (samples/sec): 26876.10 -2019-08-08 18:59:30,350 epoch 15 - iter 265/2650 - loss 0.62553894 throughput (samples/sec): 104.24 -2019-08-08 19:00:51,414 epoch 15 - iter 530/2650 - loss 0.62427393 throughput (samples/sec): 104.66 -2019-08-08 19:02:13,135 epoch 15 - iter 795/2650 - loss 0.62611703 throughput (samples/sec): 103.82 -2019-08-08 19:03:36,800 epoch 15 - iter 1060/2650 - loss 0.62077318 throughput (samples/sec): 101.41 -2019-08-08 19:04:58,782 epoch 15 - iter 1325/2650 - loss 0.61968550 throughput (samples/sec): 103.49 -2019-08-08 19:06:20,946 epoch 15 - iter 1590/2650 - loss 0.62215039 throughput (samples/sec): 103.26 -2019-08-08 19:07:44,025 epoch 15 - iter 1855/2650 - loss 0.62866423 throughput (samples/sec): 102.12 -2019-08-08 19:09:07,925 epoch 15 - iter 2120/2650 - loss 0.62789089 throughput (samples/sec): 101.13 -2019-08-08 19:10:32,706 epoch 15 - iter 2385/2650 - loss 0.62921397 throughput (samples/sec): 100.07 -2019-08-08 19:11:55,631 ---------------------------------------------------------------------------------------------------- -2019-08-08 19:11:55,631 EPOCH 15 done: loss 0.6273 - lr 0.1000 -2019-08-08 19:11:55,631 BAD EPOCHS (no improvement): 0 -2019-08-08 19:11:55,631 ---------------------------------------------------------------------------------------------------- -2019-08-08 19:11:55,976 epoch 16 - iter 0/2650 - loss 0.94160718 throughput (samples/sec): 24900.08 -2019-08-08 19:13:19,298 epoch 16 - iter 265/2650 - loss 0.59180739 throughput (samples/sec): 101.82 -2019-08-08 19:14:40,818 epoch 16 - iter 530/2650 - loss 0.59786585 throughput (samples/sec): 104.08 -2019-08-08 19:16:03,559 epoch 16 - iter 795/2650 - loss 0.60746862 throughput (samples/sec): 102.54 -2019-08-08 19:17:25,796 epoch 16 - iter 1060/2650 - loss 0.61848220 throughput (samples/sec): 103.17 -2019-08-08 19:18:50,718 epoch 16 - iter 1325/2650 - loss 0.62167395 throughput (samples/sec): 99.91 -2019-08-08 19:20:13,998 epoch 16 - iter 1590/2650 - loss 0.61834927 throughput (samples/sec): 101.88 -2019-08-08 19:21:37,008 epoch 16 - iter 1855/2650 - loss 0.61509640 throughput (samples/sec): 102.21 -2019-08-08 19:22:59,492 epoch 16 - iter 2120/2650 - loss 0.62033930 throughput (samples/sec): 102.86 -2019-08-08 19:24:22,957 epoch 16 - iter 2385/2650 - loss 0.62313076 throughput (samples/sec): 101.65 -2019-08-08 19:25:45,115 ---------------------------------------------------------------------------------------------------- -2019-08-08 19:25:45,115 EPOCH 16 done: loss 0.6228 - lr 0.1000 -2019-08-08 19:25:45,115 BAD EPOCHS (no improvement): 0 -2019-08-08 19:25:45,115 ---------------------------------------------------------------------------------------------------- -2019-08-08 19:25:45,947 epoch 17 - iter 0/2650 - loss 1.20939708 throughput (samples/sec): 10232.47 -2019-08-08 19:27:08,467 epoch 17 - iter 265/2650 - loss 0.57800328 throughput (samples/sec): 102.82 -2019-08-08 19:28:32,845 epoch 17 - iter 530/2650 - loss 0.57658257 throughput (samples/sec): 100.55 -2019-08-08 19:29:56,742 epoch 17 - iter 795/2650 - loss 0.58483981 throughput (samples/sec): 101.13 -2019-08-08 19:31:18,486 epoch 17 - iter 1060/2650 - loss 0.58720709 throughput (samples/sec): 103.79 -2019-08-08 19:32:41,281 epoch 17 - iter 1325/2650 - loss 0.59781084 throughput (samples/sec): 102.47 -2019-08-08 19:34:02,838 epoch 17 - iter 1590/2650 - loss 0.59617215 throughput (samples/sec): 104.03 -2019-08-08 19:35:25,050 epoch 17 - iter 1855/2650 - loss 0.59803773 throughput (samples/sec): 103.20 -2019-08-08 19:36:49,534 epoch 17 - iter 2120/2650 - loss 0.59811791 throughput (samples/sec): 100.42 -2019-08-08 19:38:11,397 epoch 17 - iter 2385/2650 - loss 0.59791156 throughput (samples/sec): 103.64 -2019-08-08 19:39:33,947 ---------------------------------------------------------------------------------------------------- -2019-08-08 19:39:33,947 EPOCH 17 done: loss 0.5999 - lr 0.1000 -2019-08-08 19:39:33,947 BAD EPOCHS (no improvement): 0 -2019-08-08 19:39:33,947 ---------------------------------------------------------------------------------------------------- -2019-08-08 19:39:34,652 epoch 18 - iter 0/2650 - loss 0.69268775 throughput (samples/sec): 12084.64 -2019-08-08 19:40:59,712 epoch 18 - iter 265/2650 - loss 0.58545711 throughput (samples/sec): 99.74 -2019-08-08 19:42:22,754 epoch 18 - iter 530/2650 - loss 0.57530186 throughput (samples/sec): 102.17 -2019-08-08 19:43:44,307 epoch 18 - iter 795/2650 - loss 0.56978332 throughput (samples/sec): 104.04 -2019-08-08 19:45:08,084 epoch 18 - iter 1060/2650 - loss 0.57286610 throughput (samples/sec): 101.27 -2019-08-08 19:46:31,134 epoch 18 - iter 1325/2650 - loss 0.57089774 throughput (samples/sec): 102.16 -2019-08-08 19:47:52,743 epoch 18 - iter 1590/2650 - loss 0.57540413 throughput (samples/sec): 103.97 -2019-08-08 19:49:16,061 epoch 18 - iter 1855/2650 - loss 0.57893976 throughput (samples/sec): 101.83 -2019-08-08 19:50:37,652 epoch 18 - iter 2120/2650 - loss 0.58182218 throughput (samples/sec): 103.99 -2019-08-08 19:51:57,853 epoch 18 - iter 2385/2650 - loss 0.58034444 throughput (samples/sec): 105.79 -2019-08-08 19:53:23,122 ---------------------------------------------------------------------------------------------------- -2019-08-08 19:53:23,122 EPOCH 18 done: loss 0.5845 - lr 0.1000 -2019-08-08 19:53:23,123 BAD EPOCHS (no improvement): 0 -2019-08-08 19:53:23,123 ---------------------------------------------------------------------------------------------------- -2019-08-08 19:53:23,462 epoch 19 - iter 0/2650 - loss 0.43647367 throughput (samples/sec): 25292.59 -2019-08-08 19:54:46,993 epoch 19 - iter 265/2650 - loss 0.54473870 throughput (samples/sec): 101.57 -2019-08-08 19:56:11,050 epoch 19 - iter 530/2650 - loss 0.55996604 throughput (samples/sec): 100.93 -2019-08-08 19:57:34,402 epoch 19 - iter 795/2650 - loss 0.55381026 throughput (samples/sec): 101.79 -2019-08-08 19:58:59,353 epoch 19 - iter 1060/2650 - loss 0.55430670 throughput (samples/sec): 99.87 -2019-08-08 20:00:23,171 epoch 19 - iter 1325/2650 - loss 0.55458048 throughput (samples/sec): 101.22 -2019-08-08 20:01:44,238 epoch 19 - iter 1590/2650 - loss 0.55892193 throughput (samples/sec): 104.66 -2019-08-08 20:03:05,470 epoch 19 - iter 1855/2650 - loss 0.55759518 throughput (samples/sec): 104.45 -2019-08-08 20:04:25,104 epoch 19 - iter 2120/2650 - loss 0.55812337 throughput (samples/sec): 106.54 -2019-08-08 20:05:45,471 epoch 19 - iter 2385/2650 - loss 0.56561302 throughput (samples/sec): 105.57 -2019-08-08 20:07:11,557 ---------------------------------------------------------------------------------------------------- -2019-08-08 20:07:11,557 EPOCH 19 done: loss 0.5679 - lr 0.1000 -2019-08-08 20:07:11,557 BAD EPOCHS (no improvement): 0 -2019-08-08 20:07:11,557 ---------------------------------------------------------------------------------------------------- -2019-08-08 20:07:11,780 epoch 20 - iter 0/2650 - loss 0.38332438 throughput (samples/sec): 38718.37 -2019-08-08 20:08:35,502 epoch 20 - iter 265/2650 - loss 0.54123043 throughput (samples/sec): 101.34 -2019-08-08 20:09:58,840 epoch 20 - iter 530/2650 - loss 0.53824506 throughput (samples/sec): 101.80 -2019-08-08 20:11:21,896 epoch 20 - iter 795/2650 - loss 0.55035664 throughput (samples/sec): 102.15 -2019-08-08 20:12:44,719 epoch 20 - iter 1060/2650 - loss 0.55304590 throughput (samples/sec): 102.44 -2019-08-08 20:14:06,623 epoch 20 - iter 1325/2650 - loss 0.55024053 throughput (samples/sec): 103.59 -2019-08-08 20:15:33,162 epoch 20 - iter 1590/2650 - loss 0.56121609 throughput (samples/sec): 98.04 -2019-08-08 20:16:57,377 epoch 20 - iter 1855/2650 - loss 0.56322955 throughput (samples/sec): 100.74 -2019-08-08 20:18:22,931 epoch 20 - iter 2120/2650 - loss 0.56688845 throughput (samples/sec): 99.17 -2019-08-08 20:19:48,457 epoch 20 - iter 2385/2650 - loss 0.56450431 throughput (samples/sec): 99.20 -2019-08-08 20:21:09,514 ---------------------------------------------------------------------------------------------------- -2019-08-08 20:21:09,515 EPOCH 20 done: loss 0.5622 - lr 0.1000 -2019-08-08 20:21:09,515 BAD EPOCHS (no improvement): 0 -2019-08-08 20:21:09,515 ---------------------------------------------------------------------------------------------------- -2019-08-08 20:21:09,729 epoch 21 - iter 0/2650 - loss 0.14398801 throughput (samples/sec): 40230.26 -2019-08-08 20:22:33,062 epoch 21 - iter 265/2650 - loss 0.53684237 throughput (samples/sec): 101.81 -2019-08-08 20:23:56,412 epoch 21 - iter 530/2650 - loss 0.54625567 throughput (samples/sec): 101.79 -2019-08-08 20:25:21,716 epoch 21 - iter 795/2650 - loss 0.54900351 throughput (samples/sec): 99.46 -2019-08-08 20:26:45,862 epoch 21 - iter 1060/2650 - loss 0.55466434 throughput (samples/sec): 100.83 -2019-08-08 20:28:12,027 epoch 21 - iter 1325/2650 - loss 0.55690414 throughput (samples/sec): 98.46 -2019-08-08 20:29:34,494 epoch 21 - iter 1590/2650 - loss 0.55185984 throughput (samples/sec): 102.88 -2019-08-08 20:30:56,405 epoch 21 - iter 1855/2650 - loss 0.55072349 throughput (samples/sec): 103.58 -2019-08-08 20:32:21,256 epoch 21 - iter 2120/2650 - loss 0.55099161 throughput (samples/sec): 99.99 -2019-08-08 20:33:42,512 epoch 21 - iter 2385/2650 - loss 0.55010761 throughput (samples/sec): 104.41 -2019-08-08 20:35:06,364 ---------------------------------------------------------------------------------------------------- -2019-08-08 20:35:06,365 EPOCH 21 done: loss 0.5569 - lr 0.1000 -2019-08-08 20:35:06,365 BAD EPOCHS (no improvement): 0 -2019-08-08 20:35:06,365 ---------------------------------------------------------------------------------------------------- -2019-08-08 20:35:06,688 epoch 22 - iter 0/2650 - loss 0.60782385 throughput (samples/sec): 26523.80 -2019-08-08 20:36:29,123 epoch 22 - iter 265/2650 - loss 0.56063507 throughput (samples/sec): 102.92 -2019-08-08 20:37:52,648 epoch 22 - iter 530/2650 - loss 0.53398722 throughput (samples/sec): 101.58 -2019-08-08 20:39:13,167 epoch 22 - iter 795/2650 - loss 0.52332084 throughput (samples/sec): 105.37 -2019-08-08 20:40:37,734 epoch 22 - iter 1060/2650 - loss 0.52989065 throughput (samples/sec): 100.33 -2019-08-08 20:41:58,234 epoch 22 - iter 1325/2650 - loss 0.52793110 throughput (samples/sec): 105.40 -2019-08-08 20:43:21,016 epoch 22 - iter 1590/2650 - loss 0.53497032 throughput (samples/sec): 102.49 -2019-08-08 20:44:45,678 epoch 22 - iter 1855/2650 - loss 0.53796359 throughput (samples/sec): 100.21 -2019-08-08 20:46:07,892 epoch 22 - iter 2120/2650 - loss 0.53773830 throughput (samples/sec): 103.20 -2019-08-08 20:47:32,648 epoch 22 - iter 2385/2650 - loss 0.54078624 throughput (samples/sec): 100.10 -2019-08-08 20:48:55,513 ---------------------------------------------------------------------------------------------------- -2019-08-08 20:48:55,513 EPOCH 22 done: loss 0.5425 - lr 0.1000 -2019-08-08 20:48:55,513 BAD EPOCHS (no improvement): 0 -2019-08-08 20:48:55,513 ---------------------------------------------------------------------------------------------------- -2019-08-08 20:48:55,895 epoch 23 - iter 0/2650 - loss 0.32699037 throughput (samples/sec): 22443.30 -2019-08-08 20:50:21,329 epoch 23 - iter 265/2650 - loss 0.52524323 throughput (samples/sec): 99.31 -2019-08-08 20:51:43,936 epoch 23 - iter 530/2650 - loss 0.52778067 throughput (samples/sec): 102.70 -2019-08-08 20:53:05,031 epoch 23 - iter 795/2650 - loss 0.52967581 throughput (samples/sec): 104.62 -2019-08-08 20:54:26,084 epoch 23 - iter 1060/2650 - loss 0.53796673 throughput (samples/sec): 104.68 -2019-08-08 20:55:49,630 epoch 23 - iter 1325/2650 - loss 0.53401904 throughput (samples/sec): 101.55 -2019-08-08 20:57:09,632 epoch 23 - iter 1590/2650 - loss 0.53304952 throughput (samples/sec): 106.05 -2019-08-08 20:58:30,625 epoch 23 - iter 1855/2650 - loss 0.53158119 throughput (samples/sec): 104.75 -2019-08-08 20:59:51,885 epoch 23 - iter 2120/2650 - loss 0.53388211 throughput (samples/sec): 104.41 -2019-08-08 21:01:14,769 epoch 23 - iter 2385/2650 - loss 0.53553253 throughput (samples/sec): 102.36 -2019-08-08 21:02:37,752 ---------------------------------------------------------------------------------------------------- -2019-08-08 21:02:37,752 EPOCH 23 done: loss 0.5385 - lr 0.1000 -2019-08-08 21:02:37,752 BAD EPOCHS (no improvement): 0 -2019-08-08 21:02:37,752 ---------------------------------------------------------------------------------------------------- -2019-08-08 21:02:38,006 epoch 24 - iter 0/2650 - loss 0.47493708 throughput (samples/sec): 33953.29 -2019-08-08 21:04:02,496 epoch 24 - iter 265/2650 - loss 0.49742818 throughput (samples/sec): 100.41 -2019-08-08 21:05:24,841 epoch 24 - iter 530/2650 - loss 0.50220125 throughput (samples/sec): 103.03 -2019-08-08 21:06:45,796 epoch 24 - iter 795/2650 - loss 0.49836216 throughput (samples/sec): 104.80 -2019-08-08 21:08:08,436 epoch 24 - iter 1060/2650 - loss 0.49902281 throughput (samples/sec): 102.66 -2019-08-08 21:09:35,911 epoch 24 - iter 1325/2650 - loss 0.49835616 throughput (samples/sec): 96.99 -2019-08-08 21:11:12,978 epoch 24 - iter 1590/2650 - loss 0.50463183 throughput (samples/sec): 87.40 -2019-08-08 21:12:51,444 epoch 24 - iter 1855/2650 - loss 0.51022280 throughput (samples/sec): 86.16 -2019-08-08 21:14:31,385 epoch 24 - iter 2120/2650 - loss 0.51123804 throughput (samples/sec): 84.88 -2019-08-08 21:16:11,910 epoch 24 - iter 2385/2650 - loss 0.51695340 throughput (samples/sec): 84.39 -2019-08-08 21:17:38,749 ---------------------------------------------------------------------------------------------------- -2019-08-08 21:17:38,749 EPOCH 24 done: loss 0.5224 - lr 0.1000 -2019-08-08 21:17:38,749 BAD EPOCHS (no improvement): 0 -2019-08-08 21:17:38,750 ---------------------------------------------------------------------------------------------------- -2019-08-08 21:17:39,000 epoch 25 - iter 0/2650 - loss 0.35931003 throughput (samples/sec): 34323.90 -2019-08-08 21:19:10,948 epoch 25 - iter 265/2650 - loss 0.49128119 throughput (samples/sec): 92.27 -2019-08-08 21:20:51,737 epoch 25 - iter 530/2650 - loss 0.48623202 throughput (samples/sec): 84.17 -2019-08-08 21:22:29,264 epoch 25 - iter 795/2650 - loss 0.49672397 throughput (samples/sec): 86.99 -2019-08-08 21:24:06,048 epoch 25 - iter 1060/2650 - loss 0.49902245 throughput (samples/sec): 87.65 -2019-08-08 21:25:46,150 epoch 25 - iter 1325/2650 - loss 0.50629441 throughput (samples/sec): 84.75 -2019-08-08 21:27:27,657 epoch 25 - iter 1590/2650 - loss 0.50737415 throughput (samples/sec): 83.58 -2019-08-08 21:29:07,430 epoch 25 - iter 1855/2650 - loss 0.50753595 throughput (samples/sec): 85.03 -2019-08-08 21:30:48,290 epoch 25 - iter 2120/2650 - loss 0.51176585 throughput (samples/sec): 84.11 -2019-08-08 21:32:30,349 epoch 25 - iter 2385/2650 - loss 0.51310921 throughput (samples/sec): 83.12 -2019-08-08 21:34:07,552 ---------------------------------------------------------------------------------------------------- -2019-08-08 21:34:07,553 EPOCH 25 done: loss 0.5158 - lr 0.1000 -2019-08-08 21:34:07,553 BAD EPOCHS (no improvement): 0 -2019-08-08 21:34:07,553 ---------------------------------------------------------------------------------------------------- -2019-08-08 21:34:07,887 epoch 26 - iter 0/2650 - loss 0.80676651 throughput (samples/sec): 25651.27 -2019-08-08 21:35:39,712 epoch 26 - iter 265/2650 - loss 0.46816354 throughput (samples/sec): 92.39 -2019-08-08 21:37:16,552 epoch 26 - iter 530/2650 - loss 0.47075052 throughput (samples/sec): 87.60 -2019-08-08 21:38:58,661 epoch 26 - iter 795/2650 - loss 0.48404235 throughput (samples/sec): 83.08 -2019-08-08 21:40:39,535 epoch 26 - iter 1060/2650 - loss 0.49126738 throughput (samples/sec): 84.10 -2019-08-08 21:42:18,872 epoch 26 - iter 1325/2650 - loss 0.49537077 throughput (samples/sec): 85.40 -2019-08-08 21:43:56,531 epoch 26 - iter 1590/2650 - loss 0.49786972 throughput (samples/sec): 86.87 -2019-08-08 21:45:36,459 epoch 26 - iter 1855/2650 - loss 0.49870067 throughput (samples/sec): 84.90 -2019-08-08 21:47:19,041 epoch 26 - iter 2120/2650 - loss 0.50033980 throughput (samples/sec): 82.70 -2019-08-08 21:48:58,189 epoch 26 - iter 2385/2650 - loss 0.50404171 throughput (samples/sec): 85.57 -2019-08-08 21:50:37,700 ---------------------------------------------------------------------------------------------------- -2019-08-08 21:50:37,701 EPOCH 26 done: loss 0.5059 - lr 0.1000 -2019-08-08 21:50:37,701 BAD EPOCHS (no improvement): 0 -2019-08-08 21:50:37,701 ---------------------------------------------------------------------------------------------------- -2019-08-08 21:50:38,032 epoch 27 - iter 0/2650 - loss 0.10203117 throughput (samples/sec): 25932.99 -2019-08-08 21:52:11,797 epoch 27 - iter 265/2650 - loss 0.47089718 throughput (samples/sec): 90.48 -2019-08-08 21:53:38,809 epoch 27 - iter 530/2650 - loss 0.47928792 throughput (samples/sec): 97.50 -2019-08-08 21:55:19,156 epoch 27 - iter 795/2650 - loss 0.48085990 throughput (samples/sec): 84.54 -2019-08-08 21:56:59,233 epoch 27 - iter 1060/2650 - loss 0.48920794 throughput (samples/sec): 84.77 -2019-08-08 21:58:36,974 epoch 27 - iter 1325/2650 - loss 0.49272136 throughput (samples/sec): 86.80 -2019-08-08 22:00:17,030 epoch 27 - iter 1590/2650 - loss 0.48878605 throughput (samples/sec): 84.79 -2019-08-08 22:02:01,527 epoch 27 - iter 1855/2650 - loss 0.49192334 throughput (samples/sec): 81.18 -2019-08-08 22:03:41,170 epoch 27 - iter 2120/2650 - loss 0.49098018 throughput (samples/sec): 85.14 -2019-08-08 22:05:22,176 epoch 27 - iter 2385/2650 - loss 0.49461183 throughput (samples/sec): 83.99 -2019-08-08 22:07:02,080 ---------------------------------------------------------------------------------------------------- -2019-08-08 22:07:02,080 EPOCH 27 done: loss 0.4973 - lr 0.1000 -2019-08-08 22:07:02,081 BAD EPOCHS (no improvement): 0 -2019-08-08 22:07:02,081 ---------------------------------------------------------------------------------------------------- -2019-08-08 22:07:02,685 epoch 28 - iter 0/2650 - loss 0.23517013 throughput (samples/sec): 14113.53 -2019-08-08 22:08:44,991 epoch 28 - iter 265/2650 - loss 0.47403408 throughput (samples/sec): 82.92 -2019-08-08 22:10:16,524 epoch 28 - iter 530/2650 - loss 0.46669906 throughput (samples/sec): 92.69 -2019-08-08 22:11:54,697 epoch 28 - iter 795/2650 - loss 0.47084272 throughput (samples/sec): 86.42 -2019-08-08 22:13:33,631 epoch 28 - iter 1060/2650 - loss 0.47923173 throughput (samples/sec): 85.75 -2019-08-08 22:15:11,787 epoch 28 - iter 1325/2650 - loss 0.48122996 throughput (samples/sec): 86.43 -2019-08-08 22:16:51,589 epoch 28 - iter 1590/2650 - loss 0.48313786 throughput (samples/sec): 85.00 -2019-08-08 22:18:30,108 epoch 28 - iter 1855/2650 - loss 0.48443250 throughput (samples/sec): 86.11 -2019-08-08 22:20:10,730 epoch 28 - iter 2120/2650 - loss 0.48703428 throughput (samples/sec): 84.31 -2019-08-08 22:21:51,367 epoch 28 - iter 2385/2650 - loss 0.49207506 throughput (samples/sec): 84.30 -2019-08-08 22:23:30,322 ---------------------------------------------------------------------------------------------------- -2019-08-08 22:23:30,322 EPOCH 28 done: loss 0.4937 - lr 0.1000 -2019-08-08 22:23:30,323 BAD EPOCHS (no improvement): 0 -2019-08-08 22:23:30,323 ---------------------------------------------------------------------------------------------------- -2019-08-08 22:23:30,779 epoch 29 - iter 0/2650 - loss 0.22029161 throughput (samples/sec): 18718.11 -2019-08-08 22:25:11,515 epoch 29 - iter 265/2650 - loss 0.46843173 throughput (samples/sec): 84.21 -2019-08-08 22:26:50,537 epoch 29 - iter 530/2650 - loss 0.47590995 throughput (samples/sec): 85.67 -2019-08-08 22:28:23,206 epoch 29 - iter 795/2650 - loss 0.48655021 throughput (samples/sec): 91.55 -2019-08-08 22:30:00,672 epoch 29 - iter 1060/2650 - loss 0.48190160 throughput (samples/sec): 87.04 -2019-08-08 22:31:42,060 epoch 29 - iter 1325/2650 - loss 0.48277661 throughput (samples/sec): 83.67 -2019-08-08 22:33:21,127 epoch 29 - iter 1590/2650 - loss 0.48563179 throughput (samples/sec): 85.63 -2019-08-08 22:35:01,083 epoch 29 - iter 1855/2650 - loss 0.48883912 throughput (samples/sec): 84.87 -2019-08-08 22:36:39,691 epoch 29 - iter 2120/2650 - loss 0.48852700 throughput (samples/sec): 86.03 -2019-08-08 22:38:18,631 epoch 29 - iter 2385/2650 - loss 0.49001170 throughput (samples/sec): 85.74 -2019-08-08 22:39:57,658 ---------------------------------------------------------------------------------------------------- -2019-08-08 22:39:57,659 EPOCH 29 done: loss 0.4874 - lr 0.1000 -2019-08-08 22:39:57,659 BAD EPOCHS (no improvement): 0 -2019-08-08 22:39:57,659 ---------------------------------------------------------------------------------------------------- -2019-08-08 22:39:57,992 epoch 30 - iter 0/2650 - loss 0.53292990 throughput (samples/sec): 25749.96 -2019-08-08 22:41:38,826 epoch 30 - iter 265/2650 - loss 0.48666803 throughput (samples/sec): 84.13 -2019-08-08 22:43:17,308 epoch 30 - iter 530/2650 - loss 0.47851895 throughput (samples/sec): 86.14 -2019-08-08 22:44:51,986 epoch 30 - iter 795/2650 - loss 0.46467003 throughput (samples/sec): 89.61 -2019-08-08 22:46:22,826 epoch 30 - iter 1060/2650 - loss 0.47588904 throughput (samples/sec): 93.39 -2019-08-08 22:48:02,302 epoch 30 - iter 1325/2650 - loss 0.47448517 throughput (samples/sec): 85.28 -2019-08-08 22:49:42,302 epoch 30 - iter 1590/2650 - loss 0.47503637 throughput (samples/sec): 84.84 -2019-08-08 22:51:20,550 epoch 30 - iter 1855/2650 - loss 0.47733555 throughput (samples/sec): 86.35 -2019-08-08 22:52:58,384 epoch 30 - iter 2120/2650 - loss 0.47928561 throughput (samples/sec): 86.71 -2019-08-08 22:54:38,248 epoch 30 - iter 2385/2650 - loss 0.48029486 throughput (samples/sec): 84.95 -2019-08-08 22:56:18,727 ---------------------------------------------------------------------------------------------------- -2019-08-08 22:56:18,727 EPOCH 30 done: loss 0.4793 - lr 0.1000 -2019-08-08 22:56:18,727 BAD EPOCHS (no improvement): 0 -2019-08-08 22:56:18,727 ---------------------------------------------------------------------------------------------------- -2019-08-08 22:56:19,041 epoch 31 - iter 0/2650 - loss 0.89822137 throughput (samples/sec): 27322.97 -2019-08-08 22:57:58,412 epoch 31 - iter 265/2650 - loss 0.45808364 throughput (samples/sec): 85.37 -2019-08-08 22:59:39,989 epoch 31 - iter 530/2650 - loss 0.47406353 throughput (samples/sec): 83.52 -2019-08-08 23:01:21,469 epoch 31 - iter 795/2650 - loss 0.46752654 throughput (samples/sec): 83.60 -2019-08-08 23:02:55,319 epoch 31 - iter 1060/2650 - loss 0.46736042 throughput (samples/sec): 90.40 -2019-08-08 23:04:31,745 epoch 31 - iter 1325/2650 - loss 0.46064089 throughput (samples/sec): 87.98 -2019-08-08 23:06:15,121 epoch 31 - iter 1590/2650 - loss 0.46587969 throughput (samples/sec): 82.06 -2019-08-08 23:08:01,406 epoch 31 - iter 1855/2650 - loss 0.47084024 throughput (samples/sec): 79.82 -2019-08-08 23:09:39,312 epoch 31 - iter 2120/2650 - loss 0.46942132 throughput (samples/sec): 86.65 -2019-08-08 23:11:18,733 epoch 31 - iter 2385/2650 - loss 0.47113184 throughput (samples/sec): 85.33 -2019-08-08 23:13:01,794 ---------------------------------------------------------------------------------------------------- -2019-08-08 23:13:01,794 EPOCH 31 done: loss 0.4726 - lr 0.1000 -2019-08-08 23:13:01,794 BAD EPOCHS (no improvement): 0 -2019-08-08 23:13:01,794 ---------------------------------------------------------------------------------------------------- -2019-08-08 23:13:02,326 epoch 32 - iter 0/2650 - loss 0.51065916 throughput (samples/sec): 16078.69 -2019-08-08 23:14:38,588 epoch 32 - iter 265/2650 - loss 0.45667724 throughput (samples/sec): 88.13 -2019-08-08 23:16:18,865 epoch 32 - iter 530/2650 - loss 0.45393455 throughput (samples/sec): 84.60 -2019-08-08 23:17:58,257 epoch 32 - iter 795/2650 - loss 0.45741449 throughput (samples/sec): 85.35 -2019-08-08 23:19:32,725 epoch 32 - iter 1060/2650 - loss 0.45477013 throughput (samples/sec): 89.80 -2019-08-08 23:21:04,319 epoch 32 - iter 1325/2650 - loss 0.46259872 throughput (samples/sec): 92.62 -2019-08-08 23:22:43,311 epoch 32 - iter 1590/2650 - loss 0.46248434 throughput (samples/sec): 85.70 -2019-08-08 23:24:20,921 epoch 32 - iter 1855/2650 - loss 0.46305481 throughput (samples/sec): 86.91 -2019-08-08 23:25:59,631 epoch 32 - iter 2120/2650 - loss 0.46424551 throughput (samples/sec): 85.94 -2019-08-08 23:27:42,129 epoch 32 - iter 2385/2650 - loss 0.46683482 throughput (samples/sec): 82.77 -2019-08-08 23:29:23,334 ---------------------------------------------------------------------------------------------------- -2019-08-08 23:29:23,335 EPOCH 32 done: loss 0.4671 - lr 0.1000 -2019-08-08 23:29:23,335 BAD EPOCHS (no improvement): 0 -2019-08-08 23:29:23,335 ---------------------------------------------------------------------------------------------------- -2019-08-08 23:29:23,816 epoch 33 - iter 0/2650 - loss 0.59553295 throughput (samples/sec): 17771.48 -2019-08-08 23:30:50,517 epoch 33 - iter 265/2650 - loss 0.43458016 throughput (samples/sec): 97.85 -2019-08-08 23:32:15,288 epoch 33 - iter 530/2650 - loss 0.44498484 throughput (samples/sec): 100.08 -2019-08-08 23:33:39,347 epoch 33 - iter 795/2650 - loss 0.45438843 throughput (samples/sec): 100.93 -2019-08-08 23:35:01,703 epoch 33 - iter 1060/2650 - loss 0.45242876 throughput (samples/sec): 103.02 -2019-08-08 23:36:27,579 epoch 33 - iter 1325/2650 - loss 0.45193698 throughput (samples/sec): 98.79 -2019-08-08 23:37:50,385 epoch 33 - iter 1590/2650 - loss 0.45055993 throughput (samples/sec): 102.46 -2019-08-08 23:39:18,401 epoch 33 - iter 1855/2650 - loss 0.45395918 throughput (samples/sec): 96.39 -2019-08-08 23:40:42,070 epoch 33 - iter 2120/2650 - loss 0.45866855 throughput (samples/sec): 101.40 -2019-08-08 23:42:04,483 epoch 33 - iter 2385/2650 - loss 0.45901743 throughput (samples/sec): 102.95 -2019-08-08 23:43:26,895 ---------------------------------------------------------------------------------------------------- -2019-08-08 23:43:26,895 EPOCH 33 done: loss 0.4598 - lr 0.1000 -2019-08-08 23:43:26,895 BAD EPOCHS (no improvement): 0 -2019-08-08 23:43:26,896 ---------------------------------------------------------------------------------------------------- -2019-08-08 23:43:27,301 epoch 34 - iter 0/2650 - loss 0.58408910 throughput (samples/sec): 21107.24 -2019-08-08 23:44:51,132 epoch 34 - iter 265/2650 - loss 0.43716153 throughput (samples/sec): 101.20 -2019-08-08 23:46:16,971 epoch 34 - iter 530/2650 - loss 0.43276712 throughput (samples/sec): 98.84 -2019-08-08 23:47:43,578 epoch 34 - iter 795/2650 - loss 0.43467532 throughput (samples/sec): 97.96 -2019-08-08 23:49:10,286 epoch 34 - iter 1060/2650 - loss 0.43682818 throughput (samples/sec): 97.85 -2019-08-08 23:50:36,784 epoch 34 - iter 1325/2650 - loss 0.44724794 throughput (samples/sec): 98.09 -2019-08-08 23:52:01,919 epoch 34 - iter 1590/2650 - loss 0.44587124 throughput (samples/sec): 99.66 -2019-08-08 23:53:25,766 epoch 34 - iter 1855/2650 - loss 0.44744382 throughput (samples/sec): 101.19 -2019-08-08 23:54:49,534 epoch 34 - iter 2120/2650 - loss 0.44717141 throughput (samples/sec): 101.28 -2019-08-08 23:56:14,963 epoch 34 - iter 2385/2650 - loss 0.45150160 throughput (samples/sec): 99.31 -2019-08-08 23:57:37,304 ---------------------------------------------------------------------------------------------------- -2019-08-08 23:57:37,305 EPOCH 34 done: loss 0.4540 - lr 0.1000 -2019-08-08 23:57:37,305 BAD EPOCHS (no improvement): 0 -2019-08-08 23:57:37,305 ---------------------------------------------------------------------------------------------------- -2019-08-08 23:57:37,537 epoch 35 - iter 0/2650 - loss 0.31775418 throughput (samples/sec): 37117.31 -2019-08-08 23:59:01,379 epoch 35 - iter 265/2650 - loss 0.45492699 throughput (samples/sec): 101.19 -2019-08-09 00:00:25,808 epoch 35 - iter 530/2650 - loss 0.44794266 throughput (samples/sec): 100.49 -2019-08-09 00:01:52,847 epoch 35 - iter 795/2650 - loss 0.45491089 throughput (samples/sec): 97.47 -2019-08-09 00:03:19,067 epoch 35 - iter 1060/2650 - loss 0.44997949 throughput (samples/sec): 98.40 -2019-08-09 00:04:40,665 epoch 35 - iter 1325/2650 - loss 0.44733031 throughput (samples/sec): 103.98 -2019-08-09 00:06:03,458 epoch 35 - iter 1590/2650 - loss 0.44700463 throughput (samples/sec): 102.47 -2019-08-09 00:07:25,761 epoch 35 - iter 1855/2650 - loss 0.44831945 throughput (samples/sec): 103.08 -2019-08-09 00:08:49,629 epoch 35 - iter 2120/2650 - loss 0.45066334 throughput (samples/sec): 101.16 -2019-08-09 00:10:12,467 epoch 35 - iter 2385/2650 - loss 0.45200193 throughput (samples/sec): 102.42 -2019-08-09 00:11:34,404 ---------------------------------------------------------------------------------------------------- -2019-08-09 00:11:34,404 EPOCH 35 done: loss 0.4533 - lr 0.1000 -2019-08-09 00:11:34,405 BAD EPOCHS (no improvement): 0 -2019-08-09 00:11:34,405 ---------------------------------------------------------------------------------------------------- -2019-08-09 00:11:34,742 epoch 36 - iter 0/2650 - loss 0.62461257 throughput (samples/sec): 25396.19 -2019-08-09 00:12:57,665 epoch 36 - iter 265/2650 - loss 0.43829823 throughput (samples/sec): 102.31 -2019-08-09 00:14:21,086 epoch 36 - iter 530/2650 - loss 0.44178401 throughput (samples/sec): 101.70 -2019-08-09 00:15:45,310 epoch 36 - iter 795/2650 - loss 0.44079294 throughput (samples/sec): 100.73 -2019-08-09 00:17:10,661 epoch 36 - iter 1060/2650 - loss 0.44174909 throughput (samples/sec): 99.40 -2019-08-09 00:18:33,924 epoch 36 - iter 1325/2650 - loss 0.44362749 throughput (samples/sec): 101.90 -2019-08-09 00:19:58,603 epoch 36 - iter 1590/2650 - loss 0.44314179 throughput (samples/sec): 100.19 -2019-08-09 00:21:23,635 epoch 36 - iter 1855/2650 - loss 0.44119174 throughput (samples/sec): 99.78 -2019-08-09 00:22:48,338 epoch 36 - iter 2120/2650 - loss 0.44320248 throughput (samples/sec): 100.16 -2019-08-09 00:24:10,323 epoch 36 - iter 2385/2650 - loss 0.44331174 throughput (samples/sec): 103.48 -2019-08-09 00:25:31,377 ---------------------------------------------------------------------------------------------------- -2019-08-09 00:25:31,377 EPOCH 36 done: loss 0.4437 - lr 0.1000 -2019-08-09 00:25:31,377 BAD EPOCHS (no improvement): 0 -2019-08-09 00:25:31,377 ---------------------------------------------------------------------------------------------------- -2019-08-09 00:25:31,656 epoch 37 - iter 0/2650 - loss 0.42289853 throughput (samples/sec): 30802.20 -2019-08-09 00:26:52,811 epoch 37 - iter 265/2650 - loss 0.44167244 throughput (samples/sec): 104.55 -2019-08-09 00:28:14,554 epoch 37 - iter 530/2650 - loss 0.42072807 throughput (samples/sec): 103.79 -2019-08-09 00:29:36,469 epoch 37 - iter 795/2650 - loss 0.42808174 throughput (samples/sec): 103.57 -2019-08-09 00:31:00,387 epoch 37 - iter 1060/2650 - loss 0.42997729 throughput (samples/sec): 101.10 -2019-08-09 00:32:22,804 epoch 37 - iter 1325/2650 - loss 0.43235690 throughput (samples/sec): 102.95 -2019-08-09 00:33:45,758 epoch 37 - iter 1590/2650 - loss 0.43596003 throughput (samples/sec): 102.28 -2019-08-09 00:35:07,605 epoch 37 - iter 1855/2650 - loss 0.44093529 throughput (samples/sec): 103.66 -2019-08-09 00:36:28,848 epoch 37 - iter 2120/2650 - loss 0.44118229 throughput (samples/sec): 104.43 -2019-08-09 00:37:52,151 epoch 37 - iter 2385/2650 - loss 0.43846440 throughput (samples/sec): 101.85 -2019-08-09 00:39:12,729 ---------------------------------------------------------------------------------------------------- -2019-08-09 00:39:12,730 EPOCH 37 done: loss 0.4415 - lr 0.1000 -2019-08-09 00:39:12,730 BAD EPOCHS (no improvement): 0 -2019-08-09 00:39:12,730 ---------------------------------------------------------------------------------------------------- -2019-08-09 00:39:13,054 epoch 38 - iter 0/2650 - loss 0.66496325 throughput (samples/sec): 26440.61 -2019-08-09 00:40:32,202 epoch 38 - iter 265/2650 - loss 0.39900460 throughput (samples/sec): 107.20 -2019-08-09 00:41:53,168 epoch 38 - iter 530/2650 - loss 0.40989244 throughput (samples/sec): 104.79 -2019-08-09 00:43:15,296 epoch 38 - iter 795/2650 - loss 0.41089250 throughput (samples/sec): 103.31 -2019-08-09 00:44:38,361 epoch 38 - iter 1060/2650 - loss 0.41630097 throughput (samples/sec): 102.14 -2019-08-09 00:45:59,643 epoch 38 - iter 1325/2650 - loss 0.42683281 throughput (samples/sec): 104.38 -2019-08-09 00:47:21,316 epoch 38 - iter 1590/2650 - loss 0.42687347 throughput (samples/sec): 103.88 -2019-08-09 00:48:41,989 epoch 38 - iter 1855/2650 - loss 0.42766458 throughput (samples/sec): 105.17 -2019-08-09 00:50:03,488 epoch 38 - iter 2120/2650 - loss 0.42924051 throughput (samples/sec): 104.10 -2019-08-09 00:51:26,095 epoch 38 - iter 2385/2650 - loss 0.43340574 throughput (samples/sec): 102.70 -2019-08-09 00:52:46,916 ---------------------------------------------------------------------------------------------------- -2019-08-09 00:52:46,916 EPOCH 38 done: loss 0.4354 - lr 0.1000 -2019-08-09 00:52:46,916 BAD EPOCHS (no improvement): 0 -2019-08-09 00:52:46,916 ---------------------------------------------------------------------------------------------------- -2019-08-09 00:52:47,178 epoch 39 - iter 0/2650 - loss 0.26522106 throughput (samples/sec): 32863.92 -2019-08-09 00:54:09,061 epoch 39 - iter 265/2650 - loss 0.40514745 throughput (samples/sec): 103.62 -2019-08-09 00:55:31,295 epoch 39 - iter 530/2650 - loss 0.40792397 throughput (samples/sec): 103.17 -2019-08-09 00:56:50,765 epoch 39 - iter 795/2650 - loss 0.41767177 throughput (samples/sec): 106.76 -2019-08-09 00:58:13,399 epoch 39 - iter 1060/2650 - loss 0.42496022 throughput (samples/sec): 102.67 -2019-08-09 00:59:38,793 epoch 39 - iter 1325/2650 - loss 0.42308681 throughput (samples/sec): 99.35 -2019-08-09 01:00:59,955 epoch 39 - iter 1590/2650 - loss 0.42208519 throughput (samples/sec): 104.53 -2019-08-09 01:02:21,787 epoch 39 - iter 1855/2650 - loss 0.42558077 throughput (samples/sec): 103.68 -2019-08-09 01:03:40,357 epoch 39 - iter 2120/2650 - loss 0.43022192 throughput (samples/sec): 107.99 -2019-08-09 01:05:01,523 epoch 39 - iter 2385/2650 - loss 0.42865656 throughput (samples/sec): 104.53 -2019-08-09 01:06:23,457 ---------------------------------------------------------------------------------------------------- -2019-08-09 01:06:23,458 EPOCH 39 done: loss 0.4287 - lr 0.1000 -2019-08-09 01:06:23,458 BAD EPOCHS (no improvement): 0 -2019-08-09 01:06:23,458 ---------------------------------------------------------------------------------------------------- -2019-08-09 01:06:23,755 epoch 40 - iter 0/2650 - loss 0.26726326 throughput (samples/sec): 28920.00 -2019-08-09 01:07:44,973 epoch 40 - iter 265/2650 - loss 0.38989836 throughput (samples/sec): 104.46 -2019-08-09 01:09:06,581 epoch 40 - iter 530/2650 - loss 0.40017055 throughput (samples/sec): 103.96 -2019-08-09 01:10:30,675 epoch 40 - iter 795/2650 - loss 0.41757987 throughput (samples/sec): 100.89 -2019-08-09 01:11:55,659 epoch 40 - iter 1060/2650 - loss 0.41457401 throughput (samples/sec): 99.83 -2019-08-09 01:13:20,091 epoch 40 - iter 1325/2650 - loss 0.41663371 throughput (samples/sec): 100.49 -2019-08-09 01:14:42,221 epoch 40 - iter 1590/2650 - loss 0.41385480 throughput (samples/sec): 103.30 -2019-08-09 01:16:01,179 epoch 40 - iter 1855/2650 - loss 0.41203232 throughput (samples/sec): 107.45 -2019-08-09 01:17:23,815 epoch 40 - iter 2120/2650 - loss 0.41445348 throughput (samples/sec): 102.67 -2019-08-09 01:18:45,639 epoch 40 - iter 2385/2650 - loss 0.42004346 throughput (samples/sec): 103.69 -2019-08-09 01:20:05,710 ---------------------------------------------------------------------------------------------------- -2019-08-09 01:20:05,710 EPOCH 40 done: loss 0.4233 - lr 0.1000 -2019-08-09 01:20:05,710 BAD EPOCHS (no improvement): 0 -2019-08-09 01:20:05,710 ---------------------------------------------------------------------------------------------------- -2019-08-09 01:20:05,912 epoch 41 - iter 0/2650 - loss 0.14586067 throughput (samples/sec): 42649.01 -2019-08-09 01:21:28,104 epoch 41 - iter 265/2650 - loss 0.42868440 throughput (samples/sec): 103.22 -2019-08-09 01:22:48,576 epoch 41 - iter 530/2650 - loss 0.42097532 throughput (samples/sec): 105.43 -2019-08-09 01:24:11,453 epoch 41 - iter 795/2650 - loss 0.41460588 throughput (samples/sec): 102.37 -2019-08-09 01:25:34,857 epoch 41 - iter 1060/2650 - loss 0.41461898 throughput (samples/sec): 101.73 -2019-08-09 01:27:00,403 epoch 41 - iter 1325/2650 - loss 0.41975883 throughput (samples/sec): 99.18 -2019-08-09 01:28:24,269 epoch 41 - iter 1590/2650 - loss 0.42249522 throughput (samples/sec): 101.16 -2019-08-09 01:29:49,335 epoch 41 - iter 1855/2650 - loss 0.42045717 throughput (samples/sec): 99.74 -2019-08-09 01:31:12,580 epoch 41 - iter 2120/2650 - loss 0.42135616 throughput (samples/sec): 101.92 -2019-08-09 01:32:36,101 epoch 41 - iter 2385/2650 - loss 0.41910080 throughput (samples/sec): 101.58 -2019-08-09 01:33:58,903 ---------------------------------------------------------------------------------------------------- -2019-08-09 01:33:58,903 EPOCH 41 done: loss 0.4219 - lr 0.1000 -2019-08-09 01:33:58,903 BAD EPOCHS (no improvement): 0 -2019-08-09 01:33:58,904 ---------------------------------------------------------------------------------------------------- -2019-08-09 01:33:59,244 epoch 42 - iter 0/2650 - loss 0.24474555 throughput (samples/sec): 25183.51 -2019-08-09 01:35:22,626 epoch 42 - iter 265/2650 - loss 0.40553383 throughput (samples/sec): 101.75 -2019-08-09 01:36:46,279 epoch 42 - iter 530/2650 - loss 0.41139236 throughput (samples/sec): 101.42 -2019-08-09 01:38:07,013 epoch 42 - iter 795/2650 - loss 0.41750882 throughput (samples/sec): 105.09 -2019-08-09 01:39:29,784 epoch 42 - iter 1060/2650 - loss 0.41511593 throughput (samples/sec): 102.50 -2019-08-09 01:40:49,044 epoch 42 - iter 1325/2650 - loss 0.41569206 throughput (samples/sec): 107.04 -2019-08-09 01:42:12,235 epoch 42 - iter 1590/2650 - loss 0.41438960 throughput (samples/sec): 101.98 -2019-08-09 01:43:35,752 epoch 42 - iter 1855/2650 - loss 0.41574280 throughput (samples/sec): 101.59 -2019-08-09 01:44:58,671 epoch 42 - iter 2120/2650 - loss 0.41607063 throughput (samples/sec): 102.32 -2019-08-09 01:46:20,904 epoch 42 - iter 2385/2650 - loss 0.41951967 throughput (samples/sec): 103.18 -2019-08-09 01:47:41,787 ---------------------------------------------------------------------------------------------------- -2019-08-09 01:47:41,787 EPOCH 42 done: loss 0.4212 - lr 0.1000 -2019-08-09 01:47:41,787 BAD EPOCHS (no improvement): 0 -2019-08-09 01:47:41,788 ---------------------------------------------------------------------------------------------------- -2019-08-09 01:47:42,061 epoch 43 - iter 0/2650 - loss 0.31859362 throughput (samples/sec): 31520.53 -2019-08-09 01:49:03,649 epoch 43 - iter 265/2650 - loss 0.38579090 throughput (samples/sec): 103.99 -2019-08-09 01:50:28,060 epoch 43 - iter 530/2650 - loss 0.40206989 throughput (samples/sec): 100.51 -2019-08-09 01:51:47,782 epoch 43 - iter 795/2650 - loss 0.40795117 throughput (samples/sec): 106.42 -2019-08-09 01:53:09,887 epoch 43 - iter 1060/2650 - loss 0.40827751 throughput (samples/sec): 103.33 -2019-08-09 01:54:31,692 epoch 43 - iter 1325/2650 - loss 0.40497291 throughput (samples/sec): 103.71 -2019-08-09 01:55:54,453 epoch 43 - iter 1590/2650 - loss 0.40716669 throughput (samples/sec): 102.51 -2019-08-09 01:57:14,540 epoch 43 - iter 1855/2650 - loss 0.40971238 throughput (samples/sec): 105.94 -2019-08-09 01:58:38,662 epoch 43 - iter 2120/2650 - loss 0.41309735 throughput (samples/sec): 100.85 -2019-08-09 02:00:01,108 epoch 43 - iter 2385/2650 - loss 0.41167147 throughput (samples/sec): 102.91 -2019-08-09 02:01:20,870 ---------------------------------------------------------------------------------------------------- -2019-08-09 02:01:20,870 EPOCH 43 done: loss 0.4123 - lr 0.1000 -2019-08-09 02:01:20,870 BAD EPOCHS (no improvement): 0 -2019-08-09 02:01:20,870 ---------------------------------------------------------------------------------------------------- -2019-08-09 02:01:21,179 epoch 44 - iter 0/2650 - loss 0.38331008 throughput (samples/sec): 27821.82 -2019-08-09 02:02:43,068 epoch 44 - iter 265/2650 - loss 0.41039358 throughput (samples/sec): 103.61 -2019-08-09 02:04:03,526 epoch 44 - iter 530/2650 - loss 0.39916051 throughput (samples/sec): 105.45 -2019-08-09 02:05:25,565 epoch 44 - iter 795/2650 - loss 0.40496591 throughput (samples/sec): 103.42 -2019-08-09 02:06:45,450 epoch 44 - iter 1060/2650 - loss 0.40863292 throughput (samples/sec): 106.21 -2019-08-09 02:08:05,819 epoch 44 - iter 1325/2650 - loss 0.40376641 throughput (samples/sec): 105.57 -2019-08-09 02:09:28,161 epoch 44 - iter 1590/2650 - loss 0.40671579 throughput (samples/sec): 103.04 -2019-08-09 02:10:52,237 epoch 44 - iter 1855/2650 - loss 0.40905970 throughput (samples/sec): 100.91 -2019-08-09 02:12:14,739 epoch 44 - iter 2120/2650 - loss 0.40909409 throughput (samples/sec): 102.84 -2019-08-09 02:13:34,146 epoch 44 - iter 2385/2650 - loss 0.41179820 throughput (samples/sec): 106.85 -2019-08-09 02:14:55,760 ---------------------------------------------------------------------------------------------------- -2019-08-09 02:14:55,760 EPOCH 44 done: loss 0.4116 - lr 0.1000 -2019-08-09 02:14:55,760 BAD EPOCHS (no improvement): 0 -2019-08-09 02:14:55,760 ---------------------------------------------------------------------------------------------------- -2019-08-09 02:14:56,098 epoch 45 - iter 0/2650 - loss 0.33184862 throughput (samples/sec): 25381.39 -2019-08-09 02:16:19,316 epoch 45 - iter 265/2650 - loss 0.38948589 throughput (samples/sec): 101.95 -2019-08-09 02:17:39,948 epoch 45 - iter 530/2650 - loss 0.39913672 throughput (samples/sec): 105.22 -2019-08-09 02:18:59,891 epoch 45 - iter 795/2650 - loss 0.39711459 throughput (samples/sec): 106.13 -2019-08-09 02:20:20,222 epoch 45 - iter 1060/2650 - loss 0.39863823 throughput (samples/sec): 105.62 -2019-08-09 02:21:39,617 epoch 45 - iter 1325/2650 - loss 0.39819490 throughput (samples/sec): 106.86 -2019-08-09 02:23:01,654 epoch 45 - iter 1590/2650 - loss 0.39895652 throughput (samples/sec): 103.42 -2019-08-09 02:24:23,389 epoch 45 - iter 1855/2650 - loss 0.39989993 throughput (samples/sec): 103.80 -2019-08-09 02:25:44,300 epoch 45 - iter 2120/2650 - loss 0.39995595 throughput (samples/sec): 104.86 -2019-08-09 02:27:06,545 epoch 45 - iter 2385/2650 - loss 0.40241438 throughput (samples/sec): 103.16 -2019-08-09 02:28:31,604 ---------------------------------------------------------------------------------------------------- -2019-08-09 02:28:31,604 EPOCH 45 done: loss 0.4064 - lr 0.1000 -2019-08-09 02:28:31,604 BAD EPOCHS (no improvement): 0 -2019-08-09 02:28:31,604 ---------------------------------------------------------------------------------------------------- -2019-08-09 02:28:31,868 epoch 46 - iter 0/2650 - loss 0.37440667 throughput (samples/sec): 32581.98 -2019-08-09 02:29:53,839 epoch 46 - iter 265/2650 - loss 0.40327622 throughput (samples/sec): 103.50 -2019-08-09 02:31:15,042 epoch 46 - iter 530/2650 - loss 0.40318071 throughput (samples/sec): 104.48 -2019-08-09 02:32:35,597 epoch 46 - iter 795/2650 - loss 0.39257078 throughput (samples/sec): 105.32 -2019-08-09 02:33:57,077 epoch 46 - iter 1060/2650 - loss 0.39437895 throughput (samples/sec): 104.13 -2019-08-09 02:35:19,369 epoch 46 - iter 1325/2650 - loss 0.39646379 throughput (samples/sec): 103.10 -2019-08-09 02:36:41,500 epoch 46 - iter 1590/2650 - loss 0.39704554 throughput (samples/sec): 103.30 -2019-08-09 02:38:05,717 epoch 46 - iter 1855/2650 - loss 0.39944474 throughput (samples/sec): 100.74 -2019-08-09 02:39:28,128 epoch 46 - iter 2120/2650 - loss 0.40339038 throughput (samples/sec): 102.95 -2019-08-09 02:40:50,813 epoch 46 - iter 2385/2650 - loss 0.40351108 throughput (samples/sec): 102.61 -2019-08-09 02:42:12,867 ---------------------------------------------------------------------------------------------------- -2019-08-09 02:42:12,867 EPOCH 46 done: loss 0.4066 - lr 0.1000 -2019-08-09 02:42:12,867 BAD EPOCHS (no improvement): 1 -2019-08-09 02:42:12,868 ---------------------------------------------------------------------------------------------------- -2019-08-09 02:42:13,136 epoch 47 - iter 0/2650 - loss 0.28122184 throughput (samples/sec): 32051.63 -2019-08-09 02:43:35,524 epoch 47 - iter 265/2650 - loss 0.40222935 throughput (samples/sec): 102.98 -2019-08-09 02:44:57,551 epoch 47 - iter 530/2650 - loss 0.38764925 throughput (samples/sec): 103.43 -2019-08-09 02:46:21,529 epoch 47 - iter 795/2650 - loss 0.40201988 throughput (samples/sec): 101.03 -2019-08-09 02:47:43,833 epoch 47 - iter 1060/2650 - loss 0.39836737 throughput (samples/sec): 103.09 -2019-08-09 02:49:05,896 epoch 47 - iter 1325/2650 - loss 0.39914816 throughput (samples/sec): 103.39 -2019-08-09 02:50:26,941 epoch 47 - iter 1590/2650 - loss 0.40171112 throughput (samples/sec): 104.69 -2019-08-09 02:51:45,653 epoch 47 - iter 1855/2650 - loss 0.40004478 throughput (samples/sec): 107.79 -2019-08-09 02:53:06,169 epoch 47 - iter 2120/2650 - loss 0.40233503 throughput (samples/sec): 105.37 -2019-08-09 02:54:27,891 epoch 47 - iter 2385/2650 - loss 0.40435368 throughput (samples/sec): 103.82 -2019-08-09 02:55:52,565 ---------------------------------------------------------------------------------------------------- -2019-08-09 02:55:52,565 EPOCH 47 done: loss 0.4029 - lr 0.1000 -2019-08-09 02:55:52,565 BAD EPOCHS (no improvement): 0 -2019-08-09 02:55:52,565 ---------------------------------------------------------------------------------------------------- -2019-08-09 02:55:52,861 epoch 48 - iter 0/2650 - loss 0.30471680 throughput (samples/sec): 29039.12 -2019-08-09 02:57:17,904 epoch 48 - iter 265/2650 - loss 0.43164881 throughput (samples/sec): 99.76 -2019-08-09 02:58:43,810 epoch 48 - iter 530/2650 - loss 0.41074536 throughput (samples/sec): 98.76 -2019-08-09 03:00:04,851 epoch 48 - iter 795/2650 - loss 0.40130801 throughput (samples/sec): 104.69 -2019-08-09 03:01:27,696 epoch 48 - iter 1060/2650 - loss 0.39719240 throughput (samples/sec): 102.41 -2019-08-09 03:02:49,336 epoch 48 - iter 1325/2650 - loss 0.39964177 throughput (samples/sec): 103.92 -2019-08-09 03:04:11,051 epoch 48 - iter 1590/2650 - loss 0.40081180 throughput (samples/sec): 103.83 -2019-08-09 03:05:32,369 epoch 48 - iter 1855/2650 - loss 0.39861318 throughput (samples/sec): 104.33 -2019-08-09 03:06:54,994 epoch 48 - iter 2120/2650 - loss 0.39849387 throughput (samples/sec): 102.68 -2019-08-09 03:08:18,243 epoch 48 - iter 2385/2650 - loss 0.40215072 throughput (samples/sec): 101.91 -2019-08-09 03:09:40,110 ---------------------------------------------------------------------------------------------------- -2019-08-09 03:09:40,110 EPOCH 48 done: loss 0.4027 - lr 0.1000 -2019-08-09 03:09:40,110 BAD EPOCHS (no improvement): 0 -2019-08-09 03:09:40,110 ---------------------------------------------------------------------------------------------------- -2019-08-09 03:09:40,481 epoch 49 - iter 0/2650 - loss 0.56035733 throughput (samples/sec): 23132.95 -2019-08-09 03:11:03,010 epoch 49 - iter 265/2650 - loss 0.38373974 throughput (samples/sec): 102.80 -2019-08-09 03:12:25,559 epoch 49 - iter 530/2650 - loss 0.38894997 throughput (samples/sec): 102.78 -2019-08-09 03:13:48,310 epoch 49 - iter 795/2650 - loss 0.39254129 throughput (samples/sec): 102.53 -2019-08-09 03:15:08,201 epoch 49 - iter 1060/2650 - loss 0.38904442 throughput (samples/sec): 106.20 -2019-08-09 03:16:28,336 epoch 49 - iter 1325/2650 - loss 0.38974436 throughput (samples/sec): 105.88 -2019-08-09 03:17:50,521 epoch 49 - iter 1590/2650 - loss 0.39178658 throughput (samples/sec): 103.23 -2019-08-09 03:19:13,397 epoch 49 - iter 1855/2650 - loss 0.39449179 throughput (samples/sec): 102.37 -2019-08-09 03:20:35,407 epoch 49 - iter 2120/2650 - loss 0.39248150 throughput (samples/sec): 103.45 -2019-08-09 03:21:58,527 epoch 49 - iter 2385/2650 - loss 0.39889454 throughput (samples/sec): 102.07 -2019-08-09 03:23:18,399 ---------------------------------------------------------------------------------------------------- -2019-08-09 03:23:18,399 EPOCH 49 done: loss 0.3975 - lr 0.1000 -2019-08-09 03:23:18,399 BAD EPOCHS (no improvement): 0 -2019-08-09 03:23:18,399 ---------------------------------------------------------------------------------------------------- -2019-08-09 03:23:18,754 epoch 50 - iter 0/2650 - loss 0.34840292 throughput (samples/sec): 24173.32 -2019-08-09 03:24:38,571 epoch 50 - iter 265/2650 - loss 0.37441844 throughput (samples/sec): 106.30 -2019-08-09 03:26:00,918 epoch 50 - iter 530/2650 - loss 0.37847099 throughput (samples/sec): 103.03 -2019-08-09 03:27:21,769 epoch 50 - iter 795/2650 - loss 0.37656764 throughput (samples/sec): 104.94 -2019-08-09 03:28:44,907 epoch 50 - iter 1060/2650 - loss 0.38001706 throughput (samples/sec): 102.05 -2019-08-09 03:30:09,385 epoch 50 - iter 1325/2650 - loss 0.38195739 throughput (samples/sec): 100.43 -2019-08-09 03:31:34,284 epoch 50 - iter 1590/2650 - loss 0.38235569 throughput (samples/sec): 99.93 -2019-08-09 03:32:59,669 epoch 50 - iter 1855/2650 - loss 0.38732230 throughput (samples/sec): 99.37 -2019-08-09 03:34:24,773 epoch 50 - iter 2120/2650 - loss 0.39039516 throughput (samples/sec): 99.69 -2019-08-09 03:35:46,161 epoch 50 - iter 2385/2650 - loss 0.39218949 throughput (samples/sec): 104.25 -2019-08-09 03:37:09,545 ---------------------------------------------------------------------------------------------------- -2019-08-09 03:37:09,545 EPOCH 50 done: loss 0.3948 - lr 0.1000 -2019-08-09 03:37:09,545 BAD EPOCHS (no improvement): 0 -2019-08-09 03:37:09,546 ---------------------------------------------------------------------------------------------------- -2019-08-09 03:37:09,821 epoch 51 - iter 0/2650 - loss 0.42671373 throughput (samples/sec): 31256.96 -2019-08-09 03:38:31,825 epoch 51 - iter 265/2650 - loss 0.35030310 throughput (samples/sec): 103.47 -2019-08-09 03:39:54,231 epoch 51 - iter 530/2650 - loss 0.37385965 throughput (samples/sec): 102.96 -2019-08-09 03:41:17,250 epoch 51 - iter 795/2650 - loss 0.37512289 throughput (samples/sec): 102.20 -2019-08-09 03:42:39,228 epoch 51 - iter 1060/2650 - loss 0.37661802 throughput (samples/sec): 103.49 -2019-08-09 03:44:01,478 epoch 51 - iter 1325/2650 - loss 0.37098422 throughput (samples/sec): 103.15 -2019-08-09 03:45:24,343 epoch 51 - iter 1590/2650 - loss 0.37032315 throughput (samples/sec): 102.39 -2019-08-09 03:46:45,380 epoch 51 - iter 1855/2650 - loss 0.37231756 throughput (samples/sec): 104.70 -2019-08-09 03:48:06,091 epoch 51 - iter 2120/2650 - loss 0.37530691 throughput (samples/sec): 105.12 -2019-08-09 03:49:28,283 epoch 51 - iter 2385/2650 - loss 0.37533393 throughput (samples/sec): 103.22 -2019-08-09 03:50:51,837 ---------------------------------------------------------------------------------------------------- -2019-08-09 03:50:51,837 EPOCH 51 done: loss 0.3783 - lr 0.1000 -2019-08-09 03:50:51,837 BAD EPOCHS (no improvement): 0 -2019-08-09 03:50:51,837 ---------------------------------------------------------------------------------------------------- -2019-08-09 03:50:52,198 epoch 52 - iter 0/2650 - loss 0.32138366 throughput (samples/sec): 23766.32 -2019-08-09 03:52:12,426 epoch 52 - iter 265/2650 - loss 0.38075190 throughput (samples/sec): 105.75 -2019-08-09 03:53:36,628 epoch 52 - iter 530/2650 - loss 0.38534498 throughput (samples/sec): 100.76 -2019-08-09 03:54:59,938 epoch 52 - iter 795/2650 - loss 0.37978250 throughput (samples/sec): 101.84 -2019-08-09 03:56:21,005 epoch 52 - iter 1060/2650 - loss 0.38100786 throughput (samples/sec): 104.66 -2019-08-09 03:57:41,092 epoch 52 - iter 1325/2650 - loss 0.38463024 throughput (samples/sec): 105.94 -2019-08-09 03:59:04,506 epoch 52 - iter 1590/2650 - loss 0.38575654 throughput (samples/sec): 101.71 -2019-08-09 04:00:25,699 epoch 52 - iter 1855/2650 - loss 0.38743834 throughput (samples/sec): 104.50 -2019-08-09 04:01:46,075 epoch 52 - iter 2120/2650 - loss 0.38978106 throughput (samples/sec): 105.56 -2019-08-09 04:03:07,275 epoch 52 - iter 2385/2650 - loss 0.38746934 throughput (samples/sec): 104.49 -2019-08-09 04:04:29,364 ---------------------------------------------------------------------------------------------------- -2019-08-09 04:04:29,364 EPOCH 52 done: loss 0.3866 - lr 0.1000 -2019-08-09 04:04:29,364 BAD EPOCHS (no improvement): 1 -2019-08-09 04:04:29,364 ---------------------------------------------------------------------------------------------------- -2019-08-09 04:04:29,663 epoch 53 - iter 0/2650 - loss 0.96016634 throughput (samples/sec): 28741.92 -2019-08-09 04:05:51,944 epoch 53 - iter 265/2650 - loss 0.36788617 throughput (samples/sec): 103.11 -2019-08-09 04:07:14,924 epoch 53 - iter 530/2650 - loss 0.36201771 throughput (samples/sec): 102.24 -2019-08-09 04:08:37,451 epoch 53 - iter 795/2650 - loss 0.37307642 throughput (samples/sec): 102.80 -2019-08-09 04:09:59,423 epoch 53 - iter 1060/2650 - loss 0.37638337 throughput (samples/sec): 103.50 -2019-08-09 04:11:20,554 epoch 53 - iter 1325/2650 - loss 0.37590030 throughput (samples/sec): 104.57 -2019-08-09 04:12:40,090 epoch 53 - iter 1590/2650 - loss 0.37146758 throughput (samples/sec): 106.67 -2019-08-09 04:14:02,413 epoch 53 - iter 1855/2650 - loss 0.37406649 throughput (samples/sec): 103.06 -2019-08-09 04:15:24,350 epoch 53 - iter 2120/2650 - loss 0.37736768 throughput (samples/sec): 103.55 -2019-08-09 04:16:46,704 epoch 53 - iter 2385/2650 - loss 0.37778713 throughput (samples/sec): 103.02 -2019-08-09 04:18:06,980 ---------------------------------------------------------------------------------------------------- -2019-08-09 04:18:06,980 EPOCH 53 done: loss 0.3819 - lr 0.1000 -2019-08-09 04:18:06,980 BAD EPOCHS (no improvement): 2 -2019-08-09 04:18:06,980 ---------------------------------------------------------------------------------------------------- -2019-08-09 04:18:07,252 epoch 54 - iter 0/2650 - loss 0.19311208 throughput (samples/sec): 31590.35 -2019-08-09 04:19:29,074 epoch 54 - iter 265/2650 - loss 0.34620017 throughput (samples/sec): 103.69 -2019-08-09 04:20:48,095 epoch 54 - iter 530/2650 - loss 0.34598219 throughput (samples/sec): 107.37 -2019-08-09 04:22:09,617 epoch 54 - iter 795/2650 - loss 0.35371051 throughput (samples/sec): 104.07 -2019-08-09 04:23:31,756 epoch 54 - iter 1060/2650 - loss 0.36097205 throughput (samples/sec): 103.29 -2019-08-09 04:24:52,607 epoch 54 - iter 1325/2650 - loss 0.36584073 throughput (samples/sec): 104.94 -2019-08-09 04:26:14,908 epoch 54 - iter 1590/2650 - loss 0.37072044 throughput (samples/sec): 103.09 -2019-08-09 04:27:37,111 epoch 54 - iter 1855/2650 - loss 0.37388738 throughput (samples/sec): 103.21 -2019-08-09 04:28:59,777 epoch 54 - iter 2120/2650 - loss 0.37469160 throughput (samples/sec): 102.63 -2019-08-09 04:30:24,151 epoch 54 - iter 2385/2650 - loss 0.37666623 throughput (samples/sec): 100.56 -2019-08-09 04:31:49,853 ---------------------------------------------------------------------------------------------------- -2019-08-09 04:31:49,853 EPOCH 54 done: loss 0.3788 - lr 0.1000 -2019-08-09 04:31:49,853 BAD EPOCHS (no improvement): 3 -2019-08-09 04:31:49,853 ---------------------------------------------------------------------------------------------------- -2019-08-09 04:31:50,161 epoch 55 - iter 0/2650 - loss 0.41208774 throughput (samples/sec): 27942.61 -2019-08-09 04:33:11,607 epoch 55 - iter 265/2650 - loss 0.36019776 throughput (samples/sec): 104.17 -2019-08-09 04:34:30,563 epoch 55 - iter 530/2650 - loss 0.35552481 throughput (samples/sec): 107.46 -2019-08-09 04:35:55,983 epoch 55 - iter 795/2650 - loss 0.35558068 throughput (samples/sec): 99.32 -2019-08-09 04:37:18,961 epoch 55 - iter 1060/2650 - loss 0.36421235 throughput (samples/sec): 102.25 -2019-08-09 04:38:39,675 epoch 55 - iter 1325/2650 - loss 0.36292161 throughput (samples/sec): 105.12 -2019-08-09 04:40:03,298 epoch 55 - iter 1590/2650 - loss 0.36742625 throughput (samples/sec): 101.46 -2019-08-09 04:41:27,224 epoch 55 - iter 1855/2650 - loss 0.36758587 throughput (samples/sec): 101.09 -2019-08-09 04:42:48,956 epoch 55 - iter 2120/2650 - loss 0.37130072 throughput (samples/sec): 103.81 -2019-08-09 04:44:12,761 epoch 55 - iter 2385/2650 - loss 0.37405403 throughput (samples/sec): 101.24 -2019-08-09 04:45:34,192 ---------------------------------------------------------------------------------------------------- -2019-08-09 04:45:34,192 EPOCH 55 done: loss 0.3759 - lr 0.1000 -2019-08-09 04:45:34,192 BAD EPOCHS (no improvement): 0 -2019-08-09 04:45:34,193 ---------------------------------------------------------------------------------------------------- -2019-08-09 04:45:34,674 epoch 56 - iter 0/2650 - loss 0.39523354 throughput (samples/sec): 17753.52 -2019-08-09 04:46:56,261 epoch 56 - iter 265/2650 - loss 0.38054205 throughput (samples/sec): 103.99 -2019-08-09 04:48:18,325 epoch 56 - iter 530/2650 - loss 0.36511348 throughput (samples/sec): 103.39 -2019-08-09 04:49:40,371 epoch 56 - iter 795/2650 - loss 0.36025029 throughput (samples/sec): 103.41 -2019-08-09 04:51:04,912 epoch 56 - iter 1060/2650 - loss 0.36118110 throughput (samples/sec): 100.36 -2019-08-09 04:52:27,800 epoch 56 - iter 1325/2650 - loss 0.36366280 throughput (samples/sec): 102.36 -2019-08-09 04:53:51,435 epoch 56 - iter 1590/2650 - loss 0.36591783 throughput (samples/sec): 101.45 -2019-08-09 04:55:15,182 epoch 56 - iter 1855/2650 - loss 0.37313964 throughput (samples/sec): 101.31 -2019-08-09 04:56:38,719 epoch 56 - iter 2120/2650 - loss 0.37310173 throughput (samples/sec): 101.56 -2019-08-09 04:57:59,557 epoch 56 - iter 2385/2650 - loss 0.37356643 throughput (samples/sec): 104.96 -2019-08-09 04:59:24,266 ---------------------------------------------------------------------------------------------------- -2019-08-09 04:59:24,266 EPOCH 56 done: loss 0.3726 - lr 0.1000 -2019-08-09 04:59:24,266 BAD EPOCHS (no improvement): 0 -2019-08-09 04:59:24,266 ---------------------------------------------------------------------------------------------------- -2019-08-09 04:59:24,501 epoch 57 - iter 0/2650 - loss 0.31967568 throughput (samples/sec): 36768.60 -2019-08-09 05:00:47,272 epoch 57 - iter 265/2650 - loss 0.34276648 throughput (samples/sec): 102.50 -2019-08-09 05:02:08,871 epoch 57 - iter 530/2650 - loss 0.34742869 throughput (samples/sec): 103.98 -2019-08-09 05:03:31,227 epoch 57 - iter 795/2650 - loss 0.35018497 throughput (samples/sec): 103.02 -2019-08-09 05:04:55,878 epoch 57 - iter 1060/2650 - loss 0.35649967 throughput (samples/sec): 100.23 -2019-08-09 05:06:19,234 epoch 57 - iter 1325/2650 - loss 0.36231566 throughput (samples/sec): 101.78 -2019-08-09 05:07:39,809 epoch 57 - iter 1590/2650 - loss 0.36394844 throughput (samples/sec): 105.30 -2019-08-09 05:09:03,561 epoch 57 - iter 1855/2650 - loss 0.36700867 throughput (samples/sec): 101.30 -2019-08-09 05:10:28,874 epoch 57 - iter 2120/2650 - loss 0.37239521 throughput (samples/sec): 99.45 -2019-08-09 05:11:49,358 epoch 57 - iter 2385/2650 - loss 0.37272001 throughput (samples/sec): 105.42 -2019-08-09 05:13:10,979 ---------------------------------------------------------------------------------------------------- -2019-08-09 05:13:10,979 EPOCH 57 done: loss 0.3708 - lr 0.1000 -2019-08-09 05:13:10,979 BAD EPOCHS (no improvement): 0 -2019-08-09 05:13:10,979 ---------------------------------------------------------------------------------------------------- -2019-08-09 05:13:11,276 epoch 58 - iter 0/2650 - loss 0.45986718 throughput (samples/sec): 28961.26 -2019-08-09 05:14:33,436 epoch 58 - iter 265/2650 - loss 0.33569934 throughput (samples/sec): 103.27 -2019-08-09 05:15:57,934 epoch 58 - iter 530/2650 - loss 0.34781552 throughput (samples/sec): 100.41 -2019-08-09 05:17:20,589 epoch 58 - iter 795/2650 - loss 0.35998244 throughput (samples/sec): 102.65 -2019-08-09 05:18:43,874 epoch 58 - iter 1060/2650 - loss 0.35887228 throughput (samples/sec): 101.87 -2019-08-09 05:20:05,603 epoch 58 - iter 1325/2650 - loss 0.36416661 throughput (samples/sec): 103.81 -2019-08-09 05:21:29,037 epoch 58 - iter 1590/2650 - loss 0.36386127 throughput (samples/sec): 101.69 -2019-08-09 05:22:49,588 epoch 58 - iter 1855/2650 - loss 0.36639726 throughput (samples/sec): 105.33 -2019-08-09 05:24:12,078 epoch 58 - iter 2120/2650 - loss 0.36931416 throughput (samples/sec): 102.85 -2019-08-09 05:25:36,320 epoch 58 - iter 2385/2650 - loss 0.37100326 throughput (samples/sec): 100.71 -2019-08-09 05:26:58,972 ---------------------------------------------------------------------------------------------------- -2019-08-09 05:26:58,973 EPOCH 58 done: loss 0.3720 - lr 0.1000 -2019-08-09 05:26:58,973 BAD EPOCHS (no improvement): 1 -2019-08-09 05:26:58,973 ---------------------------------------------------------------------------------------------------- -2019-08-09 05:26:59,195 epoch 59 - iter 0/2650 - loss 0.31457928 throughput (samples/sec): 38919.01 -2019-08-09 05:28:20,391 epoch 59 - iter 265/2650 - loss 0.36688158 throughput (samples/sec): 104.49 -2019-08-09 05:29:41,081 epoch 59 - iter 530/2650 - loss 0.36697246 throughput (samples/sec): 105.15 -2019-08-09 05:31:02,696 epoch 59 - iter 795/2650 - loss 0.36374481 throughput (samples/sec): 103.96 -2019-08-09 05:32:26,010 epoch 59 - iter 1060/2650 - loss 0.36388361 throughput (samples/sec): 101.83 -2019-08-09 05:33:46,469 epoch 59 - iter 1325/2650 - loss 0.36275394 throughput (samples/sec): 105.45 -2019-08-09 05:35:09,203 epoch 59 - iter 1590/2650 - loss 0.36347244 throughput (samples/sec): 102.55 -2019-08-09 05:36:31,668 epoch 59 - iter 1855/2650 - loss 0.36301514 throughput (samples/sec): 102.88 -2019-08-09 05:37:53,474 epoch 59 - iter 2120/2650 - loss 0.36279557 throughput (samples/sec): 103.71 -2019-08-09 05:39:16,274 epoch 59 - iter 2385/2650 - loss 0.36415255 throughput (samples/sec): 102.47 -2019-08-09 05:40:39,909 ---------------------------------------------------------------------------------------------------- -2019-08-09 05:40:39,910 EPOCH 59 done: loss 0.3670 - lr 0.1000 -2019-08-09 05:40:39,910 BAD EPOCHS (no improvement): 0 -2019-08-09 05:40:39,910 ---------------------------------------------------------------------------------------------------- -2019-08-09 05:40:40,496 epoch 60 - iter 0/2650 - loss 0.26972023 throughput (samples/sec): 14548.73 -2019-08-09 05:42:03,708 epoch 60 - iter 265/2650 - loss 0.35596939 throughput (samples/sec): 101.96 -2019-08-09 05:43:26,879 epoch 60 - iter 530/2650 - loss 0.34652247 throughput (samples/sec): 102.01 -2019-08-09 05:44:47,930 epoch 60 - iter 795/2650 - loss 0.35251211 throughput (samples/sec): 104.68 -2019-08-09 05:46:10,838 epoch 60 - iter 1060/2650 - loss 0.35858719 throughput (samples/sec): 102.34 -2019-08-09 05:47:31,712 epoch 60 - iter 1325/2650 - loss 0.36346615 throughput (samples/sec): 104.91 -2019-08-09 05:48:56,080 epoch 60 - iter 1590/2650 - loss 0.36325367 throughput (samples/sec): 100.56 -2019-08-09 05:50:18,609 epoch 60 - iter 1855/2650 - loss 0.36322803 throughput (samples/sec): 102.81 -2019-08-09 05:51:42,326 epoch 60 - iter 2120/2650 - loss 0.36251073 throughput (samples/sec): 101.35 -2019-08-09 05:53:06,199 epoch 60 - iter 2385/2650 - loss 0.36531086 throughput (samples/sec): 101.16 -2019-08-09 05:54:27,454 ---------------------------------------------------------------------------------------------------- -2019-08-09 05:54:27,454 EPOCH 60 done: loss 0.3675 - lr 0.1000 -2019-08-09 05:54:27,454 BAD EPOCHS (no improvement): 1 -2019-08-09 05:54:27,454 ---------------------------------------------------------------------------------------------------- -2019-08-09 05:54:27,777 epoch 61 - iter 0/2650 - loss 0.68050355 throughput (samples/sec): 26611.12 -2019-08-09 05:55:50,938 epoch 61 - iter 265/2650 - loss 0.33620053 throughput (samples/sec): 102.02 -2019-08-09 05:57:16,214 epoch 61 - iter 530/2650 - loss 0.34450372 throughput (samples/sec): 99.49 -2019-08-09 05:58:40,326 epoch 61 - iter 795/2650 - loss 0.34794200 throughput (samples/sec): 100.87 -2019-08-09 06:00:02,108 epoch 61 - iter 1060/2650 - loss 0.35209426 throughput (samples/sec): 103.74 -2019-08-09 06:01:23,113 epoch 61 - iter 1325/2650 - loss 0.35038437 throughput (samples/sec): 104.74 -2019-08-09 06:02:45,687 epoch 61 - iter 1590/2650 - loss 0.35224204 throughput (samples/sec): 102.75 -2019-08-09 06:04:09,537 epoch 61 - iter 1855/2650 - loss 0.35873282 throughput (samples/sec): 101.19 -2019-08-09 06:05:31,570 epoch 61 - iter 2120/2650 - loss 0.36019087 throughput (samples/sec): 103.43 -2019-08-09 06:06:54,340 epoch 61 - iter 2385/2650 - loss 0.36080942 throughput (samples/sec): 102.51 -2019-08-09 06:08:17,502 ---------------------------------------------------------------------------------------------------- -2019-08-09 06:08:17,502 EPOCH 61 done: loss 0.3628 - lr 0.1000 -2019-08-09 06:08:17,502 BAD EPOCHS (no improvement): 0 -2019-08-09 06:08:17,502 ---------------------------------------------------------------------------------------------------- -2019-08-09 06:08:17,885 epoch 62 - iter 0/2650 - loss 0.30890334 throughput (samples/sec): 22366.92 -2019-08-09 06:09:39,853 epoch 62 - iter 265/2650 - loss 0.32484659 throughput (samples/sec): 103.51 -2019-08-09 06:11:01,481 epoch 62 - iter 530/2650 - loss 0.33426627 throughput (samples/sec): 103.94 -2019-08-09 06:12:25,266 epoch 62 - iter 795/2650 - loss 0.33956285 throughput (samples/sec): 101.26 -2019-08-09 06:13:47,406 epoch 62 - iter 1060/2650 - loss 0.34668590 throughput (samples/sec): 103.29 -2019-08-09 06:15:09,560 epoch 62 - iter 1325/2650 - loss 0.34699311 throughput (samples/sec): 103.27 -2019-08-09 06:16:32,966 epoch 62 - iter 1590/2650 - loss 0.35044802 throughput (samples/sec): 101.73 -2019-08-09 06:17:56,546 epoch 62 - iter 1855/2650 - loss 0.35164225 throughput (samples/sec): 101.51 -2019-08-09 06:19:18,214 epoch 62 - iter 2120/2650 - loss 0.35043199 throughput (samples/sec): 103.89 -2019-08-09 06:20:39,762 epoch 62 - iter 2385/2650 - loss 0.35430279 throughput (samples/sec): 104.04 -2019-08-09 06:22:00,187 ---------------------------------------------------------------------------------------------------- -2019-08-09 06:22:00,187 EPOCH 62 done: loss 0.3564 - lr 0.1000 -2019-08-09 06:22:00,187 BAD EPOCHS (no improvement): 0 -2019-08-09 06:22:00,188 ---------------------------------------------------------------------------------------------------- -2019-08-09 06:22:00,533 epoch 63 - iter 0/2650 - loss 0.03154677 throughput (samples/sec): 24783.52 -2019-08-09 06:23:23,464 epoch 63 - iter 265/2650 - loss 0.35144677 throughput (samples/sec): 102.30 -2019-08-09 06:24:45,239 epoch 63 - iter 530/2650 - loss 0.35472407 throughput (samples/sec): 103.75 -2019-08-09 06:26:08,350 epoch 63 - iter 795/2650 - loss 0.34541597 throughput (samples/sec): 102.08 -2019-08-09 06:27:33,245 epoch 63 - iter 1060/2650 - loss 0.34827135 throughput (samples/sec): 99.94 -2019-08-09 06:28:57,288 epoch 63 - iter 1325/2650 - loss 0.35060088 throughput (samples/sec): 100.95 -2019-08-09 06:30:20,739 epoch 63 - iter 1590/2650 - loss 0.35375431 throughput (samples/sec): 101.67 -2019-08-09 06:31:43,634 epoch 63 - iter 1855/2650 - loss 0.35328191 throughput (samples/sec): 102.35 -2019-08-09 06:33:08,463 epoch 63 - iter 2120/2650 - loss 0.35263203 throughput (samples/sec): 100.02 -2019-08-09 06:34:31,381 epoch 63 - iter 2385/2650 - loss 0.35155876 throughput (samples/sec): 102.32 -2019-08-09 06:35:56,760 ---------------------------------------------------------------------------------------------------- -2019-08-09 06:35:56,760 EPOCH 63 done: loss 0.3536 - lr 0.1000 -2019-08-09 06:35:56,760 BAD EPOCHS (no improvement): 0 -2019-08-09 06:35:56,761 ---------------------------------------------------------------------------------------------------- -2019-08-09 06:35:57,015 epoch 64 - iter 0/2650 - loss 0.49458182 throughput (samples/sec): 33762.61 -2019-08-09 06:37:19,867 epoch 64 - iter 265/2650 - loss 0.33807563 throughput (samples/sec): 102.40 -2019-08-09 06:38:44,453 epoch 64 - iter 530/2650 - loss 0.35150931 throughput (samples/sec): 100.30 -2019-08-09 06:40:08,657 epoch 64 - iter 795/2650 - loss 0.35073512 throughput (samples/sec): 100.76 -2019-08-09 06:41:30,829 epoch 64 - iter 1060/2650 - loss 0.35228758 throughput (samples/sec): 103.25 -2019-08-09 06:42:51,518 epoch 64 - iter 1325/2650 - loss 0.35157623 throughput (samples/sec): 105.15 -2019-08-09 06:44:13,511 epoch 64 - iter 1590/2650 - loss 0.34838364 throughput (samples/sec): 103.48 -2019-08-09 06:45:35,846 epoch 64 - iter 1855/2650 - loss 0.35110597 throughput (samples/sec): 103.05 -2019-08-09 06:46:59,023 epoch 64 - iter 2120/2650 - loss 0.34871531 throughput (samples/sec): 102.00 -2019-08-09 06:48:20,512 epoch 64 - iter 2385/2650 - loss 0.34812533 throughput (samples/sec): 104.12 -2019-08-09 06:49:42,223 ---------------------------------------------------------------------------------------------------- -2019-08-09 06:49:42,223 EPOCH 64 done: loss 0.3473 - lr 0.1000 -2019-08-09 06:49:42,223 BAD EPOCHS (no improvement): 0 -2019-08-09 06:49:42,224 ---------------------------------------------------------------------------------------------------- -2019-08-09 06:49:42,587 epoch 65 - iter 0/2650 - loss 0.60719252 throughput (samples/sec): 23607.91 -2019-08-09 06:51:07,390 epoch 65 - iter 265/2650 - loss 0.31520389 throughput (samples/sec): 100.05 -2019-08-09 06:52:27,616 epoch 65 - iter 530/2650 - loss 0.32423416 throughput (samples/sec): 105.76 -2019-08-09 06:53:49,968 epoch 65 - iter 795/2650 - loss 0.32984044 throughput (samples/sec): 103.03 -2019-08-09 06:55:11,748 epoch 65 - iter 1060/2650 - loss 0.34077694 throughput (samples/sec): 103.74 -2019-08-09 06:56:33,135 epoch 65 - iter 1325/2650 - loss 0.33595393 throughput (samples/sec): 104.25 -2019-08-09 06:57:56,075 epoch 65 - iter 1590/2650 - loss 0.33927080 throughput (samples/sec): 102.29 -2019-08-09 06:59:20,130 epoch 65 - iter 1855/2650 - loss 0.34398690 throughput (samples/sec): 100.94 -2019-08-09 07:00:42,888 epoch 65 - iter 2120/2650 - loss 0.34478157 throughput (samples/sec): 102.52 -2019-08-09 07:02:07,189 epoch 65 - iter 2385/2650 - loss 0.34748996 throughput (samples/sec): 100.64 -2019-08-09 07:03:30,341 ---------------------------------------------------------------------------------------------------- -2019-08-09 07:03:30,342 EPOCH 65 done: loss 0.3479 - lr 0.1000 -2019-08-09 07:03:30,342 BAD EPOCHS (no improvement): 1 -2019-08-09 07:03:30,342 ---------------------------------------------------------------------------------------------------- -2019-08-09 07:03:30,668 epoch 66 - iter 0/2650 - loss 0.24990249 throughput (samples/sec): 26309.71 -2019-08-09 07:04:56,771 epoch 66 - iter 265/2650 - loss 0.32923589 throughput (samples/sec): 98.53 -2019-08-09 07:06:21,966 epoch 66 - iter 530/2650 - loss 0.33574829 throughput (samples/sec): 99.59 -2019-08-09 07:07:46,538 epoch 66 - iter 795/2650 - loss 0.33981214 throughput (samples/sec): 100.32 -2019-08-09 07:09:09,342 epoch 66 - iter 1060/2650 - loss 0.34213201 throughput (samples/sec): 102.46 -2019-08-09 07:10:32,507 epoch 66 - iter 1325/2650 - loss 0.34627009 throughput (samples/sec): 102.02 -2019-08-09 07:11:55,283 epoch 66 - iter 1590/2650 - loss 0.34442420 throughput (samples/sec): 102.50 -2019-08-09 07:13:16,536 epoch 66 - iter 1855/2650 - loss 0.34665045 throughput (samples/sec): 104.42 -2019-08-09 07:14:37,756 epoch 66 - iter 2120/2650 - loss 0.34795122 throughput (samples/sec): 104.46 -2019-08-09 07:15:59,636 epoch 66 - iter 2385/2650 - loss 0.34921750 throughput (samples/sec): 103.62 -2019-08-09 07:17:20,423 ---------------------------------------------------------------------------------------------------- -2019-08-09 07:17:20,423 EPOCH 66 done: loss 0.3514 - lr 0.1000 -2019-08-09 07:17:20,423 BAD EPOCHS (no improvement): 2 -2019-08-09 07:17:20,423 ---------------------------------------------------------------------------------------------------- -2019-08-09 07:17:20,680 epoch 67 - iter 0/2650 - loss 0.23841500 throughput (samples/sec): 33449.19 -2019-08-09 07:18:40,457 epoch 67 - iter 265/2650 - loss 0.33053121 throughput (samples/sec): 106.35 -2019-08-09 07:20:01,493 epoch 67 - iter 530/2650 - loss 0.32953256 throughput (samples/sec): 104.70 -2019-08-09 07:21:22,145 epoch 67 - iter 795/2650 - loss 0.33071661 throughput (samples/sec): 105.20 -2019-08-09 07:22:43,137 epoch 67 - iter 1060/2650 - loss 0.33691458 throughput (samples/sec): 104.75 -2019-08-09 07:24:04,865 epoch 67 - iter 1325/2650 - loss 0.34296311 throughput (samples/sec): 103.81 -2019-08-09 07:25:27,105 epoch 67 - iter 1590/2650 - loss 0.34678174 throughput (samples/sec): 103.16 -2019-08-09 07:26:49,446 epoch 67 - iter 1855/2650 - loss 0.34619060 throughput (samples/sec): 103.04 -2019-08-09 07:28:12,933 epoch 67 - iter 2120/2650 - loss 0.34612955 throughput (samples/sec): 101.62 -2019-08-09 07:29:33,943 epoch 67 - iter 2385/2650 - loss 0.34510879 throughput (samples/sec): 104.73 -2019-08-09 07:30:55,377 ---------------------------------------------------------------------------------------------------- -2019-08-09 07:30:55,378 EPOCH 67 done: loss 0.3470 - lr 0.1000 -2019-08-09 07:30:55,378 BAD EPOCHS (no improvement): 0 -2019-08-09 07:30:55,378 ---------------------------------------------------------------------------------------------------- -2019-08-09 07:30:55,804 epoch 68 - iter 0/2650 - loss 0.30723965 throughput (samples/sec): 20057.39 -2019-08-09 07:32:16,725 epoch 68 - iter 265/2650 - loss 0.31669102 throughput (samples/sec): 104.85 -2019-08-09 07:33:41,889 epoch 68 - iter 530/2650 - loss 0.32888064 throughput (samples/sec): 99.62 -2019-08-09 07:35:05,272 epoch 68 - iter 795/2650 - loss 0.33417488 throughput (samples/sec): 101.75 -2019-08-09 07:36:28,303 epoch 68 - iter 1060/2650 - loss 0.33628580 throughput (samples/sec): 102.18 -2019-08-09 07:37:48,640 epoch 68 - iter 1325/2650 - loss 0.33765216 throughput (samples/sec): 105.61 -2019-08-09 07:39:11,007 epoch 68 - iter 1590/2650 - loss 0.33971018 throughput (samples/sec): 103.00 -2019-08-09 07:40:31,991 epoch 68 - iter 1855/2650 - loss 0.34018416 throughput (samples/sec): 104.77 -2019-08-09 07:41:56,703 epoch 68 - iter 2120/2650 - loss 0.34198386 throughput (samples/sec): 100.15 -2019-08-09 07:43:20,000 epoch 68 - iter 2385/2650 - loss 0.34498222 throughput (samples/sec): 101.85 -2019-08-09 07:44:43,160 ---------------------------------------------------------------------------------------------------- -2019-08-09 07:44:43,160 EPOCH 68 done: loss 0.3462 - lr 0.1000 -2019-08-09 07:44:43,160 BAD EPOCHS (no improvement): 0 -2019-08-09 07:44:43,160 ---------------------------------------------------------------------------------------------------- -2019-08-09 07:44:43,430 epoch 69 - iter 0/2650 - loss 0.40565690 throughput (samples/sec): 31896.56 -2019-08-09 07:46:05,717 epoch 69 - iter 265/2650 - loss 0.31545964 throughput (samples/sec): 103.10 -2019-08-09 07:47:25,139 epoch 69 - iter 530/2650 - loss 0.31466262 throughput (samples/sec): 106.83 -2019-08-09 07:48:47,890 epoch 69 - iter 795/2650 - loss 0.32178738 throughput (samples/sec): 102.53 -2019-08-09 07:50:11,742 epoch 69 - iter 1060/2650 - loss 0.32333840 throughput (samples/sec): 101.18 -2019-08-09 07:51:35,414 epoch 69 - iter 1325/2650 - loss 0.33016077 throughput (samples/sec): 101.40 -2019-08-09 07:52:56,475 epoch 69 - iter 1590/2650 - loss 0.33248403 throughput (samples/sec): 104.67 -2019-08-09 07:54:17,446 epoch 69 - iter 1855/2650 - loss 0.33080408 throughput (samples/sec): 104.78 -2019-08-09 07:55:41,211 epoch 69 - iter 2120/2650 - loss 0.33508073 throughput (samples/sec): 101.28 -2019-08-09 07:57:03,936 epoch 69 - iter 2385/2650 - loss 0.33791405 throughput (samples/sec): 102.56 -2019-08-09 07:58:26,735 ---------------------------------------------------------------------------------------------------- -2019-08-09 07:58:26,735 EPOCH 69 done: loss 0.3412 - lr 0.1000 -2019-08-09 07:58:26,735 BAD EPOCHS (no improvement): 0 -2019-08-09 07:58:26,735 ---------------------------------------------------------------------------------------------------- -2019-08-09 07:58:27,008 epoch 70 - iter 0/2650 - loss 0.47725016 throughput (samples/sec): 31557.67 -2019-08-09 07:59:49,724 epoch 70 - iter 265/2650 - loss 0.34151898 throughput (samples/sec): 102.57 -2019-08-09 08:01:10,322 epoch 70 - iter 530/2650 - loss 0.33867500 throughput (samples/sec): 105.27 -2019-08-09 08:02:31,949 epoch 70 - iter 795/2650 - loss 0.34070681 throughput (samples/sec): 103.94 -2019-08-09 08:03:52,031 epoch 70 - iter 1060/2650 - loss 0.33965867 throughput (samples/sec): 105.95 -2019-08-09 08:05:13,968 epoch 70 - iter 1325/2650 - loss 0.33856695 throughput (samples/sec): 103.55 -2019-08-09 08:06:39,087 epoch 70 - iter 1590/2650 - loss 0.33996088 throughput (samples/sec): 99.67 -2019-08-09 08:08:01,013 epoch 70 - iter 1855/2650 - loss 0.34262736 throughput (samples/sec): 103.56 -2019-08-09 08:09:23,299 epoch 70 - iter 2120/2650 - loss 0.33986874 throughput (samples/sec): 103.11 -2019-08-09 08:10:45,280 epoch 70 - iter 2385/2650 - loss 0.34047718 throughput (samples/sec): 103.49 -2019-08-09 08:12:05,451 ---------------------------------------------------------------------------------------------------- -2019-08-09 08:12:05,451 EPOCH 70 done: loss 0.3431 - lr 0.1000 -2019-08-09 08:12:05,451 BAD EPOCHS (no improvement): 1 -2019-08-09 08:12:05,451 ---------------------------------------------------------------------------------------------------- -2019-08-09 08:12:05,725 epoch 71 - iter 0/2650 - loss 0.29786670 throughput (samples/sec): 31383.77 -2019-08-09 08:13:26,599 epoch 71 - iter 265/2650 - loss 0.33736401 throughput (samples/sec): 104.91 -2019-08-09 08:14:48,224 epoch 71 - iter 530/2650 - loss 0.32454814 throughput (samples/sec): 103.94 -2019-08-09 08:16:09,595 epoch 71 - iter 795/2650 - loss 0.32779859 throughput (samples/sec): 104.27 -2019-08-09 08:17:35,389 epoch 71 - iter 1060/2650 - loss 0.33001096 throughput (samples/sec): 98.89 -2019-08-09 08:18:57,093 epoch 71 - iter 1325/2650 - loss 0.33005569 throughput (samples/sec): 103.84 -2019-08-09 08:20:20,939 epoch 71 - iter 1590/2650 - loss 0.33259240 throughput (samples/sec): 101.19 -2019-08-09 08:21:42,727 epoch 71 - iter 1855/2650 - loss 0.33435206 throughput (samples/sec): 103.74 -2019-08-09 08:23:04,561 epoch 71 - iter 2120/2650 - loss 0.33684745 throughput (samples/sec): 103.68 -2019-08-09 08:24:26,684 epoch 71 - iter 2385/2650 - loss 0.34071832 throughput (samples/sec): 103.31 -2019-08-09 08:25:49,580 ---------------------------------------------------------------------------------------------------- -2019-08-09 08:25:49,580 EPOCH 71 done: loss 0.3418 - lr 0.1000 -2019-08-09 08:25:49,580 BAD EPOCHS (no improvement): 2 -2019-08-09 08:25:49,581 ---------------------------------------------------------------------------------------------------- -2019-08-09 08:25:49,986 epoch 72 - iter 0/2650 - loss 0.23228300 throughput (samples/sec): 21138.11 -2019-08-09 08:27:25,693 epoch 72 - iter 265/2650 - loss 0.31584713 throughput (samples/sec): 88.64 -2019-08-09 08:28:55,599 epoch 72 - iter 530/2650 - loss 0.32362408 throughput (samples/sec): 94.37 -2019-08-09 08:30:26,582 epoch 72 - iter 795/2650 - loss 0.33195156 throughput (samples/sec): 93.25 -2019-08-09 08:32:04,142 epoch 72 - iter 1060/2650 - loss 0.33623729 throughput (samples/sec): 86.96 -2019-08-09 08:33:45,588 epoch 72 - iter 1325/2650 - loss 0.33332673 throughput (samples/sec): 83.63 -2019-08-09 08:35:17,915 epoch 72 - iter 1590/2650 - loss 0.33417906 throughput (samples/sec): 91.89 -2019-08-09 08:36:44,090 epoch 72 - iter 1855/2650 - loss 0.33468434 throughput (samples/sec): 98.45 -2019-08-09 08:38:09,038 epoch 72 - iter 2120/2650 - loss 0.33609853 throughput (samples/sec): 99.87 -2019-08-09 08:39:43,660 epoch 72 - iter 2385/2650 - loss 0.33561242 throughput (samples/sec): 89.66 -2019-08-09 08:41:15,501 ---------------------------------------------------------------------------------------------------- -2019-08-09 08:41:15,501 EPOCH 72 done: loss 0.3355 - lr 0.1000 -2019-08-09 08:41:15,501 BAD EPOCHS (no improvement): 0 -2019-08-09 08:41:15,501 ---------------------------------------------------------------------------------------------------- -2019-08-09 08:41:15,812 epoch 73 - iter 0/2650 - loss 0.26158822 throughput (samples/sec): 27630.16 -2019-08-09 08:42:49,873 epoch 73 - iter 265/2650 - loss 0.33235066 throughput (samples/sec): 90.19 -2019-08-09 08:44:25,264 epoch 73 - iter 530/2650 - loss 0.32843048 throughput (samples/sec): 88.93 -2019-08-09 08:46:00,777 epoch 73 - iter 795/2650 - loss 0.33052716 throughput (samples/sec): 88.82 -2019-08-09 08:47:43,765 epoch 73 - iter 1060/2650 - loss 0.32837260 throughput (samples/sec): 82.37 -2019-08-09 08:49:18,238 epoch 73 - iter 1325/2650 - loss 0.33065898 throughput (samples/sec): 89.80 -2019-08-09 08:50:58,921 epoch 73 - iter 1590/2650 - loss 0.32848799 throughput (samples/sec): 84.26 -2019-08-09 08:52:32,300 epoch 73 - iter 1855/2650 - loss 0.33179161 throughput (samples/sec): 90.86 -2019-08-09 08:54:14,805 epoch 73 - iter 2120/2650 - loss 0.33076263 throughput (samples/sec): 82.76 -2019-08-09 08:55:53,316 epoch 73 - iter 2385/2650 - loss 0.32963617 throughput (samples/sec): 86.12 -2019-08-09 08:57:33,403 ---------------------------------------------------------------------------------------------------- -2019-08-09 08:57:33,403 EPOCH 73 done: loss 0.3342 - lr 0.1000 -2019-08-09 08:57:33,403 BAD EPOCHS (no improvement): 0 -2019-08-09 08:57:33,404 ---------------------------------------------------------------------------------------------------- -2019-08-09 08:57:33,653 epoch 74 - iter 0/2650 - loss 0.08657974 throughput (samples/sec): 34530.81 -2019-08-09 08:59:09,648 epoch 74 - iter 265/2650 - loss 0.32324335 throughput (samples/sec): 88.38 -2019-08-09 09:00:47,306 epoch 74 - iter 530/2650 - loss 0.32153569 throughput (samples/sec): 86.87 -2019-08-09 09:02:25,366 epoch 74 - iter 795/2650 - loss 0.32676304 throughput (samples/sec): 86.51 -2019-08-09 09:03:58,105 epoch 74 - iter 1060/2650 - loss 0.32842641 throughput (samples/sec): 91.48 -2019-08-09 09:05:37,146 epoch 74 - iter 1325/2650 - loss 0.32855754 throughput (samples/sec): 85.66 -2019-08-09 09:07:11,876 epoch 74 - iter 1590/2650 - loss 0.32878555 throughput (samples/sec): 89.56 -2019-08-09 09:08:51,117 epoch 74 - iter 1855/2650 - loss 0.32984982 throughput (samples/sec): 85.49 -2019-08-09 09:10:23,855 epoch 74 - iter 2120/2650 - loss 0.33248968 throughput (samples/sec): 91.48 -2019-08-09 09:12:06,696 epoch 74 - iter 2385/2650 - loss 0.33254522 throughput (samples/sec): 82.49 -2019-08-09 09:13:39,281 ---------------------------------------------------------------------------------------------------- -2019-08-09 09:13:39,282 EPOCH 74 done: loss 0.3336 - lr 0.1000 -2019-08-09 09:13:39,282 BAD EPOCHS (no improvement): 0 -2019-08-09 09:13:39,282 ---------------------------------------------------------------------------------------------------- -2019-08-09 09:13:39,552 epoch 75 - iter 0/2650 - loss 0.09408331 throughput (samples/sec): 31800.43 -2019-08-09 09:15:21,989 epoch 75 - iter 265/2650 - loss 0.33156495 throughput (samples/sec): 82.82 -2019-08-09 09:16:54,041 epoch 75 - iter 530/2650 - loss 0.33490143 throughput (samples/sec): 92.16 -2019-08-09 09:18:40,102 epoch 75 - iter 795/2650 - loss 0.32275260 throughput (samples/sec): 79.99 -2019-08-09 09:20:12,665 epoch 75 - iter 1060/2650 - loss 0.32605747 throughput (samples/sec): 91.65 -2019-08-09 09:21:53,430 epoch 75 - iter 1325/2650 - loss 0.32688760 throughput (samples/sec): 84.19 -2019-08-09 09:23:26,525 epoch 75 - iter 1590/2650 - loss 0.32824917 throughput (samples/sec): 91.13 -2019-08-09 09:25:07,180 epoch 75 - iter 1855/2650 - loss 0.33006532 throughput (samples/sec): 84.28 -2019-08-09 09:26:37,763 epoch 75 - iter 2120/2650 - loss 0.33221342 throughput (samples/sec): 93.66 -2019-08-09 09:28:01,772 epoch 75 - iter 2385/2650 - loss 0.33427798 throughput (samples/sec): 100.99 -2019-08-09 09:29:28,696 ---------------------------------------------------------------------------------------------------- -2019-08-09 09:29:28,697 EPOCH 75 done: loss 0.3325 - lr 0.1000 -2019-08-09 09:29:28,697 BAD EPOCHS (no improvement): 0 -2019-08-09 09:29:28,697 ---------------------------------------------------------------------------------------------------- -2019-08-09 09:29:29,341 epoch 76 - iter 0/2650 - loss 0.16890788 throughput (samples/sec): 13242.19 -2019-08-09 09:31:25,378 epoch 76 - iter 265/2650 - loss 0.34698483 throughput (samples/sec): 73.11 -2019-08-09 09:33:02,315 epoch 76 - iter 530/2650 - loss 0.34180761 throughput (samples/sec): 87.52 -2019-08-09 09:34:21,732 epoch 76 - iter 795/2650 - loss 0.33286836 throughput (samples/sec): 106.83 -2019-08-09 09:35:45,420 epoch 76 - iter 1060/2650 - loss 0.33298006 throughput (samples/sec): 101.38 -2019-08-09 09:37:08,700 epoch 76 - iter 1325/2650 - loss 0.33354120 throughput (samples/sec): 101.88 -2019-08-09 09:38:32,416 epoch 76 - iter 1590/2650 - loss 0.33247678 throughput (samples/sec): 101.35 -2019-08-09 09:39:57,178 epoch 76 - iter 1855/2650 - loss 0.33164240 throughput (samples/sec): 100.09 -2019-08-09 09:41:16,920 epoch 76 - iter 2120/2650 - loss 0.33182812 throughput (samples/sec): 106.40 -2019-08-09 09:42:39,985 epoch 76 - iter 2385/2650 - loss 0.33241933 throughput (samples/sec): 102.14 -2019-08-09 09:44:00,036 ---------------------------------------------------------------------------------------------------- -2019-08-09 09:44:00,036 EPOCH 76 done: loss 0.3332 - lr 0.1000 -2019-08-09 09:44:00,036 BAD EPOCHS (no improvement): 1 -2019-08-09 09:44:00,037 ---------------------------------------------------------------------------------------------------- -2019-08-09 09:44:00,341 epoch 77 - iter 0/2650 - loss 0.24152076 throughput (samples/sec): 28191.86 -2019-08-09 09:45:21,976 epoch 77 - iter 265/2650 - loss 0.29650343 throughput (samples/sec): 103.93 -2019-08-09 09:46:43,369 epoch 77 - iter 530/2650 - loss 0.30038449 throughput (samples/sec): 104.24 -2019-08-09 09:48:05,563 epoch 77 - iter 795/2650 - loss 0.30312418 throughput (samples/sec): 103.22 -2019-08-09 09:49:30,999 epoch 77 - iter 1060/2650 - loss 0.30719886 throughput (samples/sec): 99.30 -2019-08-09 09:50:53,423 epoch 77 - iter 1325/2650 - loss 0.30930167 throughput (samples/sec): 102.93 -2019-08-09 09:52:16,703 epoch 77 - iter 1590/2650 - loss 0.31038801 throughput (samples/sec): 101.88 -2019-08-09 09:53:40,647 epoch 77 - iter 1855/2650 - loss 0.31518836 throughput (samples/sec): 101.07 -2019-08-09 09:55:04,746 epoch 77 - iter 2120/2650 - loss 0.31659367 throughput (samples/sec): 100.89 -2019-08-09 09:56:29,989 epoch 77 - iter 2385/2650 - loss 0.31764185 throughput (samples/sec): 99.53 -2019-08-09 09:57:53,627 ---------------------------------------------------------------------------------------------------- -2019-08-09 09:57:53,627 EPOCH 77 done: loss 0.3208 - lr 0.1000 -2019-08-09 09:57:53,627 BAD EPOCHS (no improvement): 0 -2019-08-09 09:57:53,627 ---------------------------------------------------------------------------------------------------- -2019-08-09 09:57:53,928 epoch 78 - iter 0/2650 - loss 0.45161021 throughput (samples/sec): 28586.46 -2019-08-09 09:59:17,726 epoch 78 - iter 265/2650 - loss 0.30364715 throughput (samples/sec): 101.25 -2019-08-09 10:00:40,869 epoch 78 - iter 530/2650 - loss 0.31254427 throughput (samples/sec): 102.04 -2019-08-09 10:02:04,983 epoch 78 - iter 795/2650 - loss 0.30816190 throughput (samples/sec): 100.87 -2019-08-09 10:03:28,964 epoch 78 - iter 1060/2650 - loss 0.31017545 throughput (samples/sec): 101.03 -2019-08-09 10:04:51,818 epoch 78 - iter 1325/2650 - loss 0.31560525 throughput (samples/sec): 102.40 -2019-08-09 10:06:15,625 epoch 78 - iter 1590/2650 - loss 0.31630532 throughput (samples/sec): 101.24 -2019-08-09 10:07:37,931 epoch 78 - iter 1855/2650 - loss 0.31797836 throughput (samples/sec): 103.08 -2019-08-09 10:09:08,897 epoch 78 - iter 2120/2650 - loss 0.31952762 throughput (samples/sec): 93.27 -2019-08-09 10:11:06,975 epoch 78 - iter 2385/2650 - loss 0.31945613 throughput (samples/sec): 71.84 -2019-08-09 10:12:52,596 ---------------------------------------------------------------------------------------------------- -2019-08-09 10:12:52,596 EPOCH 78 done: loss 0.3206 - lr 0.1000 -2019-08-09 10:12:52,596 BAD EPOCHS (no improvement): 0 -2019-08-09 10:12:52,596 ---------------------------------------------------------------------------------------------------- -2019-08-09 10:12:52,854 epoch 79 - iter 0/2650 - loss 0.21588692 throughput (samples/sec): 33426.87 -2019-08-09 10:14:17,366 epoch 79 - iter 265/2650 - loss 0.32367463 throughput (samples/sec): 100.39 -2019-08-09 10:15:41,259 epoch 79 - iter 530/2650 - loss 0.31082837 throughput (samples/sec): 101.13 -2019-08-09 10:17:04,813 epoch 79 - iter 795/2650 - loss 0.31142644 throughput (samples/sec): 101.55 -2019-08-09 10:18:27,519 epoch 79 - iter 1060/2650 - loss 0.31490493 throughput (samples/sec): 102.59 -2019-08-09 10:19:52,885 epoch 79 - iter 1325/2650 - loss 0.32007455 throughput (samples/sec): 99.39 -2019-08-09 10:21:15,284 epoch 79 - iter 1590/2650 - loss 0.32058432 throughput (samples/sec): 102.97 -2019-08-09 10:22:40,494 epoch 79 - iter 1855/2650 - loss 0.32037777 throughput (samples/sec): 99.57 -2019-08-09 10:24:03,672 epoch 79 - iter 2120/2650 - loss 0.31987012 throughput (samples/sec): 102.00 -2019-08-09 10:25:29,194 epoch 79 - iter 2385/2650 - loss 0.32033809 throughput (samples/sec): 99.20 -2019-08-09 10:26:53,817 ---------------------------------------------------------------------------------------------------- -2019-08-09 10:26:53,818 EPOCH 79 done: loss 0.3231 - lr 0.1000 -2019-08-09 10:26:53,818 BAD EPOCHS (no improvement): 1 -2019-08-09 10:26:53,818 ---------------------------------------------------------------------------------------------------- -2019-08-09 10:26:54,066 epoch 80 - iter 0/2650 - loss 0.23076129 throughput (samples/sec): 34649.05 -2019-08-09 10:28:17,911 epoch 80 - iter 265/2650 - loss 0.31810135 throughput (samples/sec): 101.19 -2019-08-09 10:29:42,986 epoch 80 - iter 530/2650 - loss 0.32409668 throughput (samples/sec): 99.73 -2019-08-09 10:31:06,159 epoch 80 - iter 795/2650 - loss 0.31993939 throughput (samples/sec): 102.01 -2019-08-09 10:32:29,436 epoch 80 - iter 1060/2650 - loss 0.32170192 throughput (samples/sec): 101.88 -2019-08-09 10:33:53,308 epoch 80 - iter 1325/2650 - loss 0.32047657 throughput (samples/sec): 101.16 -2019-08-09 10:35:16,109 epoch 80 - iter 1590/2650 - loss 0.31846327 throughput (samples/sec): 102.47 -2019-08-09 10:36:38,861 epoch 80 - iter 1855/2650 - loss 0.31717777 throughput (samples/sec): 102.53 -2019-08-09 10:38:02,017 epoch 80 - iter 2120/2650 - loss 0.31817937 throughput (samples/sec): 102.03 -2019-08-09 10:39:25,733 epoch 80 - iter 2385/2650 - loss 0.31957387 throughput (samples/sec): 101.34 -2019-08-09 10:41:07,432 ---------------------------------------------------------------------------------------------------- -2019-08-09 10:41:07,432 EPOCH 80 done: loss 0.3206 - lr 0.1000 -2019-08-09 10:41:07,433 BAD EPOCHS (no improvement): 2 -2019-08-09 10:41:07,433 ---------------------------------------------------------------------------------------------------- -2019-08-09 10:41:07,821 epoch 81 - iter 0/2650 - loss 0.36149973 throughput (samples/sec): 22023.03 -2019-08-09 10:43:05,045 epoch 81 - iter 265/2650 - loss 0.30808720 throughput (samples/sec): 72.37 -2019-08-09 10:44:54,702 epoch 81 - iter 530/2650 - loss 0.31844341 throughput (samples/sec): 77.36 -2019-08-09 10:46:48,399 epoch 81 - iter 795/2650 - loss 0.31905251 throughput (samples/sec): 74.61 -2019-08-09 10:48:40,058 epoch 81 - iter 1060/2650 - loss 0.31885485 throughput (samples/sec): 75.98 -2019-08-09 10:50:25,693 epoch 81 - iter 1325/2650 - loss 0.31720529 throughput (samples/sec): 80.31 -2019-08-09 10:52:09,632 epoch 81 - iter 1590/2650 - loss 0.32266336 throughput (samples/sec): 81.62 -2019-08-09 10:53:54,891 epoch 81 - iter 1855/2650 - loss 0.32366253 throughput (samples/sec): 80.60 -2019-08-09 10:55:43,273 epoch 81 - iter 2120/2650 - loss 0.32280080 throughput (samples/sec): 78.27 -2019-08-09 10:57:30,966 epoch 81 - iter 2385/2650 - loss 0.32165641 throughput (samples/sec): 78.78 -2019-08-09 10:59:17,949 ---------------------------------------------------------------------------------------------------- -2019-08-09 10:59:17,949 EPOCH 81 done: loss 0.3234 - lr 0.1000 -2019-08-09 10:59:17,949 BAD EPOCHS (no improvement): 3 -2019-08-09 10:59:17,949 ---------------------------------------------------------------------------------------------------- -2019-08-09 10:59:18,246 epoch 82 - iter 0/2650 - loss 0.09390438 throughput (samples/sec): 28943.23 -2019-08-09 11:01:12,509 epoch 82 - iter 265/2650 - loss 0.30881999 throughput (samples/sec): 74.24 -2019-08-09 11:03:10,304 epoch 82 - iter 530/2650 - loss 0.30554365 throughput (samples/sec): 72.02 -2019-08-09 11:05:06,690 epoch 82 - iter 795/2650 - loss 0.31037079 throughput (samples/sec): 72.89 -2019-08-09 11:07:08,557 epoch 82 - iter 1060/2650 - loss 0.31102019 throughput (samples/sec): 69.61 -2019-08-09 11:09:01,284 epoch 82 - iter 1325/2650 - loss 0.31431890 throughput (samples/sec): 75.26 -2019-08-09 11:10:49,543 epoch 82 - iter 1590/2650 - loss 0.31369377 throughput (samples/sec): 78.36 -2019-08-09 11:12:37,270 epoch 82 - iter 1855/2650 - loss 0.31542990 throughput (samples/sec): 78.75 -2019-08-09 11:14:20,352 epoch 82 - iter 2120/2650 - loss 0.31785667 throughput (samples/sec): 82.30 -2019-08-09 11:16:01,180 epoch 82 - iter 2385/2650 - loss 0.31716505 throughput (samples/sec): 84.14 -2019-08-09 11:17:44,912 ---------------------------------------------------------------------------------------------------- -2019-08-09 11:17:44,912 EPOCH 82 done: loss 0.3164 - lr 0.1000 -2019-08-09 11:17:44,912 BAD EPOCHS (no improvement): 0 -2019-08-09 11:17:44,913 ---------------------------------------------------------------------------------------------------- -2019-08-09 11:17:45,182 epoch 83 - iter 0/2650 - loss 0.12523782 throughput (samples/sec): 31950.20 -2019-08-09 11:19:09,348 epoch 83 - iter 265/2650 - loss 0.32279298 throughput (samples/sec): 100.81 -2019-08-09 11:20:36,495 epoch 83 - iter 530/2650 - loss 0.31575641 throughput (samples/sec): 97.35 -2019-08-09 11:22:04,208 epoch 83 - iter 795/2650 - loss 0.30964619 throughput (samples/sec): 96.73 -2019-08-09 11:24:02,394 epoch 83 - iter 1060/2650 - loss 0.30747100 throughput (samples/sec): 71.78 -2019-08-09 11:25:56,757 epoch 83 - iter 1325/2650 - loss 0.30866441 throughput (samples/sec): 74.18 -2019-08-09 11:27:46,346 epoch 83 - iter 1590/2650 - loss 0.30978024 throughput (samples/sec): 77.41 -2019-08-09 11:29:34,084 epoch 83 - iter 1855/2650 - loss 0.31268292 throughput (samples/sec): 78.74 -2019-08-09 11:31:20,213 epoch 83 - iter 2120/2650 - loss 0.31330531 throughput (samples/sec): 79.93 -2019-08-09 11:33:05,553 epoch 83 - iter 2385/2650 - loss 0.31625315 throughput (samples/sec): 80.53 -2019-08-09 11:34:50,402 ---------------------------------------------------------------------------------------------------- -2019-08-09 11:34:50,403 EPOCH 83 done: loss 0.3161 - lr 0.1000 -2019-08-09 11:34:50,403 BAD EPOCHS (no improvement): 0 -2019-08-09 11:34:50,403 ---------------------------------------------------------------------------------------------------- -2019-08-09 11:34:50,894 epoch 84 - iter 0/2650 - loss 0.23676512 throughput (samples/sec): 17414.20 -2019-08-09 11:36:36,654 epoch 84 - iter 265/2650 - loss 0.31754365 throughput (samples/sec): 80.21 -2019-08-09 11:38:19,516 epoch 84 - iter 530/2650 - loss 0.30778167 throughput (samples/sec): 82.48 -2019-08-09 11:40:05,418 epoch 84 - iter 795/2650 - loss 0.31047747 throughput (samples/sec): 80.11 -2019-08-09 11:41:48,560 epoch 84 - iter 1060/2650 - loss 0.31234196 throughput (samples/sec): 82.25 -2019-08-09 11:43:45,101 epoch 84 - iter 1325/2650 - loss 0.31654055 throughput (samples/sec): 72.79 -2019-08-09 11:45:33,749 epoch 84 - iter 1590/2650 - loss 0.31794147 throughput (samples/sec): 78.08 -2019-08-09 11:47:20,927 epoch 84 - iter 1855/2650 - loss 0.31430145 throughput (samples/sec): 79.15 -2019-08-09 11:49:08,230 epoch 84 - iter 2120/2650 - loss 0.31527663 throughput (samples/sec): 79.06 -2019-08-09 11:50:57,547 epoch 84 - iter 2385/2650 - loss 0.31596165 throughput (samples/sec): 77.60 -2019-08-09 11:52:47,876 ---------------------------------------------------------------------------------------------------- -2019-08-09 11:52:47,876 EPOCH 84 done: loss 0.3172 - lr 0.1000 -2019-08-09 11:52:47,877 BAD EPOCHS (no improvement): 1 -2019-08-09 11:52:47,877 ---------------------------------------------------------------------------------------------------- -2019-08-09 11:52:48,190 epoch 85 - iter 0/2650 - loss 0.23364073 throughput (samples/sec): 27393.71 -2019-08-09 11:54:36,764 epoch 85 - iter 265/2650 - loss 0.30844214 throughput (samples/sec): 78.13 -2019-08-09 11:56:24,841 epoch 85 - iter 530/2650 - loss 0.31941710 throughput (samples/sec): 78.49 -2019-08-09 11:58:11,105 epoch 85 - iter 795/2650 - loss 0.31451801 throughput (samples/sec): 79.83 -2019-08-09 12:00:04,398 epoch 85 - iter 1060/2650 - loss 0.31300057 throughput (samples/sec): 74.88 -2019-08-09 12:01:51,721 epoch 85 - iter 1325/2650 - loss 0.31051471 throughput (samples/sec): 79.05 -2019-08-09 12:03:39,218 epoch 85 - iter 1590/2650 - loss 0.30991266 throughput (samples/sec): 78.92 -2019-08-09 12:05:28,300 epoch 85 - iter 1855/2650 - loss 0.31232493 throughput (samples/sec): 77.77 -2019-08-09 12:07:15,737 epoch 85 - iter 2120/2650 - loss 0.31502842 throughput (samples/sec): 78.96 -2019-08-09 12:09:03,458 epoch 85 - iter 2385/2650 - loss 0.31612818 throughput (samples/sec): 78.75 -2019-08-09 12:10:51,247 ---------------------------------------------------------------------------------------------------- -2019-08-09 12:10:51,247 EPOCH 85 done: loss 0.3170 - lr 0.1000 -2019-08-09 12:10:51,247 BAD EPOCHS (no improvement): 2 -2019-08-09 12:10:51,247 ---------------------------------------------------------------------------------------------------- -2019-08-09 12:10:51,642 epoch 86 - iter 0/2650 - loss 0.10628381 throughput (samples/sec): 21672.00 -2019-08-09 12:12:40,048 epoch 86 - iter 265/2650 - loss 0.29654681 throughput (samples/sec): 78.26 -2019-08-09 12:14:27,213 epoch 86 - iter 530/2650 - loss 0.29961680 throughput (samples/sec): 79.16 -2019-08-09 12:16:11,621 epoch 86 - iter 795/2650 - loss 0.29664991 throughput (samples/sec): 81.25 -2019-08-09 12:18:01,362 epoch 86 - iter 1060/2650 - loss 0.29925065 throughput (samples/sec): 77.30 -2019-08-09 12:19:53,746 epoch 86 - iter 1325/2650 - loss 0.29965120 throughput (samples/sec): 75.48 -2019-08-09 12:21:43,334 epoch 86 - iter 1590/2650 - loss 0.30312743 throughput (samples/sec): 77.41 -2019-08-09 12:23:33,879 epoch 86 - iter 1855/2650 - loss 0.30471124 throughput (samples/sec): 76.74 -2019-08-09 12:25:13,210 epoch 86 - iter 2120/2650 - loss 0.30685823 throughput (samples/sec): 85.41 -2019-08-09 12:26:39,166 epoch 86 - iter 2385/2650 - loss 0.31026556 throughput (samples/sec): 98.70 -2019-08-09 12:28:13,266 ---------------------------------------------------------------------------------------------------- -2019-08-09 12:28:13,266 EPOCH 86 done: loss 0.3120 - lr 0.1000 -2019-08-09 12:28:13,266 BAD EPOCHS (no improvement): 0 -2019-08-09 12:28:13,266 ---------------------------------------------------------------------------------------------------- -2019-08-09 12:28:13,866 epoch 87 - iter 0/2650 - loss 0.22007853 throughput (samples/sec): 14235.57 -2019-08-09 12:30:11,399 epoch 87 - iter 265/2650 - loss 0.30172238 throughput (samples/sec): 72.18 -2019-08-09 12:32:05,490 epoch 87 - iter 530/2650 - loss 0.31807023 throughput (samples/sec): 74.35 -2019-08-09 12:33:54,253 epoch 87 - iter 795/2650 - loss 0.31263915 throughput (samples/sec): 78.00 -2019-08-09 12:35:41,615 epoch 87 - iter 1060/2650 - loss 0.31363948 throughput (samples/sec): 79.02 -2019-08-09 12:37:22,563 epoch 87 - iter 1325/2650 - loss 0.31468301 throughput (samples/sec): 84.04 -2019-08-09 12:39:06,866 epoch 87 - iter 1590/2650 - loss 0.31422009 throughput (samples/sec): 81.34 -2019-08-09 12:40:49,996 epoch 87 - iter 1855/2650 - loss 0.31053367 throughput (samples/sec): 82.26 -2019-08-09 12:42:34,170 epoch 87 - iter 2120/2650 - loss 0.31093491 throughput (samples/sec): 81.44 -2019-08-09 12:44:29,291 epoch 87 - iter 2385/2650 - loss 0.31188087 throughput (samples/sec): 73.69 -2019-08-09 12:46:18,007 ---------------------------------------------------------------------------------------------------- -2019-08-09 12:46:18,008 EPOCH 87 done: loss 0.3125 - lr 0.1000 -2019-08-09 12:46:18,008 BAD EPOCHS (no improvement): 1 -2019-08-09 12:46:18,008 ---------------------------------------------------------------------------------------------------- -2019-08-09 12:46:18,585 epoch 88 - iter 0/2650 - loss 0.02627647 throughput (samples/sec): 14801.87 -2019-08-09 12:48:08,105 epoch 88 - iter 265/2650 - loss 0.29575289 throughput (samples/sec): 77.46 -2019-08-09 12:49:58,541 epoch 88 - iter 530/2650 - loss 0.29558848 throughput (samples/sec): 76.82 -2019-08-09 12:51:49,825 epoch 88 - iter 795/2650 - loss 0.30101028 throughput (samples/sec): 76.23 -2019-08-09 12:53:48,586 epoch 88 - iter 1060/2650 - loss 0.30606669 throughput (samples/sec): 71.43 -2019-08-09 12:55:34,867 epoch 88 - iter 1325/2650 - loss 0.30203230 throughput (samples/sec): 79.82 -2019-08-09 12:57:19,469 epoch 88 - iter 1590/2650 - loss 0.30367818 throughput (samples/sec): 81.10 -2019-08-09 12:59:09,879 epoch 88 - iter 1855/2650 - loss 0.30503473 throughput (samples/sec): 76.83 -2019-08-09 13:00:52,421 epoch 88 - iter 2120/2650 - loss 0.30700152 throughput (samples/sec): 82.73 -2019-08-09 13:02:45,349 epoch 88 - iter 2385/2650 - loss 0.30881051 throughput (samples/sec): 75.12 -2019-08-09 13:04:34,197 ---------------------------------------------------------------------------------------------------- -2019-08-09 13:04:34,197 EPOCH 88 done: loss 0.3086 - lr 0.1000 -2019-08-09 13:04:34,197 BAD EPOCHS (no improvement): 0 -2019-08-09 13:04:34,197 ---------------------------------------------------------------------------------------------------- -2019-08-09 13:04:34,573 epoch 89 - iter 0/2650 - loss 0.10099247 throughput (samples/sec): 22810.20 -2019-08-09 13:06:24,623 epoch 89 - iter 265/2650 - loss 0.28996917 throughput (samples/sec): 77.09 -2019-08-09 13:08:15,427 epoch 89 - iter 530/2650 - loss 0.28865078 throughput (samples/sec): 76.56 -2019-08-09 13:10:06,436 epoch 89 - iter 795/2650 - loss 0.29535016 throughput (samples/sec): 76.42 -2019-08-09 13:11:50,238 epoch 89 - iter 1060/2650 - loss 0.29370426 throughput (samples/sec): 81.73 -2019-08-09 13:13:34,197 epoch 89 - iter 1325/2650 - loss 0.29962337 throughput (samples/sec): 81.61 -2019-08-09 13:15:25,998 epoch 89 - iter 1590/2650 - loss 0.30303764 throughput (samples/sec): 75.88 -2019-08-09 13:17:15,890 epoch 89 - iter 1855/2650 - loss 0.30639216 throughput (samples/sec): 77.20 -2019-08-09 13:19:05,984 epoch 89 - iter 2120/2650 - loss 0.30543797 throughput (samples/sec): 77.06 -2019-08-09 13:20:55,446 epoch 89 - iter 2385/2650 - loss 0.30864249 throughput (samples/sec): 77.51 -2019-08-09 13:22:49,169 ---------------------------------------------------------------------------------------------------- -2019-08-09 13:22:49,169 EPOCH 89 done: loss 0.3121 - lr 0.1000 -2019-08-09 13:22:49,170 BAD EPOCHS (no improvement): 1 -2019-08-09 13:22:49,170 ---------------------------------------------------------------------------------------------------- -2019-08-09 13:22:49,540 epoch 90 - iter 0/2650 - loss 0.20215017 throughput (samples/sec): 23124.72 -2019-08-09 13:24:42,781 epoch 90 - iter 265/2650 - loss 0.29885339 throughput (samples/sec): 74.91 -2019-08-09 13:26:36,941 epoch 90 - iter 530/2650 - loss 0.29496773 throughput (samples/sec): 74.31 -2019-08-09 13:28:20,974 epoch 90 - iter 795/2650 - loss 0.29037722 throughput (samples/sec): 81.55 -2019-08-09 13:30:12,125 epoch 90 - iter 1060/2650 - loss 0.29541223 throughput (samples/sec): 76.32 -2019-08-09 13:32:03,604 epoch 90 - iter 1325/2650 - loss 0.29861942 throughput (samples/sec): 76.10 -2019-08-09 13:33:53,568 epoch 90 - iter 1590/2650 - loss 0.29821055 throughput (samples/sec): 77.15 -2019-08-09 13:35:39,385 epoch 90 - iter 1855/2650 - loss 0.30377975 throughput (samples/sec): 80.17 -2019-08-09 13:37:04,995 epoch 90 - iter 2120/2650 - loss 0.30581935 throughput (samples/sec): 99.10 -2019-08-09 13:38:30,700 epoch 90 - iter 2385/2650 - loss 0.30766437 throughput (samples/sec): 98.99 -2019-08-09 13:39:54,054 ---------------------------------------------------------------------------------------------------- -2019-08-09 13:39:54,054 EPOCH 90 done: loss 0.3092 - lr 0.1000 -2019-08-09 13:39:54,055 BAD EPOCHS (no improvement): 2 -2019-08-09 13:39:54,055 ---------------------------------------------------------------------------------------------------- -2019-08-09 13:39:54,353 epoch 91 - iter 0/2650 - loss 0.17892426 throughput (samples/sec): 28825.99 -2019-08-09 13:41:48,768 epoch 91 - iter 265/2650 - loss 0.27129175 throughput (samples/sec): 74.14 -2019-08-09 13:43:41,061 epoch 91 - iter 530/2650 - loss 0.27576541 throughput (samples/sec): 75.55 -2019-08-09 13:45:27,028 epoch 91 - iter 795/2650 - loss 0.28631601 throughput (samples/sec): 80.06 -2019-08-09 13:47:10,809 epoch 91 - iter 1060/2650 - loss 0.29203248 throughput (samples/sec): 81.74 -2019-08-09 13:48:57,061 epoch 91 - iter 1325/2650 - loss 0.30155762 throughput (samples/sec): 79.84 -2019-08-09 13:50:51,623 epoch 91 - iter 1590/2650 - loss 0.30146061 throughput (samples/sec): 74.05 -2019-08-09 13:52:34,337 epoch 91 - iter 1855/2650 - loss 0.30257189 throughput (samples/sec): 82.59 -2019-08-09 13:54:18,468 epoch 91 - iter 2120/2650 - loss 0.30689028 throughput (samples/sec): 81.47 -2019-08-09 13:56:01,940 epoch 91 - iter 2385/2650 - loss 0.30887435 throughput (samples/sec): 81.99 -2019-08-09 13:57:50,520 ---------------------------------------------------------------------------------------------------- -2019-08-09 13:57:50,520 EPOCH 91 done: loss 0.3099 - lr 0.1000 -2019-08-09 13:57:50,520 BAD EPOCHS (no improvement): 3 -2019-08-09 13:57:50,520 ---------------------------------------------------------------------------------------------------- -2019-08-09 13:57:50,984 epoch 92 - iter 0/2650 - loss 0.36558709 throughput (samples/sec): 18427.47 -2019-08-09 13:59:37,570 epoch 92 - iter 265/2650 - loss 0.30643025 throughput (samples/sec): 79.59 -2019-08-09 14:01:18,927 epoch 92 - iter 530/2650 - loss 0.29875874 throughput (samples/sec): 83.70 -2019-08-09 14:03:02,638 epoch 92 - iter 795/2650 - loss 0.30067556 throughput (samples/sec): 81.80 -2019-08-09 14:04:46,947 epoch 92 - iter 1060/2650 - loss 0.30881100 throughput (samples/sec): 81.33 -2019-08-09 14:06:38,380 epoch 92 - iter 1325/2650 - loss 0.31108038 throughput (samples/sec): 76.14 -2019-08-09 14:08:28,404 epoch 92 - iter 1590/2650 - loss 0.31077439 throughput (samples/sec): 77.10 -2019-08-09 14:10:09,862 epoch 92 - iter 1855/2650 - loss 0.31490980 throughput (samples/sec): 83.62 -2019-08-09 14:12:01,135 epoch 92 - iter 2120/2650 - loss 0.31244124 throughput (samples/sec): 76.24 -2019-08-09 14:13:46,168 epoch 92 - iter 2385/2650 - loss 0.31261539 throughput (samples/sec): 80.78 -2019-08-09 14:15:37,704 ---------------------------------------------------------------------------------------------------- -2019-08-09 14:15:37,705 EPOCH 92 done: loss 0.3127 - lr 0.1000 -2019-08-09 14:15:37,705 BAD EPOCHS (no improvement): 4 -2019-08-09 14:15:37,705 ---------------------------------------------------------------------------------------------------- -2019-08-09 14:15:38,217 epoch 93 - iter 0/2650 - loss 0.11494464 throughput (samples/sec): 16682.50 -2019-08-09 14:17:29,621 epoch 93 - iter 265/2650 - loss 0.26940429 throughput (samples/sec): 76.15 -2019-08-09 14:19:21,659 epoch 93 - iter 530/2650 - loss 0.27738051 throughput (samples/sec): 75.72 -2019-08-09 14:21:06,523 epoch 93 - iter 795/2650 - loss 0.27494573 throughput (samples/sec): 80.90 -2019-08-09 14:23:00,226 epoch 93 - iter 1060/2650 - loss 0.27674720 throughput (samples/sec): 74.62 -2019-08-09 14:24:49,224 epoch 93 - iter 1325/2650 - loss 0.27541002 throughput (samples/sec): 77.83 -2019-08-09 14:26:36,492 epoch 93 - iter 1590/2650 - loss 0.27722643 throughput (samples/sec): 79.09 -2019-08-09 14:28:24,986 epoch 93 - iter 1855/2650 - loss 0.27880891 throughput (samples/sec): 78.19 -2019-08-09 14:30:10,234 epoch 93 - iter 2120/2650 - loss 0.27872711 throughput (samples/sec): 80.61 -2019-08-09 14:32:03,056 epoch 93 - iter 2385/2650 - loss 0.28003129 throughput (samples/sec): 75.19 -2019-08-09 14:33:48,021 ---------------------------------------------------------------------------------------------------- -2019-08-09 14:33:48,022 EPOCH 93 done: loss 0.2806 - lr 0.0500 -2019-08-09 14:33:48,022 BAD EPOCHS (no improvement): 0 -2019-08-09 14:33:48,022 ---------------------------------------------------------------------------------------------------- -2019-08-09 14:33:48,572 epoch 94 - iter 0/2650 - loss 0.32541719 throughput (samples/sec): 15515.13 -2019-08-09 14:35:33,710 epoch 94 - iter 265/2650 - loss 0.25842507 throughput (samples/sec): 80.69 -2019-08-09 14:37:28,091 epoch 94 - iter 530/2650 - loss 0.27138626 throughput (samples/sec): 74.17 -2019-08-09 14:39:17,832 epoch 94 - iter 795/2650 - loss 0.27203143 throughput (samples/sec): 77.30 -2019-08-09 14:41:14,079 epoch 94 - iter 1060/2650 - loss 0.27024718 throughput (samples/sec): 72.98 -2019-08-09 14:43:03,747 epoch 94 - iter 1325/2650 - loss 0.26890203 throughput (samples/sec): 77.36 -2019-08-09 14:44:53,867 epoch 94 - iter 1590/2650 - loss 0.26841286 throughput (samples/sec): 77.04 -2019-08-09 14:46:45,693 epoch 94 - iter 1855/2650 - loss 0.26914454 throughput (samples/sec): 75.86 -2019-08-09 14:48:36,067 epoch 94 - iter 2120/2650 - loss 0.26858237 throughput (samples/sec): 76.86 -2019-08-09 14:50:30,756 epoch 94 - iter 2385/2650 - loss 0.27005549 throughput (samples/sec): 73.97 -2019-08-09 14:52:20,776 ---------------------------------------------------------------------------------------------------- -2019-08-09 14:52:20,776 EPOCH 94 done: loss 0.2712 - lr 0.0500 -2019-08-09 14:52:20,776 BAD EPOCHS (no improvement): 0 -2019-08-09 14:52:20,776 ---------------------------------------------------------------------------------------------------- -2019-08-09 14:52:21,108 epoch 95 - iter 0/2650 - loss 0.15731183 throughput (samples/sec): 25874.08 -2019-08-09 14:54:04,119 epoch 95 - iter 265/2650 - loss 0.25124321 throughput (samples/sec): 82.36 -2019-08-09 14:55:47,863 epoch 95 - iter 530/2650 - loss 0.26668266 throughput (samples/sec): 81.78 -2019-08-09 14:57:34,145 epoch 95 - iter 795/2650 - loss 0.26562406 throughput (samples/sec): 79.83 -2019-08-09 14:59:20,859 epoch 95 - iter 1060/2650 - loss 0.26693008 throughput (samples/sec): 79.50 -2019-08-09 15:01:03,416 epoch 95 - iter 1325/2650 - loss 0.26903069 throughput (samples/sec): 82.72 -2019-08-09 15:02:53,066 epoch 95 - iter 1590/2650 - loss 0.26897401 throughput (samples/sec): 77.37 -2019-08-09 15:04:36,355 epoch 95 - iter 1855/2650 - loss 0.27021161 throughput (samples/sec): 82.13 -2019-08-09 15:06:17,699 epoch 95 - iter 2120/2650 - loss 0.26811980 throughput (samples/sec): 83.71 -2019-08-09 15:08:00,945 epoch 95 - iter 2385/2650 - loss 0.27047032 throughput (samples/sec): 82.17 -2019-08-09 15:09:40,936 ---------------------------------------------------------------------------------------------------- -2019-08-09 15:09:40,936 EPOCH 95 done: loss 0.2696 - lr 0.0500 -2019-08-09 15:09:40,936 BAD EPOCHS (no improvement): 0 -2019-08-09 15:09:40,937 ---------------------------------------------------------------------------------------------------- -2019-08-09 15:09:41,258 epoch 96 - iter 0/2650 - loss 0.81395197 throughput (samples/sec): 26971.83 -2019-08-09 15:11:33,060 epoch 96 - iter 265/2650 - loss 0.27542288 throughput (samples/sec): 75.88 -2019-08-09 15:13:17,529 epoch 96 - iter 530/2650 - loss 0.27402686 throughput (samples/sec): 81.22 -2019-08-09 15:15:05,456 epoch 96 - iter 795/2650 - loss 0.26894739 throughput (samples/sec): 78.60 -2019-08-09 15:16:47,059 epoch 96 - iter 1060/2650 - loss 0.27229514 throughput (samples/sec): 83.50 -2019-08-09 15:18:31,243 epoch 96 - iter 1325/2650 - loss 0.26849639 throughput (samples/sec): 81.43 -2019-08-09 15:20:11,963 epoch 96 - iter 1590/2650 - loss 0.26581905 throughput (samples/sec): 84.23 -2019-08-09 15:21:52,980 epoch 96 - iter 1855/2650 - loss 0.26327022 throughput (samples/sec): 83.98 -2019-08-09 15:23:47,966 epoch 96 - iter 2120/2650 - loss 0.26388711 throughput (samples/sec): 73.78 -2019-08-09 15:25:31,942 epoch 96 - iter 2385/2650 - loss 0.26398323 throughput (samples/sec): 81.59 -2019-08-09 15:27:16,386 ---------------------------------------------------------------------------------------------------- -2019-08-09 15:27:16,386 EPOCH 96 done: loss 0.2643 - lr 0.0500 -2019-08-09 15:27:16,386 BAD EPOCHS (no improvement): 0 -2019-08-09 15:27:16,386 ---------------------------------------------------------------------------------------------------- -2019-08-09 15:27:16,697 epoch 97 - iter 0/2650 - loss 0.38118172 throughput (samples/sec): 27584.39 -2019-08-09 15:29:00,244 epoch 97 - iter 265/2650 - loss 0.27257933 throughput (samples/sec): 81.93 -2019-08-09 15:30:42,083 epoch 97 - iter 530/2650 - loss 0.26098282 throughput (samples/sec): 83.30 -2019-08-09 15:32:25,335 epoch 97 - iter 795/2650 - loss 0.25660099 throughput (samples/sec): 82.16 -2019-08-09 15:34:09,855 epoch 97 - iter 1060/2650 - loss 0.25296103 throughput (samples/sec): 81.17 -2019-08-09 15:35:55,033 epoch 97 - iter 1325/2650 - loss 0.25397170 throughput (samples/sec): 80.66 -2019-08-09 15:37:37,255 epoch 97 - iter 1590/2650 - loss 0.25395968 throughput (samples/sec): 82.99 -2019-08-09 15:39:17,614 epoch 97 - iter 1855/2650 - loss 0.25698687 throughput (samples/sec): 84.53 -2019-08-09 15:40:58,876 epoch 97 - iter 2120/2650 - loss 0.25585684 throughput (samples/sec): 83.78 -2019-08-09 15:42:34,551 epoch 97 - iter 2385/2650 - loss 0.25692746 throughput (samples/sec): 88.67 -2019-08-09 15:43:59,322 ---------------------------------------------------------------------------------------------------- -2019-08-09 15:43:59,322 EPOCH 97 done: loss 0.2584 - lr 0.0500 -2019-08-09 15:43:59,322 BAD EPOCHS (no improvement): 0 -2019-08-09 15:43:59,322 ---------------------------------------------------------------------------------------------------- -2019-08-09 15:43:59,587 epoch 98 - iter 0/2650 - loss 0.10197657 throughput (samples/sec): 32523.94 -2019-08-09 15:45:23,173 epoch 98 - iter 265/2650 - loss 0.25026029 throughput (samples/sec): 101.51 -2019-08-09 15:46:48,135 epoch 98 - iter 530/2650 - loss 0.24379541 throughput (samples/sec): 99.86 -2019-08-09 15:48:12,311 epoch 98 - iter 795/2650 - loss 0.24921573 throughput (samples/sec): 100.80 -2019-08-09 15:49:37,564 epoch 98 - iter 1060/2650 - loss 0.25263249 throughput (samples/sec): 99.52 -2019-08-09 15:51:05,912 epoch 98 - iter 1325/2650 - loss 0.25502680 throughput (samples/sec): 96.03 -2019-08-09 15:52:31,362 epoch 98 - iter 1590/2650 - loss 0.25332021 throughput (samples/sec): 99.29 -2019-08-09 15:53:56,826 epoch 98 - iter 1855/2650 - loss 0.25334900 throughput (samples/sec): 99.28 -2019-08-09 15:55:21,807 epoch 98 - iter 2120/2650 - loss 0.25441679 throughput (samples/sec): 99.84 -2019-08-09 15:56:46,923 epoch 98 - iter 2385/2650 - loss 0.25613155 throughput (samples/sec): 99.68 -2019-08-09 15:58:09,539 ---------------------------------------------------------------------------------------------------- -2019-08-09 15:58:09,540 EPOCH 98 done: loss 0.2559 - lr 0.0500 -2019-08-09 15:58:09,540 BAD EPOCHS (no improvement): 0 -2019-08-09 15:58:09,540 ---------------------------------------------------------------------------------------------------- -2019-08-09 15:58:09,831 epoch 99 - iter 0/2650 - loss 0.06508607 throughput (samples/sec): 29513.41 -2019-08-09 15:59:34,531 epoch 99 - iter 265/2650 - loss 0.25851105 throughput (samples/sec): 100.17 -2019-08-09 16:01:00,064 epoch 99 - iter 530/2650 - loss 0.25412830 throughput (samples/sec): 99.20 -2019-08-09 16:02:26,700 epoch 99 - iter 795/2650 - loss 0.25043615 throughput (samples/sec): 97.93 -2019-08-09 16:03:54,254 epoch 99 - iter 1060/2650 - loss 0.25093803 throughput (samples/sec): 96.90 -2019-08-09 16:05:17,747 epoch 99 - iter 1325/2650 - loss 0.25015119 throughput (samples/sec): 101.62 -2019-08-09 16:06:43,465 epoch 99 - iter 1590/2650 - loss 0.25174813 throughput (samples/sec): 98.98 -2019-08-09 16:08:06,421 epoch 99 - iter 1855/2650 - loss 0.25126307 throughput (samples/sec): 102.28 -2019-08-09 16:09:31,584 epoch 99 - iter 2120/2650 - loss 0.25216684 throughput (samples/sec): 99.63 -2019-08-09 16:10:56,899 epoch 99 - iter 2385/2650 - loss 0.25207643 throughput (samples/sec): 99.45 -2019-08-09 16:12:21,370 ---------------------------------------------------------------------------------------------------- -2019-08-09 16:12:21,370 EPOCH 99 done: loss 0.2522 - lr 0.0500 -2019-08-09 16:12:21,370 BAD EPOCHS (no improvement): 0 -2019-08-09 16:12:21,370 ---------------------------------------------------------------------------------------------------- -2019-08-09 16:12:21,711 epoch 100 - iter 0/2650 - loss 0.17370641 throughput (samples/sec): 25190.21 -2019-08-09 16:13:45,424 epoch 100 - iter 265/2650 - loss 0.24480405 throughput (samples/sec): 101.35 -2019-08-09 16:15:09,396 epoch 100 - iter 530/2650 - loss 0.24022113 throughput (samples/sec): 101.04 -2019-08-09 16:16:32,273 epoch 100 - iter 795/2650 - loss 0.23901105 throughput (samples/sec): 102.37 -2019-08-09 16:17:55,944 epoch 100 - iter 1060/2650 - loss 0.24017788 throughput (samples/sec): 101.40 -2019-08-09 16:19:17,543 epoch 100 - iter 1325/2650 - loss 0.23850306 throughput (samples/sec): 103.98 -2019-08-09 16:20:41,664 epoch 100 - iter 1590/2650 - loss 0.23892193 throughput (samples/sec): 100.86 -2019-08-09 16:22:04,915 epoch 100 - iter 1855/2650 - loss 0.24000315 throughput (samples/sec): 101.91 -2019-08-09 16:23:26,062 epoch 100 - iter 2120/2650 - loss 0.24370720 throughput (samples/sec): 104.55 -2019-08-09 16:24:51,361 epoch 100 - iter 2385/2650 - loss 0.24356150 throughput (samples/sec): 99.46 -2019-08-09 16:26:16,042 ---------------------------------------------------------------------------------------------------- -2019-08-09 16:26:16,042 EPOCH 100 done: loss 0.2449 - lr 0.0500 -2019-08-09 16:26:16,042 BAD EPOCHS (no improvement): 0 -2019-08-09 16:26:16,042 ---------------------------------------------------------------------------------------------------- -2019-08-09 16:26:16,346 epoch 101 - iter 0/2650 - loss 0.16320592 throughput (samples/sec): 28261.42 -2019-08-09 16:27:42,685 epoch 101 - iter 265/2650 - loss 0.23851625 throughput (samples/sec): 98.27 -2019-08-09 16:29:06,788 epoch 101 - iter 530/2650 - loss 0.23938307 throughput (samples/sec): 100.88 -2019-08-09 16:30:27,277 epoch 101 - iter 795/2650 - loss 0.24074946 throughput (samples/sec): 105.41 -2019-08-09 16:31:51,743 epoch 101 - iter 1060/2650 - loss 0.23986924 throughput (samples/sec): 100.45 -2019-08-09 16:33:13,501 epoch 101 - iter 1325/2650 - loss 0.23814713 throughput (samples/sec): 103.77 -2019-08-09 16:34:37,314 epoch 101 - iter 1590/2650 - loss 0.23836466 throughput (samples/sec): 101.23 -2019-08-09 16:36:00,472 epoch 101 - iter 1855/2650 - loss 0.23925975 throughput (samples/sec): 102.03 -2019-08-09 16:37:25,326 epoch 101 - iter 2120/2650 - loss 0.24245886 throughput (samples/sec): 99.99 -2019-08-09 16:38:48,469 epoch 101 - iter 2385/2650 - loss 0.24391449 throughput (samples/sec): 102.04 -2019-08-09 16:40:11,503 ---------------------------------------------------------------------------------------------------- -2019-08-09 16:40:11,503 EPOCH 101 done: loss 0.2464 - lr 0.0500 -2019-08-09 16:40:11,504 BAD EPOCHS (no improvement): 1 -2019-08-09 16:40:11,504 ---------------------------------------------------------------------------------------------------- -2019-08-09 16:40:11,778 epoch 102 - iter 0/2650 - loss 0.80398458 throughput (samples/sec): 31321.31 -2019-08-09 16:41:34,643 epoch 102 - iter 265/2650 - loss 0.25881238 throughput (samples/sec): 102.39 -2019-08-09 16:43:00,629 epoch 102 - iter 530/2650 - loss 0.24342620 throughput (samples/sec): 98.67 -2019-08-09 16:44:24,756 epoch 102 - iter 795/2650 - loss 0.24214646 throughput (samples/sec): 100.86 -2019-08-09 16:45:47,785 epoch 102 - iter 1060/2650 - loss 0.24384495 throughput (samples/sec): 102.19 -2019-08-09 16:47:11,165 epoch 102 - iter 1325/2650 - loss 0.25012255 throughput (samples/sec): 101.76 -2019-08-09 16:48:35,749 epoch 102 - iter 1590/2650 - loss 0.24765099 throughput (samples/sec): 100.31 -2019-08-09 16:50:01,669 epoch 102 - iter 1855/2650 - loss 0.24772664 throughput (samples/sec): 98.75 -2019-08-09 16:51:27,982 epoch 102 - iter 2120/2650 - loss 0.24632108 throughput (samples/sec): 98.30 -2019-08-09 16:52:55,526 epoch 102 - iter 2385/2650 - loss 0.24705535 throughput (samples/sec): 96.92 -2019-08-09 16:54:19,183 ---------------------------------------------------------------------------------------------------- -2019-08-09 16:54:19,184 EPOCH 102 done: loss 0.2458 - lr 0.0500 -2019-08-09 16:54:19,184 BAD EPOCHS (no improvement): 2 -2019-08-09 16:54:19,184 ---------------------------------------------------------------------------------------------------- -2019-08-09 16:54:19,431 epoch 103 - iter 0/2650 - loss 0.21282291 throughput (samples/sec): 34809.78 -2019-08-09 16:55:44,430 epoch 103 - iter 265/2650 - loss 0.23995078 throughput (samples/sec): 99.82 -2019-08-09 16:57:08,791 epoch 103 - iter 530/2650 - loss 0.23811789 throughput (samples/sec): 100.57 -2019-08-09 16:58:33,294 epoch 103 - iter 795/2650 - loss 0.24076214 throughput (samples/sec): 100.40 -2019-08-09 16:59:57,314 epoch 103 - iter 1060/2650 - loss 0.24133839 throughput (samples/sec): 100.98 -2019-08-09 17:01:20,608 epoch 103 - iter 1325/2650 - loss 0.24115426 throughput (samples/sec): 101.86 -2019-08-09 17:02:47,295 epoch 103 - iter 1590/2650 - loss 0.24330976 throughput (samples/sec): 97.87 -2019-08-09 17:04:09,371 epoch 103 - iter 1855/2650 - loss 0.24172970 throughput (samples/sec): 103.37 -2019-08-09 17:05:33,029 epoch 103 - iter 2120/2650 - loss 0.24487150 throughput (samples/sec): 101.42 -2019-08-09 17:06:56,462 epoch 103 - iter 2385/2650 - loss 0.24272507 throughput (samples/sec): 101.69 -2019-08-09 17:08:20,136 ---------------------------------------------------------------------------------------------------- -2019-08-09 17:08:20,136 EPOCH 103 done: loss 0.2426 - lr 0.0500 -2019-08-09 17:08:20,137 BAD EPOCHS (no improvement): 0 -2019-08-09 17:08:20,137 ---------------------------------------------------------------------------------------------------- -2019-08-09 17:08:20,449 epoch 104 - iter 0/2650 - loss 0.03208941 throughput (samples/sec): 27481.74 -2019-08-09 17:09:42,994 epoch 104 - iter 265/2650 - loss 0.22679482 throughput (samples/sec): 102.79 -2019-08-09 17:11:06,190 epoch 104 - iter 530/2650 - loss 0.22838473 throughput (samples/sec): 101.98 -2019-08-09 17:12:32,334 epoch 104 - iter 795/2650 - loss 0.23330951 throughput (samples/sec): 98.49 -2019-08-09 17:13:55,777 epoch 104 - iter 1060/2650 - loss 0.23197015 throughput (samples/sec): 101.68 -2019-08-09 17:15:20,599 epoch 104 - iter 1325/2650 - loss 0.23195518 throughput (samples/sec): 100.03 -2019-08-09 17:16:44,472 epoch 104 - iter 1590/2650 - loss 0.23281399 throughput (samples/sec): 101.16 -2019-08-09 17:18:09,517 epoch 104 - iter 1855/2650 - loss 0.23261438 throughput (samples/sec): 99.76 -2019-08-09 17:19:32,809 epoch 104 - iter 2120/2650 - loss 0.23228148 throughput (samples/sec): 101.86 -2019-08-09 17:20:55,764 epoch 104 - iter 2385/2650 - loss 0.23370856 throughput (samples/sec): 102.28 -2019-08-09 17:22:21,358 ---------------------------------------------------------------------------------------------------- -2019-08-09 17:22:21,358 EPOCH 104 done: loss 0.2345 - lr 0.0500 -2019-08-09 17:22:21,358 BAD EPOCHS (no improvement): 0 -2019-08-09 17:22:21,359 ---------------------------------------------------------------------------------------------------- -2019-08-09 17:22:21,660 epoch 105 - iter 0/2650 - loss 0.11039340 throughput (samples/sec): 28483.96 -2019-08-09 17:23:48,613 epoch 105 - iter 265/2650 - loss 0.21982614 throughput (samples/sec): 97.57 -2019-08-09 17:25:10,618 epoch 105 - iter 530/2650 - loss 0.22369656 throughput (samples/sec): 103.46 -2019-08-09 17:26:33,661 epoch 105 - iter 795/2650 - loss 0.23076508 throughput (samples/sec): 102.17 -2019-08-09 17:27:56,655 epoch 105 - iter 1060/2650 - loss 0.23178673 throughput (samples/sec): 102.23 -2019-08-09 17:29:22,391 epoch 105 - iter 1325/2650 - loss 0.23157241 throughput (samples/sec): 98.96 -2019-08-09 17:30:51,833 epoch 105 - iter 1590/2650 - loss 0.23448857 throughput (samples/sec): 94.86 -2019-08-09 17:32:34,994 epoch 105 - iter 1855/2650 - loss 0.23568599 throughput (samples/sec): 82.24 -2019-08-09 17:34:13,131 epoch 105 - iter 2120/2650 - loss 0.23725458 throughput (samples/sec): 86.45 -2019-08-09 17:35:49,550 epoch 105 - iter 2385/2650 - loss 0.23429908 throughput (samples/sec): 87.99 -2019-08-09 17:37:23,798 ---------------------------------------------------------------------------------------------------- -2019-08-09 17:37:23,798 EPOCH 105 done: loss 0.2338 - lr 0.0500 -2019-08-09 17:37:23,798 BAD EPOCHS (no improvement): 0 -2019-08-09 17:37:23,798 ---------------------------------------------------------------------------------------------------- -2019-08-09 17:37:24,183 epoch 106 - iter 0/2650 - loss 0.20378536 throughput (samples/sec): 22257.58 -2019-08-09 17:39:00,947 epoch 106 - iter 265/2650 - loss 0.22376266 throughput (samples/sec): 87.67 -2019-08-09 17:40:26,539 epoch 106 - iter 530/2650 - loss 0.22996000 throughput (samples/sec): 99.13 -2019-08-09 17:41:50,757 epoch 106 - iter 795/2650 - loss 0.22836409 throughput (samples/sec): 100.75 -2019-08-09 17:43:44,118 epoch 106 - iter 1060/2650 - loss 0.23013537 throughput (samples/sec): 74.83 -2019-08-09 17:45:43,173 epoch 106 - iter 1325/2650 - loss 0.23051916 throughput (samples/sec): 71.25 -2019-08-09 17:47:39,458 epoch 106 - iter 1590/2650 - loss 0.23345125 throughput (samples/sec): 72.95 -2019-08-09 17:49:37,887 epoch 106 - iter 1855/2650 - loss 0.23730810 throughput (samples/sec): 71.63 -2019-08-09 17:51:37,452 epoch 106 - iter 2120/2650 - loss 0.23598298 throughput (samples/sec): 70.95 -2019-08-09 17:53:31,697 epoch 106 - iter 2385/2650 - loss 0.23602764 throughput (samples/sec): 74.25 -2019-08-09 17:55:27,398 ---------------------------------------------------------------------------------------------------- -2019-08-09 17:55:27,398 EPOCH 106 done: loss 0.2374 - lr 0.0500 -2019-08-09 17:55:27,398 BAD EPOCHS (no improvement): 1 -2019-08-09 17:55:27,398 ---------------------------------------------------------------------------------------------------- -2019-08-09 17:55:27,934 epoch 107 - iter 0/2650 - loss 0.27520251 throughput (samples/sec): 15927.51 -2019-08-09 17:57:21,793 epoch 107 - iter 265/2650 - loss 0.21932524 throughput (samples/sec): 74.51 -2019-08-09 17:59:19,890 epoch 107 - iter 530/2650 - loss 0.22978173 throughput (samples/sec): 71.83 -2019-08-09 18:00:53,768 epoch 107 - iter 795/2650 - loss 0.22919778 throughput (samples/sec): 90.37 -2019-08-09 18:02:18,262 epoch 107 - iter 1060/2650 - loss 0.23104903 throughput (samples/sec): 100.41 -2019-08-09 18:03:45,080 epoch 107 - iter 1325/2650 - loss 0.23319572 throughput (samples/sec): 97.72 -2019-08-09 18:05:11,123 epoch 107 - iter 1590/2650 - loss 0.23314294 throughput (samples/sec): 98.61 -2019-08-09 18:06:33,120 epoch 107 - iter 1855/2650 - loss 0.23067058 throughput (samples/sec): 103.47 -2019-08-09 18:07:58,710 epoch 107 - iter 2120/2650 - loss 0.22973563 throughput (samples/sec): 99.13 -2019-08-09 18:09:22,059 epoch 107 - iter 2385/2650 - loss 0.23120475 throughput (samples/sec): 101.79 -2019-08-09 18:10:48,367 ---------------------------------------------------------------------------------------------------- -2019-08-09 18:10:48,367 EPOCH 107 done: loss 0.2325 - lr 0.0500 -2019-08-09 18:10:48,367 BAD EPOCHS (no improvement): 0 -2019-08-09 18:10:48,368 ---------------------------------------------------------------------------------------------------- -2019-08-09 18:10:48,641 epoch 108 - iter 0/2650 - loss 0.07675159 throughput (samples/sec): 31421.34 -2019-08-09 18:12:14,299 epoch 108 - iter 265/2650 - loss 0.22919055 throughput (samples/sec): 99.05 -2019-08-09 18:13:40,218 epoch 108 - iter 530/2650 - loss 0.22864574 throughput (samples/sec): 98.75 -2019-08-09 18:15:02,672 epoch 108 - iter 795/2650 - loss 0.22468357 throughput (samples/sec): 102.90 -2019-08-09 18:16:27,112 epoch 108 - iter 1060/2650 - loss 0.22770427 throughput (samples/sec): 100.48 -2019-08-09 18:17:55,494 epoch 108 - iter 1325/2650 - loss 0.23026592 throughput (samples/sec): 96.00 -2019-08-09 18:19:23,351 epoch 108 - iter 1590/2650 - loss 0.23018116 throughput (samples/sec): 96.57 -2019-08-09 18:20:50,983 epoch 108 - iter 1855/2650 - loss 0.23005749 throughput (samples/sec): 96.82 -2019-08-09 18:22:17,398 epoch 108 - iter 2120/2650 - loss 0.23103762 throughput (samples/sec): 98.18 -2019-08-09 18:23:46,590 epoch 108 - iter 2385/2650 - loss 0.23125387 throughput (samples/sec): 95.12 -2019-08-09 18:25:11,748 ---------------------------------------------------------------------------------------------------- -2019-08-09 18:25:11,748 EPOCH 108 done: loss 0.2315 - lr 0.0500 -2019-08-09 18:25:11,748 BAD EPOCHS (no improvement): 0 -2019-08-09 18:25:11,748 ---------------------------------------------------------------------------------------------------- -2019-08-09 18:25:12,147 epoch 109 - iter 0/2650 - loss 0.34282446 throughput (samples/sec): 21492.08 -2019-08-09 18:26:40,519 epoch 109 - iter 265/2650 - loss 0.22013577 throughput (samples/sec): 96.01 -2019-08-09 18:28:07,704 epoch 109 - iter 530/2650 - loss 0.21811325 throughput (samples/sec): 97.31 -2019-08-09 18:29:31,513 epoch 109 - iter 795/2650 - loss 0.21612593 throughput (samples/sec): 101.24 -2019-08-09 18:30:56,766 epoch 109 - iter 1060/2650 - loss 0.22092911 throughput (samples/sec): 99.52 -2019-08-09 18:32:22,572 epoch 109 - iter 1325/2650 - loss 0.22324463 throughput (samples/sec): 98.88 -2019-08-09 18:34:04,712 epoch 109 - iter 1590/2650 - loss 0.22381843 throughput (samples/sec): 83.06 -2019-08-09 18:35:55,869 epoch 109 - iter 1855/2650 - loss 0.22546361 throughput (samples/sec): 76.32 -2019-08-09 18:37:43,157 epoch 109 - iter 2120/2650 - loss 0.22607088 throughput (samples/sec): 79.07 -2019-08-09 18:39:29,477 epoch 109 - iter 2385/2650 - loss 0.22960233 throughput (samples/sec): 79.79 -2019-08-09 18:41:14,796 ---------------------------------------------------------------------------------------------------- -2019-08-09 18:41:14,796 EPOCH 109 done: loss 0.2282 - lr 0.0500 -2019-08-09 18:41:14,796 BAD EPOCHS (no improvement): 0 -2019-08-09 18:41:14,796 ---------------------------------------------------------------------------------------------------- -2019-08-09 18:41:15,211 epoch 110 - iter 0/2650 - loss 0.20416713 throughput (samples/sec): 20616.28 -2019-08-09 18:43:04,828 epoch 110 - iter 265/2650 - loss 0.23626773 throughput (samples/sec): 77.39 -2019-08-09 18:44:54,949 epoch 110 - iter 530/2650 - loss 0.23297388 throughput (samples/sec): 77.04 -2019-08-09 18:46:40,834 epoch 110 - iter 795/2650 - loss 0.22909098 throughput (samples/sec): 80.12 -2019-08-09 18:48:27,804 epoch 110 - iter 1060/2650 - loss 0.22772738 throughput (samples/sec): 79.31 -2019-08-09 18:50:19,484 epoch 110 - iter 1325/2650 - loss 0.22945078 throughput (samples/sec): 75.96 -2019-08-09 18:52:02,762 epoch 110 - iter 1590/2650 - loss 0.22784361 throughput (samples/sec): 82.14 -2019-08-09 18:53:54,985 epoch 110 - iter 1855/2650 - loss 0.22710611 throughput (samples/sec): 75.59 -2019-08-09 18:55:44,818 epoch 110 - iter 2120/2650 - loss 0.22711218 throughput (samples/sec): 77.24 -2019-08-09 18:57:34,576 epoch 110 - iter 2385/2650 - loss 0.22783602 throughput (samples/sec): 77.29 -2019-08-09 18:59:26,048 ---------------------------------------------------------------------------------------------------- -2019-08-09 18:59:26,048 EPOCH 110 done: loss 0.2287 - lr 0.0500 -2019-08-09 18:59:26,048 BAD EPOCHS (no improvement): 1 -2019-08-09 18:59:26,048 ---------------------------------------------------------------------------------------------------- -2019-08-09 18:59:26,920 epoch 111 - iter 0/2650 - loss 0.21031165 throughput (samples/sec): 9766.37 -2019-08-09 19:01:17,056 epoch 111 - iter 265/2650 - loss 0.23103102 throughput (samples/sec): 77.03 -2019-08-09 19:03:09,234 epoch 111 - iter 530/2650 - loss 0.22365123 throughput (samples/sec): 75.62 -2019-08-09 19:05:02,127 epoch 111 - iter 795/2650 - loss 0.21807118 throughput (samples/sec): 75.15 -2019-08-09 19:06:46,275 epoch 111 - iter 1060/2650 - loss 0.21954240 throughput (samples/sec): 81.46 -2019-08-09 19:08:36,624 epoch 111 - iter 1325/2650 - loss 0.22174528 throughput (samples/sec): 76.88 -2019-08-09 19:10:12,332 epoch 111 - iter 1590/2650 - loss 0.22331248 throughput (samples/sec): 88.64 -2019-08-09 19:11:39,637 epoch 111 - iter 1855/2650 - loss 0.22349684 throughput (samples/sec): 97.18 -2019-08-09 19:13:05,349 epoch 111 - iter 2120/2650 - loss 0.22225760 throughput (samples/sec): 98.98 -2019-08-09 19:14:30,215 epoch 111 - iter 2385/2650 - loss 0.22276006 throughput (samples/sec): 99.97 -2019-08-09 19:15:54,518 ---------------------------------------------------------------------------------------------------- -2019-08-09 19:15:54,518 EPOCH 111 done: loss 0.2229 - lr 0.0500 -2019-08-09 19:15:54,519 BAD EPOCHS (no improvement): 0 -2019-08-09 19:15:54,519 ---------------------------------------------------------------------------------------------------- -2019-08-09 19:15:54,805 epoch 112 - iter 0/2650 - loss 0.12059826 throughput (samples/sec): 29982.17 -2019-08-09 19:17:18,447 epoch 112 - iter 265/2650 - loss 0.21842452 throughput (samples/sec): 101.44 -2019-08-09 19:18:43,543 epoch 112 - iter 530/2650 - loss 0.22276559 throughput (samples/sec): 99.71 -2019-08-09 19:20:10,096 epoch 112 - iter 795/2650 - loss 0.22419261 throughput (samples/sec): 98.03 -2019-08-09 19:21:32,589 epoch 112 - iter 1060/2650 - loss 0.22359778 throughput (samples/sec): 102.85 -2019-08-09 19:22:56,850 epoch 112 - iter 1325/2650 - loss 0.22639391 throughput (samples/sec): 100.69 -2019-08-09 19:24:21,315 epoch 112 - iter 1590/2650 - loss 0.22465550 throughput (samples/sec): 100.45 -2019-08-09 19:25:46,681 epoch 112 - iter 1855/2650 - loss 0.22594658 throughput (samples/sec): 99.39 -2019-08-09 19:27:11,908 epoch 112 - iter 2120/2650 - loss 0.22684695 throughput (samples/sec): 99.55 -2019-08-09 19:28:36,853 epoch 112 - iter 2385/2650 - loss 0.22385662 throughput (samples/sec): 99.88 -2019-08-09 19:30:03,034 ---------------------------------------------------------------------------------------------------- -2019-08-09 19:30:03,034 EPOCH 112 done: loss 0.2253 - lr 0.0500 -2019-08-09 19:30:03,034 BAD EPOCHS (no improvement): 1 -2019-08-09 19:30:03,034 ---------------------------------------------------------------------------------------------------- -2019-08-09 19:30:03,279 epoch 113 - iter 0/2650 - loss 0.47397578 throughput (samples/sec): 35161.51 -2019-08-09 19:31:26,729 epoch 113 - iter 265/2650 - loss 0.22766175 throughput (samples/sec): 101.67 -2019-08-09 19:32:51,736 epoch 113 - iter 530/2650 - loss 0.23273358 throughput (samples/sec): 99.81 -2019-08-09 19:34:17,807 epoch 113 - iter 795/2650 - loss 0.22542203 throughput (samples/sec): 98.57 -2019-08-09 19:35:41,855 epoch 113 - iter 1060/2650 - loss 0.22357073 throughput (samples/sec): 100.95 -2019-08-09 19:37:06,052 epoch 113 - iter 1325/2650 - loss 0.22434004 throughput (samples/sec): 100.77 -2019-08-09 19:38:34,254 epoch 113 - iter 1590/2650 - loss 0.22199538 throughput (samples/sec): 96.19 -2019-08-09 19:40:02,297 epoch 113 - iter 1855/2650 - loss 0.22256637 throughput (samples/sec): 96.37 -2019-08-09 19:41:29,045 epoch 113 - iter 2120/2650 - loss 0.21878375 throughput (samples/sec): 97.80 -2019-08-09 19:42:58,553 epoch 113 - iter 2385/2650 - loss 0.21951930 throughput (samples/sec): 94.79 -2019-08-09 19:44:24,543 ---------------------------------------------------------------------------------------------------- -2019-08-09 19:44:24,544 EPOCH 113 done: loss 0.2195 - lr 0.0500 -2019-08-09 19:44:24,544 BAD EPOCHS (no improvement): 0 -2019-08-09 19:44:24,544 ---------------------------------------------------------------------------------------------------- -2019-08-09 19:44:24,851 epoch 114 - iter 0/2650 - loss 0.31130242 throughput (samples/sec): 27964.47 -2019-08-09 19:45:49,178 epoch 114 - iter 265/2650 - loss 0.21054818 throughput (samples/sec): 100.61 -2019-08-09 19:47:16,614 epoch 114 - iter 530/2650 - loss 0.21694362 throughput (samples/sec): 97.03 -2019-08-09 19:48:41,597 epoch 114 - iter 795/2650 - loss 0.21024441 throughput (samples/sec): 99.84 -2019-08-09 19:50:07,777 epoch 114 - iter 1060/2650 - loss 0.21233952 throughput (samples/sec): 98.45 -2019-08-09 19:51:34,797 epoch 114 - iter 1325/2650 - loss 0.21154502 throughput (samples/sec): 97.50 -2019-08-09 19:53:02,869 epoch 114 - iter 1590/2650 - loss 0.21354331 throughput (samples/sec): 96.33 -2019-08-09 19:54:28,603 epoch 114 - iter 1855/2650 - loss 0.21448387 throughput (samples/sec): 98.96 -2019-08-09 19:55:55,363 epoch 114 - iter 2120/2650 - loss 0.21679913 throughput (samples/sec): 97.79 -2019-08-09 19:57:22,535 epoch 114 - iter 2385/2650 - loss 0.21831593 throughput (samples/sec): 97.33 -2019-08-09 19:58:48,281 ---------------------------------------------------------------------------------------------------- -2019-08-09 19:58:48,281 EPOCH 114 done: loss 0.2178 - lr 0.0500 -2019-08-09 19:58:48,281 BAD EPOCHS (no improvement): 0 -2019-08-09 19:58:48,282 ---------------------------------------------------------------------------------------------------- -2019-08-09 19:58:48,695 epoch 115 - iter 0/2650 - loss 0.40401989 throughput (samples/sec): 20721.49 -2019-08-09 20:00:13,479 epoch 115 - iter 265/2650 - loss 0.20444066 throughput (samples/sec): 100.07 -2019-08-09 20:01:35,803 epoch 115 - iter 530/2650 - loss 0.20640637 throughput (samples/sec): 103.06 -2019-08-09 20:03:02,624 epoch 115 - iter 795/2650 - loss 0.21402562 throughput (samples/sec): 97.72 -2019-08-09 20:04:26,891 epoch 115 - iter 1060/2650 - loss 0.21551842 throughput (samples/sec): 100.69 -2019-08-09 20:05:50,901 epoch 115 - iter 1325/2650 - loss 0.21305151 throughput (samples/sec): 100.99 -2019-08-09 20:07:17,635 epoch 115 - iter 1590/2650 - loss 0.21330313 throughput (samples/sec): 97.82 -2019-08-09 20:08:46,344 epoch 115 - iter 1855/2650 - loss 0.21411255 throughput (samples/sec): 95.64 -2019-08-09 20:10:12,264 epoch 115 - iter 2120/2650 - loss 0.21441253 throughput (samples/sec): 98.75 -2019-08-09 20:11:37,642 epoch 115 - iter 2385/2650 - loss 0.21370619 throughput (samples/sec): 99.37 -2019-08-09 20:13:02,214 ---------------------------------------------------------------------------------------------------- -2019-08-09 20:13:02,214 EPOCH 115 done: loss 0.2144 - lr 0.0500 -2019-08-09 20:13:02,214 BAD EPOCHS (no improvement): 0 -2019-08-09 20:13:02,214 ---------------------------------------------------------------------------------------------------- -2019-08-09 20:13:02,490 epoch 116 - iter 0/2650 - loss 0.26621729 throughput (samples/sec): 31176.24 -2019-08-09 20:14:30,081 epoch 116 - iter 265/2650 - loss 0.22059336 throughput (samples/sec): 96.86 -2019-08-09 20:15:57,601 epoch 116 - iter 530/2650 - loss 0.22501244 throughput (samples/sec): 96.94 -2019-08-09 20:17:21,284 epoch 116 - iter 795/2650 - loss 0.22357816 throughput (samples/sec): 101.39 -2019-08-09 20:18:49,410 epoch 116 - iter 1060/2650 - loss 0.22132770 throughput (samples/sec): 96.27 -2019-08-09 20:20:14,983 epoch 116 - iter 1325/2650 - loss 0.22359544 throughput (samples/sec): 99.15 -2019-08-09 20:21:37,819 epoch 116 - iter 1590/2650 - loss 0.22258272 throughput (samples/sec): 102.42 -2019-08-09 20:23:02,323 epoch 116 - iter 1855/2650 - loss 0.22173152 throughput (samples/sec): 100.40 -2019-08-09 20:24:25,174 epoch 116 - iter 2120/2650 - loss 0.22265625 throughput (samples/sec): 102.40 -2019-08-09 20:25:47,008 epoch 116 - iter 2385/2650 - loss 0.22188380 throughput (samples/sec): 103.68 -2019-08-09 20:27:09,034 ---------------------------------------------------------------------------------------------------- -2019-08-09 20:27:09,034 EPOCH 116 done: loss 0.2230 - lr 0.0500 -2019-08-09 20:27:09,034 BAD EPOCHS (no improvement): 1 -2019-08-09 20:27:09,034 ---------------------------------------------------------------------------------------------------- -2019-08-09 20:27:09,352 epoch 117 - iter 0/2650 - loss 0.26855314 throughput (samples/sec): 26984.76 -2019-08-09 20:28:33,263 epoch 117 - iter 265/2650 - loss 0.23216449 throughput (samples/sec): 101.11 -2019-08-09 20:29:57,586 epoch 117 - iter 530/2650 - loss 0.21893011 throughput (samples/sec): 100.62 -2019-08-09 20:31:22,311 epoch 117 - iter 795/2650 - loss 0.22006820 throughput (samples/sec): 100.14 -2019-08-09 20:32:44,338 epoch 117 - iter 1060/2650 - loss 0.21473808 throughput (samples/sec): 103.44 -2019-08-09 20:34:08,859 epoch 117 - iter 1325/2650 - loss 0.21526154 throughput (samples/sec): 100.38 -2019-08-09 20:35:33,793 epoch 117 - iter 1590/2650 - loss 0.21565836 throughput (samples/sec): 99.89 -2019-08-09 20:36:56,958 epoch 117 - iter 1855/2650 - loss 0.21584024 throughput (samples/sec): 102.02 -2019-08-09 20:38:21,162 epoch 117 - iter 2120/2650 - loss 0.21557498 throughput (samples/sec): 100.76 -2019-08-09 20:39:43,312 epoch 117 - iter 2385/2650 - loss 0.21615244 throughput (samples/sec): 103.28 -2019-08-09 20:41:05,241 ---------------------------------------------------------------------------------------------------- -2019-08-09 20:41:05,241 EPOCH 117 done: loss 0.2176 - lr 0.0500 -2019-08-09 20:41:05,241 BAD EPOCHS (no improvement): 2 -2019-08-09 20:41:05,241 ---------------------------------------------------------------------------------------------------- -2019-08-09 20:41:05,591 epoch 118 - iter 0/2650 - loss 0.16174036 throughput (samples/sec): 24478.72 -2019-08-09 20:42:28,328 epoch 118 - iter 265/2650 - loss 0.22271493 throughput (samples/sec): 102.55 -2019-08-09 20:43:50,298 epoch 118 - iter 530/2650 - loss 0.21889377 throughput (samples/sec): 103.51 -2019-08-09 20:45:14,552 epoch 118 - iter 795/2650 - loss 0.20936358 throughput (samples/sec): 100.70 -2019-08-09 20:46:38,449 epoch 118 - iter 1060/2650 - loss 0.20972610 throughput (samples/sec): 101.13 -2019-08-09 20:48:01,920 epoch 118 - iter 1325/2650 - loss 0.21154286 throughput (samples/sec): 101.64 -2019-08-09 20:49:26,146 epoch 118 - iter 1590/2650 - loss 0.21314913 throughput (samples/sec): 100.73 -2019-08-09 20:50:49,082 epoch 118 - iter 1855/2650 - loss 0.21365355 throughput (samples/sec): 102.30 -2019-08-09 20:52:11,239 epoch 118 - iter 2120/2650 - loss 0.21570415 throughput (samples/sec): 103.27 -2019-08-09 20:53:35,783 epoch 118 - iter 2385/2650 - loss 0.21457670 throughput (samples/sec): 100.35 -2019-08-09 20:54:57,758 ---------------------------------------------------------------------------------------------------- -2019-08-09 20:54:57,758 EPOCH 118 done: loss 0.2158 - lr 0.0500 -2019-08-09 20:54:57,758 BAD EPOCHS (no improvement): 3 -2019-08-09 20:54:57,758 ---------------------------------------------------------------------------------------------------- -2019-08-09 20:54:57,964 epoch 119 - iter 0/2650 - loss 0.19877988 throughput (samples/sec): 41949.72 -2019-08-09 20:56:20,814 epoch 119 - iter 265/2650 - loss 0.20190120 throughput (samples/sec): 102.41 -2019-08-09 20:57:44,534 epoch 119 - iter 530/2650 - loss 0.21290144 throughput (samples/sec): 101.34 -2019-08-09 20:59:09,379 epoch 119 - iter 795/2650 - loss 0.21833885 throughput (samples/sec): 100.00 -2019-08-09 21:00:31,628 epoch 119 - iter 1060/2650 - loss 0.21585275 throughput (samples/sec): 103.15 -2019-08-09 21:01:54,384 epoch 119 - iter 1325/2650 - loss 0.21448388 throughput (samples/sec): 102.52 -2019-08-09 21:03:15,836 epoch 119 - iter 1590/2650 - loss 0.21652773 throughput (samples/sec): 104.16 -2019-08-09 21:04:39,692 epoch 119 - iter 1855/2650 - loss 0.21524439 throughput (samples/sec): 101.18 -2019-08-09 21:06:04,325 epoch 119 - iter 2120/2650 - loss 0.21494046 throughput (samples/sec): 100.25 -2019-08-09 21:07:29,587 epoch 119 - iter 2385/2650 - loss 0.21460512 throughput (samples/sec): 99.51 -2019-08-09 21:08:52,037 ---------------------------------------------------------------------------------------------------- -2019-08-09 21:08:52,038 EPOCH 119 done: loss 0.2161 - lr 0.0500 -2019-08-09 21:08:52,038 BAD EPOCHS (no improvement): 4 -2019-08-09 21:08:52,038 ---------------------------------------------------------------------------------------------------- -2019-08-09 21:08:52,286 epoch 120 - iter 0/2650 - loss 0.09104347 throughput (samples/sec): 34740.87 -2019-08-09 21:10:16,117 epoch 120 - iter 265/2650 - loss 0.19921830 throughput (samples/sec): 101.21 -2019-08-09 21:11:39,503 epoch 120 - iter 530/2650 - loss 0.20454328 throughput (samples/sec): 101.75 -2019-08-09 21:13:04,593 epoch 120 - iter 795/2650 - loss 0.20414639 throughput (samples/sec): 99.71 -2019-08-09 21:14:29,734 epoch 120 - iter 1060/2650 - loss 0.20164337 throughput (samples/sec): 99.65 -2019-08-09 21:15:54,682 epoch 120 - iter 1325/2650 - loss 0.20293894 throughput (samples/sec): 99.88 -2019-08-09 21:17:17,924 epoch 120 - iter 1590/2650 - loss 0.20513871 throughput (samples/sec): 101.93 -2019-08-09 21:18:40,829 epoch 120 - iter 1855/2650 - loss 0.20413065 throughput (samples/sec): 102.34 -2019-08-09 21:20:04,701 epoch 120 - iter 2120/2650 - loss 0.20553182 throughput (samples/sec): 101.16 -2019-08-09 21:21:30,498 epoch 120 - iter 2385/2650 - loss 0.20397526 throughput (samples/sec): 98.89 -2019-08-09 21:22:53,570 ---------------------------------------------------------------------------------------------------- -2019-08-09 21:22:53,571 EPOCH 120 done: loss 0.2059 - lr 0.0250 -2019-08-09 21:22:53,571 BAD EPOCHS (no improvement): 0 -2019-08-09 21:22:53,571 ---------------------------------------------------------------------------------------------------- -2019-08-09 21:22:54,233 epoch 121 - iter 0/2650 - loss 0.53145009 throughput (samples/sec): 12887.05 -2019-08-09 21:24:16,113 epoch 121 - iter 265/2650 - loss 0.20391241 throughput (samples/sec): 103.62 -2019-08-09 21:25:38,857 epoch 121 - iter 530/2650 - loss 0.20374159 throughput (samples/sec): 102.54 -2019-08-09 21:27:02,891 epoch 121 - iter 795/2650 - loss 0.20298432 throughput (samples/sec): 100.96 -2019-08-09 21:28:27,356 epoch 121 - iter 1060/2650 - loss 0.19986761 throughput (samples/sec): 100.45 -2019-08-09 21:29:53,727 epoch 121 - iter 1325/2650 - loss 0.20292822 throughput (samples/sec): 98.23 -2019-08-09 21:31:39,420 epoch 121 - iter 1590/2650 - loss 0.20469300 throughput (samples/sec): 80.26 -2019-08-09 21:33:30,780 epoch 121 - iter 1855/2650 - loss 0.20611931 throughput (samples/sec): 76.18 -2019-08-09 21:35:19,102 epoch 121 - iter 2120/2650 - loss 0.20507691 throughput (samples/sec): 78.32 -2019-08-09 21:36:56,956 epoch 121 - iter 2385/2650 - loss 0.20624145 throughput (samples/sec): 86.70 -2019-08-09 21:38:19,330 ---------------------------------------------------------------------------------------------------- -2019-08-09 21:38:19,331 EPOCH 121 done: loss 0.2052 - lr 0.0250 -2019-08-09 21:38:19,331 BAD EPOCHS (no improvement): 0 -2019-08-09 21:38:19,331 ---------------------------------------------------------------------------------------------------- -2019-08-09 21:38:19,640 epoch 122 - iter 0/2650 - loss 0.37430096 throughput (samples/sec): 27770.71 -2019-08-09 21:39:48,118 epoch 122 - iter 265/2650 - loss 0.20541239 throughput (samples/sec): 95.89 -2019-08-09 21:41:14,453 epoch 122 - iter 530/2650 - loss 0.20394396 throughput (samples/sec): 98.27 -2019-08-09 21:42:57,607 epoch 122 - iter 795/2650 - loss 0.20181570 throughput (samples/sec): 82.24 -2019-08-09 21:44:58,918 epoch 122 - iter 1060/2650 - loss 0.20281468 throughput (samples/sec): 69.93 -2019-08-09 21:46:44,276 epoch 122 - iter 1325/2650 - loss 0.20084101 throughput (samples/sec): 80.52 -2019-08-09 21:48:28,322 epoch 122 - iter 1590/2650 - loss 0.20265630 throughput (samples/sec): 81.54 -2019-08-09 21:50:10,938 epoch 122 - iter 1855/2650 - loss 0.20570190 throughput (samples/sec): 82.67 -2019-08-09 21:51:57,162 epoch 122 - iter 2120/2650 - loss 0.20514385 throughput (samples/sec): 79.86 -2019-08-09 21:53:42,294 epoch 122 - iter 2385/2650 - loss 0.20423951 throughput (samples/sec): 80.69 -2019-08-09 21:55:28,032 ---------------------------------------------------------------------------------------------------- -2019-08-09 21:55:28,033 EPOCH 122 done: loss 0.2046 - lr 0.0250 -2019-08-09 21:55:28,033 BAD EPOCHS (no improvement): 0 -2019-08-09 21:55:28,033 ---------------------------------------------------------------------------------------------------- -2019-08-09 21:55:28,480 epoch 123 - iter 0/2650 - loss 0.46486497 throughput (samples/sec): 19127.75 -2019-08-09 21:57:16,459 epoch 123 - iter 265/2650 - loss 0.20169438 throughput (samples/sec): 78.56 -2019-08-09 21:59:02,835 epoch 123 - iter 530/2650 - loss 0.20813837 throughput (samples/sec): 79.75 -2019-08-09 22:00:53,035 epoch 123 - iter 795/2650 - loss 0.20445215 throughput (samples/sec): 76.98 -2019-08-09 22:02:36,242 epoch 123 - iter 1060/2650 - loss 0.20139125 throughput (samples/sec): 82.21 -2019-08-09 22:04:25,648 epoch 123 - iter 1325/2650 - loss 0.20118176 throughput (samples/sec): 77.55 -2019-08-09 22:06:18,741 epoch 123 - iter 1590/2650 - loss 0.20269608 throughput (samples/sec): 75.01 -2019-08-09 22:08:10,015 epoch 123 - iter 1855/2650 - loss 0.20038729 throughput (samples/sec): 76.24 -2019-08-09 22:10:00,173 epoch 123 - iter 2120/2650 - loss 0.20155346 throughput (samples/sec): 77.01 -2019-08-09 22:11:45,394 epoch 123 - iter 2385/2650 - loss 0.20062042 throughput (samples/sec): 80.63 -2019-08-09 22:13:31,357 ---------------------------------------------------------------------------------------------------- -2019-08-09 22:13:31,357 EPOCH 123 done: loss 0.2016 - lr 0.0250 -2019-08-09 22:13:31,357 BAD EPOCHS (no improvement): 0 -2019-08-09 22:13:31,358 ---------------------------------------------------------------------------------------------------- -2019-08-09 22:13:31,766 epoch 124 - iter 0/2650 - loss 0.42024410 throughput (samples/sec): 20948.55 -2019-08-09 22:15:19,313 epoch 124 - iter 265/2650 - loss 0.20436236 throughput (samples/sec): 78.88 -2019-08-09 22:17:08,066 epoch 124 - iter 530/2650 - loss 0.19784566 throughput (samples/sec): 78.01 -2019-08-09 22:18:54,412 epoch 124 - iter 795/2650 - loss 0.19521471 throughput (samples/sec): 79.77 -2019-08-09 22:20:43,516 epoch 124 - iter 1060/2650 - loss 0.19569441 throughput (samples/sec): 77.76 -2019-08-09 22:22:13,815 epoch 124 - iter 1325/2650 - loss 0.19346101 throughput (samples/sec): 93.96 -2019-08-09 22:23:36,055 epoch 124 - iter 1590/2650 - loss 0.19051046 throughput (samples/sec): 103.16 -2019-08-09 22:25:05,346 epoch 124 - iter 1855/2650 - loss 0.19350757 throughput (samples/sec): 95.02 -2019-08-09 22:27:02,397 epoch 124 - iter 2120/2650 - loss 0.19509785 throughput (samples/sec): 72.47 -2019-08-09 22:28:49,930 epoch 124 - iter 2385/2650 - loss 0.19519362 throughput (samples/sec): 78.89 -2019-08-09 22:30:35,196 ---------------------------------------------------------------------------------------------------- -2019-08-09 22:30:35,197 EPOCH 124 done: loss 0.1957 - lr 0.0250 -2019-08-09 22:30:35,197 BAD EPOCHS (no improvement): 0 -2019-08-09 22:30:35,197 ---------------------------------------------------------------------------------------------------- -2019-08-09 22:30:35,550 epoch 125 - iter 0/2650 - loss 0.03123158 throughput (samples/sec): 24258.70 -2019-08-09 22:32:20,477 epoch 125 - iter 265/2650 - loss 0.19248549 throughput (samples/sec): 80.85 -2019-08-09 22:34:05,872 epoch 125 - iter 530/2650 - loss 0.19717052 throughput (samples/sec): 80.49 -2019-08-09 22:35:51,037 epoch 125 - iter 795/2650 - loss 0.19851121 throughput (samples/sec): 80.67 -2019-08-09 22:37:39,303 epoch 125 - iter 1060/2650 - loss 0.19345602 throughput (samples/sec): 78.36 -2019-08-09 22:39:22,131 epoch 125 - iter 1325/2650 - loss 0.19281290 throughput (samples/sec): 82.50 -2019-08-09 22:41:06,648 epoch 125 - iter 1590/2650 - loss 0.19492478 throughput (samples/sec): 81.17 -2019-08-09 22:42:30,566 epoch 125 - iter 1855/2650 - loss 0.19434351 throughput (samples/sec): 101.10 -2019-08-09 22:43:53,967 epoch 125 - iter 2120/2650 - loss 0.19256156 throughput (samples/sec): 101.73 -2019-08-09 22:45:39,620 epoch 125 - iter 2385/2650 - loss 0.19385741 throughput (samples/sec): 80.29 -2019-08-09 22:47:37,762 ---------------------------------------------------------------------------------------------------- -2019-08-09 22:47:37,762 EPOCH 125 done: loss 0.1934 - lr 0.0250 -2019-08-09 22:47:37,762 BAD EPOCHS (no improvement): 0 -2019-08-09 22:47:37,762 ---------------------------------------------------------------------------------------------------- -2019-08-09 22:47:38,087 epoch 126 - iter 0/2650 - loss 0.20917296 throughput (samples/sec): 26419.38 -2019-08-09 22:49:26,352 epoch 126 - iter 265/2650 - loss 0.18804332 throughput (samples/sec): 78.36 -2019-08-09 22:51:16,517 epoch 126 - iter 530/2650 - loss 0.19530081 throughput (samples/sec): 77.01 -2019-08-09 22:52:40,581 epoch 126 - iter 795/2650 - loss 0.18573199 throughput (samples/sec): 100.93 -2019-08-09 22:54:04,810 epoch 126 - iter 1060/2650 - loss 0.18589906 throughput (samples/sec): 100.73 -2019-08-09 22:55:58,221 epoch 126 - iter 1325/2650 - loss 0.19082970 throughput (samples/sec): 74.80 -2019-08-09 22:57:47,238 epoch 126 - iter 1590/2650 - loss 0.19276735 throughput (samples/sec): 77.82 -2019-08-09 22:59:30,509 epoch 126 - iter 1855/2650 - loss 0.19279483 throughput (samples/sec): 82.15 -2019-08-09 23:01:22,414 epoch 126 - iter 2120/2650 - loss 0.19357098 throughput (samples/sec): 75.81 -2019-08-09 23:03:12,588 epoch 126 - iter 2385/2650 - loss 0.19391250 throughput (samples/sec): 77.00 -2019-08-09 23:05:14,097 ---------------------------------------------------------------------------------------------------- -2019-08-09 23:05:14,097 EPOCH 126 done: loss 0.1944 - lr 0.0250 -2019-08-09 23:05:14,097 BAD EPOCHS (no improvement): 1 -2019-08-09 23:05:14,098 ---------------------------------------------------------------------------------------------------- -2019-08-09 23:05:14,503 epoch 127 - iter 0/2650 - loss 0.36565596 throughput (samples/sec): 21130.79 -2019-08-09 23:06:43,718 epoch 127 - iter 265/2650 - loss 0.19406638 throughput (samples/sec): 95.10 -2019-08-09 23:08:33,949 epoch 127 - iter 530/2650 - loss 0.19744848 throughput (samples/sec): 76.96 -2019-08-09 23:10:22,214 epoch 127 - iter 795/2650 - loss 0.19736364 throughput (samples/sec): 78.36 -2019-08-09 23:12:13,074 epoch 127 - iter 1060/2650 - loss 0.19719290 throughput (samples/sec): 76.52 -2019-08-09 23:14:00,841 epoch 127 - iter 1325/2650 - loss 0.19661644 throughput (samples/sec): 78.72 -2019-08-09 23:15:51,695 epoch 127 - iter 1590/2650 - loss 0.19471353 throughput (samples/sec): 76.53 -2019-08-09 23:17:41,412 epoch 127 - iter 1855/2650 - loss 0.19518438 throughput (samples/sec): 77.32 -2019-08-09 23:19:31,335 epoch 127 - iter 2120/2650 - loss 0.19443762 throughput (samples/sec): 77.18 -2019-08-09 23:21:25,150 epoch 127 - iter 2385/2650 - loss 0.19610389 throughput (samples/sec): 74.54 -2019-08-09 23:23:05,858 ---------------------------------------------------------------------------------------------------- -2019-08-09 23:23:05,858 EPOCH 127 done: loss 0.1957 - lr 0.0250 -2019-08-09 23:23:05,858 BAD EPOCHS (no improvement): 2 -2019-08-09 23:23:05,859 ---------------------------------------------------------------------------------------------------- -2019-08-09 23:23:06,250 epoch 128 - iter 0/2650 - loss 0.26048845 throughput (samples/sec): 21849.18 -2019-08-09 23:24:47,813 epoch 128 - iter 265/2650 - loss 0.19307294 throughput (samples/sec): 83.53 -2019-08-09 23:26:35,847 epoch 128 - iter 530/2650 - loss 0.18844957 throughput (samples/sec): 78.52 -2019-08-09 23:28:26,834 epoch 128 - iter 795/2650 - loss 0.18990338 throughput (samples/sec): 76.43 -2019-08-09 23:30:18,731 epoch 128 - iter 1060/2650 - loss 0.19202078 throughput (samples/sec): 75.81 -2019-08-09 23:32:05,768 epoch 128 - iter 1325/2650 - loss 0.19572903 throughput (samples/sec): 79.26 -2019-08-09 23:33:54,293 epoch 128 - iter 1590/2650 - loss 0.19591281 throughput (samples/sec): 78.17 -2019-08-09 23:35:43,176 epoch 128 - iter 1855/2650 - loss 0.19808757 throughput (samples/sec): 77.91 -2019-08-09 23:37:32,131 epoch 128 - iter 2120/2650 - loss 0.19702168 throughput (samples/sec): 77.86 -2019-08-09 23:39:12,317 epoch 128 - iter 2385/2650 - loss 0.19638159 throughput (samples/sec): 84.68 -2019-08-09 23:40:56,784 ---------------------------------------------------------------------------------------------------- -2019-08-09 23:40:56,784 EPOCH 128 done: loss 0.1954 - lr 0.0250 -2019-08-09 23:40:56,785 BAD EPOCHS (no improvement): 3 -2019-08-09 23:40:56,785 ---------------------------------------------------------------------------------------------------- -2019-08-09 23:40:57,270 epoch 129 - iter 0/2650 - loss 0.11749345 throughput (samples/sec): 17623.76 -2019-08-09 23:42:45,558 epoch 129 - iter 265/2650 - loss 0.17531263 throughput (samples/sec): 78.34 -2019-08-09 23:44:34,725 epoch 129 - iter 530/2650 - loss 0.18601146 throughput (samples/sec): 77.71 -2019-08-09 23:46:24,332 epoch 129 - iter 795/2650 - loss 0.18077094 throughput (samples/sec): 77.40 -2019-08-09 23:48:10,059 epoch 129 - iter 1060/2650 - loss 0.18148291 throughput (samples/sec): 80.24 -2019-08-09 23:49:58,013 epoch 129 - iter 1325/2650 - loss 0.18393423 throughput (samples/sec): 78.58 -2019-08-09 23:51:47,843 epoch 129 - iter 1590/2650 - loss 0.18655159 throughput (samples/sec): 77.24 -2019-08-09 23:53:41,902 epoch 129 - iter 1855/2650 - loss 0.18710320 throughput (samples/sec): 74.37 -2019-08-09 23:55:18,957 epoch 129 - iter 2120/2650 - loss 0.18724295 throughput (samples/sec): 87.41 -2019-08-09 23:57:08,323 epoch 129 - iter 2385/2650 - loss 0.18909187 throughput (samples/sec): 77.57 -2019-08-09 23:58:55,781 ---------------------------------------------------------------------------------------------------- -2019-08-09 23:58:55,782 EPOCH 129 done: loss 0.1892 - lr 0.0250 -2019-08-09 23:58:55,782 BAD EPOCHS (no improvement): 0 -2019-08-09 23:58:55,782 ---------------------------------------------------------------------------------------------------- -2019-08-09 23:58:56,163 epoch 130 - iter 0/2650 - loss 0.61453879 throughput (samples/sec): 22441.92 -2019-08-10 00:00:46,987 epoch 130 - iter 265/2650 - loss 0.17348825 throughput (samples/sec): 76.55 -2019-08-10 00:02:32,832 epoch 130 - iter 530/2650 - loss 0.17511855 throughput (samples/sec): 80.15 -2019-08-10 00:04:23,000 epoch 130 - iter 795/2650 - loss 0.18297108 throughput (samples/sec): 77.00 -2019-08-10 00:06:11,482 epoch 130 - iter 1060/2650 - loss 0.18253241 throughput (samples/sec): 78.20 -2019-08-10 00:08:02,538 epoch 130 - iter 1325/2650 - loss 0.18466496 throughput (samples/sec): 76.39 -2019-08-10 00:09:53,660 epoch 130 - iter 1590/2650 - loss 0.18495772 throughput (samples/sec): 76.34 -2019-08-10 00:11:26,293 epoch 130 - iter 1855/2650 - loss 0.18527675 throughput (samples/sec): 91.58 -2019-08-10 00:13:15,933 epoch 130 - iter 2120/2650 - loss 0.18578505 throughput (samples/sec): 77.37 -2019-08-10 00:15:05,906 epoch 130 - iter 2385/2650 - loss 0.18650379 throughput (samples/sec): 77.14 -2019-08-10 00:16:51,071 ---------------------------------------------------------------------------------------------------- -2019-08-10 00:16:51,071 EPOCH 130 done: loss 0.1866 - lr 0.0250 -2019-08-10 00:16:51,072 BAD EPOCHS (no improvement): 0 -2019-08-10 00:16:51,072 ---------------------------------------------------------------------------------------------------- -2019-08-10 00:16:51,433 epoch 131 - iter 0/2650 - loss 0.24921054 throughput (samples/sec): 23731.67 -2019-08-10 00:18:40,856 epoch 131 - iter 265/2650 - loss 0.18559888 throughput (samples/sec): 77.53 -2019-08-10 00:20:29,939 epoch 131 - iter 530/2650 - loss 0.18787522 throughput (samples/sec): 77.77 -2019-08-10 00:22:23,007 epoch 131 - iter 795/2650 - loss 0.18336057 throughput (samples/sec): 75.03 -2019-08-10 00:24:12,384 epoch 131 - iter 1060/2650 - loss 0.18566722 throughput (samples/sec): 77.56 -2019-08-10 00:25:58,049 epoch 131 - iter 1325/2650 - loss 0.18327694 throughput (samples/sec): 80.29 -2019-08-10 00:27:32,357 epoch 131 - iter 1590/2650 - loss 0.18489253 throughput (samples/sec): 89.96 -2019-08-10 00:29:21,354 epoch 131 - iter 1855/2650 - loss 0.18694890 throughput (samples/sec): 77.84 -2019-08-10 00:31:08,161 epoch 131 - iter 2120/2650 - loss 0.18508102 throughput (samples/sec): 79.43 -2019-08-10 00:32:57,703 epoch 131 - iter 2385/2650 - loss 0.18520474 throughput (samples/sec): 77.44 -2019-08-10 00:34:49,626 ---------------------------------------------------------------------------------------------------- -2019-08-10 00:34:49,626 EPOCH 131 done: loss 0.1855 - lr 0.0250 -2019-08-10 00:34:49,626 BAD EPOCHS (no improvement): 0 -2019-08-10 00:34:49,626 ---------------------------------------------------------------------------------------------------- -2019-08-10 00:34:49,975 epoch 132 - iter 0/2650 - loss 0.19269896 throughput (samples/sec): 24617.02 -2019-08-10 00:36:37,887 epoch 132 - iter 265/2650 - loss 0.17520606 throughput (samples/sec): 78.61 -2019-08-10 00:38:24,726 epoch 132 - iter 530/2650 - loss 0.18098655 throughput (samples/sec): 79.40 -2019-08-10 00:40:11,982 epoch 132 - iter 795/2650 - loss 0.18610073 throughput (samples/sec): 79.09 -2019-08-10 00:41:58,881 epoch 132 - iter 1060/2650 - loss 0.18931578 throughput (samples/sec): 79.36 -2019-08-10 00:43:36,828 epoch 132 - iter 1325/2650 - loss 0.18889622 throughput (samples/sec): 86.61 -2019-08-10 00:45:24,091 epoch 132 - iter 1590/2650 - loss 0.18673762 throughput (samples/sec): 79.09 -2019-08-10 00:47:12,883 epoch 132 - iter 1855/2650 - loss 0.18632328 throughput (samples/sec): 77.98 -2019-08-10 00:49:01,722 epoch 132 - iter 2120/2650 - loss 0.18567351 throughput (samples/sec): 77.94 -2019-08-10 00:50:48,475 epoch 132 - iter 2385/2650 - loss 0.18541436 throughput (samples/sec): 79.47 -2019-08-10 00:52:41,776 ---------------------------------------------------------------------------------------------------- -2019-08-10 00:52:41,776 EPOCH 132 done: loss 0.1851 - lr 0.0250 -2019-08-10 00:52:41,776 BAD EPOCHS (no improvement): 0 -2019-08-10 00:52:41,776 ---------------------------------------------------------------------------------------------------- -2019-08-10 00:52:42,128 epoch 133 - iter 0/2650 - loss 0.24629915 throughput (samples/sec): 24369.20 -2019-08-10 00:54:32,060 epoch 133 - iter 265/2650 - loss 0.19527730 throughput (samples/sec): 77.17 -2019-08-10 00:56:23,753 epoch 133 - iter 530/2650 - loss 0.18402669 throughput (samples/sec): 75.95 -2019-08-10 00:58:09,619 epoch 133 - iter 795/2650 - loss 0.18586471 throughput (samples/sec): 80.13 -2019-08-10 00:59:46,321 epoch 133 - iter 1060/2650 - loss 0.18487641 throughput (samples/sec): 87.73 -2019-08-10 01:01:35,705 epoch 133 - iter 1325/2650 - loss 0.18247311 throughput (samples/sec): 77.55 -2019-08-10 01:03:23,133 epoch 133 - iter 1590/2650 - loss 0.18299255 throughput (samples/sec): 78.97 -2019-08-10 01:05:10,067 epoch 133 - iter 1855/2650 - loss 0.18214147 throughput (samples/sec): 79.33 -2019-08-10 01:06:57,026 epoch 133 - iter 2120/2650 - loss 0.18143098 throughput (samples/sec): 79.31 -2019-08-10 01:08:45,207 epoch 133 - iter 2385/2650 - loss 0.18131246 throughput (samples/sec): 78.42 -2019-08-10 01:10:33,504 ---------------------------------------------------------------------------------------------------- -2019-08-10 01:10:33,504 EPOCH 133 done: loss 0.1807 - lr 0.0250 -2019-08-10 01:10:33,504 BAD EPOCHS (no improvement): 0 -2019-08-10 01:10:33,504 ---------------------------------------------------------------------------------------------------- -2019-08-10 01:10:34,122 epoch 134 - iter 0/2650 - loss 0.13186166 throughput (samples/sec): 13809.54 -2019-08-10 01:12:20,797 epoch 134 - iter 265/2650 - loss 0.18865665 throughput (samples/sec): 79.52 -2019-08-10 01:14:06,617 epoch 134 - iter 530/2650 - loss 0.18680504 throughput (samples/sec): 80.17 -2019-08-10 01:15:41,385 epoch 134 - iter 795/2650 - loss 0.18949294 throughput (samples/sec): 89.52 -2019-08-10 01:17:28,827 epoch 134 - iter 1060/2650 - loss 0.19001371 throughput (samples/sec): 78.96 -2019-08-10 01:19:18,305 epoch 134 - iter 1325/2650 - loss 0.19019353 throughput (samples/sec): 77.50 -2019-08-10 01:21:06,685 epoch 134 - iter 1590/2650 - loss 0.19063459 throughput (samples/sec): 78.27 -2019-08-10 01:22:55,340 epoch 134 - iter 1855/2650 - loss 0.19202276 throughput (samples/sec): 78.07 -2019-08-10 01:24:44,227 epoch 134 - iter 2120/2650 - loss 0.19195708 throughput (samples/sec): 77.91 -2019-08-10 01:26:32,147 epoch 134 - iter 2385/2650 - loss 0.19219322 throughput (samples/sec): 78.61 -2019-08-10 01:28:19,267 ---------------------------------------------------------------------------------------------------- -2019-08-10 01:28:19,267 EPOCH 134 done: loss 0.1929 - lr 0.0250 -2019-08-10 01:28:19,267 BAD EPOCHS (no improvement): 1 -2019-08-10 01:28:19,267 ---------------------------------------------------------------------------------------------------- -2019-08-10 01:28:19,747 epoch 135 - iter 0/2650 - loss 0.15560481 throughput (samples/sec): 17827.94 -2019-08-10 01:30:07,302 epoch 135 - iter 265/2650 - loss 0.18728462 throughput (samples/sec): 78.87 -2019-08-10 01:31:46,484 epoch 135 - iter 530/2650 - loss 0.17920028 throughput (samples/sec): 85.53 -2019-08-10 01:33:25,420 epoch 135 - iter 795/2650 - loss 0.18176951 throughput (samples/sec): 85.75 -2019-08-10 01:35:11,772 epoch 135 - iter 1060/2650 - loss 0.18259239 throughput (samples/sec): 79.77 -2019-08-10 01:36:59,760 epoch 135 - iter 1325/2650 - loss 0.18204821 throughput (samples/sec): 78.56 -2019-08-10 01:38:47,117 epoch 135 - iter 1590/2650 - loss 0.18389355 throughput (samples/sec): 79.02 -2019-08-10 01:40:31,978 epoch 135 - iter 1855/2650 - loss 0.18370575 throughput (samples/sec): 80.90 -2019-08-10 01:42:20,043 epoch 135 - iter 2120/2650 - loss 0.18393650 throughput (samples/sec): 78.50 -2019-08-10 01:44:10,023 epoch 135 - iter 2385/2650 - loss 0.18350489 throughput (samples/sec): 77.13 -2019-08-10 01:45:57,366 ---------------------------------------------------------------------------------------------------- -2019-08-10 01:45:57,366 EPOCH 135 done: loss 0.1842 - lr 0.0250 -2019-08-10 01:45:57,366 BAD EPOCHS (no improvement): 2 -2019-08-10 01:45:57,367 ---------------------------------------------------------------------------------------------------- -2019-08-10 01:45:57,691 epoch 136 - iter 0/2650 - loss 0.08344352 throughput (samples/sec): 26466.05 -2019-08-10 01:47:41,297 epoch 136 - iter 265/2650 - loss 0.18181312 throughput (samples/sec): 81.88 -2019-08-10 01:49:19,925 epoch 136 - iter 530/2650 - loss 0.17681686 throughput (samples/sec): 86.02 -2019-08-10 01:51:07,331 epoch 136 - iter 795/2650 - loss 0.17803025 throughput (samples/sec): 78.98 -2019-08-10 01:52:54,499 epoch 136 - iter 1060/2650 - loss 0.17948562 throughput (samples/sec): 79.16 -2019-08-10 01:54:43,518 epoch 136 - iter 1325/2650 - loss 0.18448388 throughput (samples/sec): 77.81 -2019-08-10 01:56:30,879 epoch 136 - iter 1590/2650 - loss 0.18321804 throughput (samples/sec): 79.02 -2019-08-10 01:58:19,803 epoch 136 - iter 1855/2650 - loss 0.18464254 throughput (samples/sec): 77.88 -2019-08-10 02:00:07,200 epoch 136 - iter 2120/2650 - loss 0.18476599 throughput (samples/sec): 78.99 -2019-08-10 02:01:54,967 epoch 136 - iter 2385/2650 - loss 0.18498930 throughput (samples/sec): 78.72 -2019-08-10 02:03:34,577 ---------------------------------------------------------------------------------------------------- -2019-08-10 02:03:34,577 EPOCH 136 done: loss 0.1846 - lr 0.0250 -2019-08-10 02:03:34,577 BAD EPOCHS (no improvement): 3 -2019-08-10 02:03:34,577 ---------------------------------------------------------------------------------------------------- -2019-08-10 02:03:34,882 epoch 137 - iter 0/2650 - loss 0.11519110 throughput (samples/sec): 28163.71 -2019-08-10 02:05:16,473 epoch 137 - iter 265/2650 - loss 0.18362697 throughput (samples/sec): 83.51 -2019-08-10 02:07:03,518 epoch 137 - iter 530/2650 - loss 0.18703275 throughput (samples/sec): 79.25 -2019-08-10 02:08:51,814 epoch 137 - iter 795/2650 - loss 0.18737962 throughput (samples/sec): 78.34 -2019-08-10 02:10:38,876 epoch 137 - iter 1060/2650 - loss 0.18414842 throughput (samples/sec): 79.24 -2019-08-10 02:12:26,696 epoch 137 - iter 1325/2650 - loss 0.18342032 throughput (samples/sec): 78.68 -2019-08-10 02:14:13,623 epoch 137 - iter 1590/2650 - loss 0.18573354 throughput (samples/sec): 79.34 -2019-08-10 02:16:05,000 epoch 137 - iter 1855/2650 - loss 0.18518509 throughput (samples/sec): 76.17 -2019-08-10 02:17:56,781 epoch 137 - iter 2120/2650 - loss 0.18507248 throughput (samples/sec): 75.89 -2019-08-10 02:19:39,106 epoch 137 - iter 2385/2650 - loss 0.18469363 throughput (samples/sec): 82.91 -2019-08-10 02:21:19,318 ---------------------------------------------------------------------------------------------------- -2019-08-10 02:21:19,319 EPOCH 137 done: loss 0.1846 - lr 0.0250 -2019-08-10 02:21:19,319 BAD EPOCHS (no improvement): 4 -2019-08-10 02:21:19,319 ---------------------------------------------------------------------------------------------------- -2019-08-10 02:21:19,793 epoch 138 - iter 0/2650 - loss 0.00819188 throughput (samples/sec): 18014.65 -2019-08-10 02:23:06,965 epoch 138 - iter 265/2650 - loss 0.17843646 throughput (samples/sec): 79.16 -2019-08-10 02:24:55,628 epoch 138 - iter 530/2650 - loss 0.17606421 throughput (samples/sec): 78.07 -2019-08-10 02:26:42,834 epoch 138 - iter 795/2650 - loss 0.17713702 throughput (samples/sec): 79.13 -2019-08-10 02:28:32,506 epoch 138 - iter 1060/2650 - loss 0.17209984 throughput (samples/sec): 77.35 -2019-08-10 02:30:20,677 epoch 138 - iter 1325/2650 - loss 0.17469157 throughput (samples/sec): 78.42 -2019-08-10 02:32:10,236 epoch 138 - iter 1590/2650 - loss 0.17469658 throughput (samples/sec): 77.43 -2019-08-10 02:34:01,247 epoch 138 - iter 1855/2650 - loss 0.17402000 throughput (samples/sec): 76.42 -2019-08-10 02:35:42,241 epoch 138 - iter 2120/2650 - loss 0.17537370 throughput (samples/sec): 84.00 -2019-08-10 02:37:22,565 epoch 138 - iter 2385/2650 - loss 0.17833447 throughput (samples/sec): 84.56 -2019-08-10 02:39:11,695 ---------------------------------------------------------------------------------------------------- -2019-08-10 02:39:11,695 EPOCH 138 done: loss 0.1792 - lr 0.0125 -2019-08-10 02:39:11,695 BAD EPOCHS (no improvement): 0 -2019-08-10 02:39:11,696 ---------------------------------------------------------------------------------------------------- -2019-08-10 02:39:12,036 epoch 139 - iter 0/2650 - loss 0.23919314 throughput (samples/sec): 25170.32 -2019-08-10 02:41:03,105 epoch 139 - iter 265/2650 - loss 0.19486463 throughput (samples/sec): 76.38 -2019-08-10 02:42:50,923 epoch 139 - iter 530/2650 - loss 0.17844562 throughput (samples/sec): 78.68 -2019-08-10 02:44:40,299 epoch 139 - iter 795/2650 - loss 0.18081222 throughput (samples/sec): 77.56 -2019-08-10 02:46:30,050 epoch 139 - iter 1060/2650 - loss 0.17831633 throughput (samples/sec): 77.29 -2019-08-10 02:48:17,478 epoch 139 - iter 1325/2650 - loss 0.18008940 throughput (samples/sec): 78.97 -2019-08-10 02:50:05,056 epoch 139 - iter 1590/2650 - loss 0.17899172 throughput (samples/sec): 78.86 -2019-08-10 02:51:44,093 epoch 139 - iter 1855/2650 - loss 0.17885841 throughput (samples/sec): 85.66 -2019-08-10 02:53:26,070 epoch 139 - iter 2120/2650 - loss 0.17750583 throughput (samples/sec): 83.19 -2019-08-10 02:55:15,508 epoch 139 - iter 2385/2650 - loss 0.17697864 throughput (samples/sec): 77.52 -2019-08-10 02:57:04,415 ---------------------------------------------------------------------------------------------------- -2019-08-10 02:57:04,416 EPOCH 139 done: loss 0.1763 - lr 0.0125 -2019-08-10 02:57:04,416 BAD EPOCHS (no improvement): 0 -2019-08-10 02:57:04,416 ---------------------------------------------------------------------------------------------------- -2019-08-10 02:57:04,950 epoch 140 - iter 0/2650 - loss 0.22677469 throughput (samples/sec): 15989.55 -2019-08-10 02:58:54,401 epoch 140 - iter 265/2650 - loss 0.18830966 throughput (samples/sec): 77.51 -2019-08-10 03:00:41,362 epoch 140 - iter 530/2650 - loss 0.18567131 throughput (samples/sec): 79.31 -2019-08-10 03:02:32,602 epoch 140 - iter 795/2650 - loss 0.18905803 throughput (samples/sec): 76.26 -2019-08-10 03:04:22,575 epoch 140 - iter 1060/2650 - loss 0.18271995 throughput (samples/sec): 77.14 -2019-08-10 03:06:11,665 epoch 140 - iter 1325/2650 - loss 0.18039573 throughput (samples/sec): 77.76 -2019-08-10 03:07:53,209 epoch 140 - iter 1590/2650 - loss 0.18164763 throughput (samples/sec): 83.55 -2019-08-10 03:09:37,577 epoch 140 - iter 1855/2650 - loss 0.18116883 throughput (samples/sec): 81.28 -2019-08-10 03:11:26,985 epoch 140 - iter 2120/2650 - loss 0.17959660 throughput (samples/sec): 77.54 -2019-08-10 03:13:15,989 epoch 140 - iter 2385/2650 - loss 0.17915805 throughput (samples/sec): 77.83 -2019-08-10 03:15:02,878 ---------------------------------------------------------------------------------------------------- -2019-08-10 03:15:02,878 EPOCH 140 done: loss 0.1795 - lr 0.0125 -2019-08-10 03:15:02,878 BAD EPOCHS (no improvement): 1 -2019-08-10 03:15:02,878 ---------------------------------------------------------------------------------------------------- -2019-08-10 03:15:03,361 epoch 141 - iter 0/2650 - loss 0.03540620 throughput (samples/sec): 17687.69 -2019-08-10 03:16:54,500 epoch 141 - iter 265/2650 - loss 0.18051554 throughput (samples/sec): 76.33 -2019-08-10 03:18:43,562 epoch 141 - iter 530/2650 - loss 0.18017139 throughput (samples/sec): 77.78 -2019-08-10 03:20:32,749 epoch 141 - iter 795/2650 - loss 0.18210806 throughput (samples/sec): 77.69 -2019-08-10 03:22:23,276 epoch 141 - iter 1060/2650 - loss 0.17800211 throughput (samples/sec): 76.75 -2019-08-10 03:23:59,192 epoch 141 - iter 1325/2650 - loss 0.17783820 throughput (samples/sec): 88.45 -2019-08-10 03:25:43,970 epoch 141 - iter 1590/2650 - loss 0.17567068 throughput (samples/sec): 80.97 -2019-08-10 03:27:31,375 epoch 141 - iter 1855/2650 - loss 0.17431688 throughput (samples/sec): 78.98 -2019-08-10 03:29:21,322 epoch 141 - iter 2120/2650 - loss 0.17544116 throughput (samples/sec): 77.16 -2019-08-10 03:31:08,474 epoch 141 - iter 2385/2650 - loss 0.17725825 throughput (samples/sec): 79.17 -2019-08-10 03:32:55,969 ---------------------------------------------------------------------------------------------------- -2019-08-10 03:32:55,969 EPOCH 141 done: loss 0.1774 - lr 0.0125 -2019-08-10 03:32:55,970 BAD EPOCHS (no improvement): 2 -2019-08-10 03:32:55,970 ---------------------------------------------------------------------------------------------------- -2019-08-10 03:32:56,414 epoch 142 - iter 0/2650 - loss 0.05217010 throughput (samples/sec): 19263.88 -2019-08-10 03:34:46,328 epoch 142 - iter 265/2650 - loss 0.17732616 throughput (samples/sec): 77.18 -2019-08-10 03:36:38,765 epoch 142 - iter 530/2650 - loss 0.18892347 throughput (samples/sec): 75.45 -2019-08-10 03:38:24,613 epoch 142 - iter 795/2650 - loss 0.18572100 throughput (samples/sec): 80.15 -2019-08-10 03:40:01,739 epoch 142 - iter 1060/2650 - loss 0.18375701 throughput (samples/sec): 87.35 -2019-08-10 03:41:49,085 epoch 142 - iter 1325/2650 - loss 0.18309947 throughput (samples/sec): 79.03 -2019-08-10 03:43:36,627 epoch 142 - iter 1590/2650 - loss 0.18268902 throughput (samples/sec): 78.88 -2019-08-10 03:45:24,236 epoch 142 - iter 1855/2650 - loss 0.18128570 throughput (samples/sec): 78.83 -2019-08-10 03:47:14,107 epoch 142 - iter 2120/2650 - loss 0.18071470 throughput (samples/sec): 77.21 -2019-08-10 03:49:00,644 epoch 142 - iter 2385/2650 - loss 0.18098626 throughput (samples/sec): 79.63 -2019-08-10 03:50:49,300 ---------------------------------------------------------------------------------------------------- -2019-08-10 03:50:49,300 EPOCH 142 done: loss 0.1805 - lr 0.0125 -2019-08-10 03:50:49,300 BAD EPOCHS (no improvement): 3 -2019-08-10 03:50:49,300 ---------------------------------------------------------------------------------------------------- -2019-08-10 03:50:49,799 epoch 143 - iter 0/2650 - loss 0.15482467 throughput (samples/sec): 17130.24 -2019-08-10 03:52:40,471 epoch 143 - iter 265/2650 - loss 0.17464481 throughput (samples/sec): 76.65 -2019-08-10 03:54:27,943 epoch 143 - iter 530/2650 - loss 0.17123706 throughput (samples/sec): 78.93 -2019-08-10 03:56:01,443 epoch 143 - iter 795/2650 - loss 0.17323226 throughput (samples/sec): 90.73 -2019-08-10 03:57:49,549 epoch 143 - iter 1060/2650 - loss 0.17213741 throughput (samples/sec): 78.47 -2019-08-10 03:59:43,469 epoch 143 - iter 1325/2650 - loss 0.17081376 throughput (samples/sec): 74.46 -2019-08-10 04:01:31,276 epoch 143 - iter 1590/2650 - loss 0.17083161 throughput (samples/sec): 78.69 -2019-08-10 04:03:21,367 epoch 143 - iter 1855/2650 - loss 0.17269354 throughput (samples/sec): 77.06 -2019-08-10 04:05:08,465 epoch 143 - iter 2120/2650 - loss 0.17249753 throughput (samples/sec): 79.21 -2019-08-10 04:06:57,137 epoch 143 - iter 2385/2650 - loss 0.17375012 throughput (samples/sec): 78.06 -2019-08-10 04:08:47,158 ---------------------------------------------------------------------------------------------------- -2019-08-10 04:08:47,158 EPOCH 143 done: loss 0.1742 - lr 0.0125 -2019-08-10 04:08:47,158 BAD EPOCHS (no improvement): 0 -2019-08-10 04:08:47,159 ---------------------------------------------------------------------------------------------------- -2019-08-10 04:08:47,609 epoch 144 - iter 0/2650 - loss 0.09170043 throughput (samples/sec): 18972.04 -2019-08-10 04:10:33,693 epoch 144 - iter 265/2650 - loss 0.17060924 throughput (samples/sec): 79.97 -2019-08-10 04:12:09,654 epoch 144 - iter 530/2650 - loss 0.16801396 throughput (samples/sec): 88.41 -2019-08-10 04:13:55,185 epoch 144 - iter 795/2650 - loss 0.17021749 throughput (samples/sec): 80.39 -2019-08-10 04:15:45,917 epoch 144 - iter 1060/2650 - loss 0.17174738 throughput (samples/sec): 76.61 -2019-08-10 04:17:33,431 epoch 144 - iter 1325/2650 - loss 0.17332525 throughput (samples/sec): 78.90 -2019-08-10 04:19:20,505 epoch 144 - iter 1590/2650 - loss 0.17726685 throughput (samples/sec): 79.23 -2019-08-10 04:21:08,077 epoch 144 - iter 1855/2650 - loss 0.17486028 throughput (samples/sec): 78.86 -2019-08-10 04:22:57,698 epoch 144 - iter 2120/2650 - loss 0.17611449 throughput (samples/sec): 77.39 -2019-08-10 04:24:44,487 epoch 144 - iter 2385/2650 - loss 0.17704732 throughput (samples/sec): 79.44 -2019-08-10 04:26:30,083 ---------------------------------------------------------------------------------------------------- -2019-08-10 04:26:30,083 EPOCH 144 done: loss 0.1769 - lr 0.0125 -2019-08-10 04:26:30,083 BAD EPOCHS (no improvement): 1 -2019-08-10 04:26:30,083 ---------------------------------------------------------------------------------------------------- -2019-08-10 04:26:30,476 epoch 145 - iter 0/2650 - loss 0.05851460 throughput (samples/sec): 21810.97 -2019-08-10 04:28:05,668 epoch 145 - iter 265/2650 - loss 0.18658631 throughput (samples/sec): 89.12 -2019-08-10 04:29:52,397 epoch 145 - iter 530/2650 - loss 0.17748493 throughput (samples/sec): 79.48 -2019-08-10 04:31:40,472 epoch 145 - iter 795/2650 - loss 0.17884143 throughput (samples/sec): 78.49 -2019-08-10 04:33:24,769 epoch 145 - iter 1060/2650 - loss 0.17442886 throughput (samples/sec): 81.34 -2019-08-10 04:35:14,193 epoch 145 - iter 1325/2650 - loss 0.17237665 throughput (samples/sec): 77.52 -2019-08-10 04:37:01,413 epoch 145 - iter 1590/2650 - loss 0.17144569 throughput (samples/sec): 79.12 -2019-08-10 04:38:46,882 epoch 145 - iter 1855/2650 - loss 0.16966073 throughput (samples/sec): 80.43 -2019-08-10 04:40:35,750 epoch 145 - iter 2120/2650 - loss 0.17145831 throughput (samples/sec): 77.92 -2019-08-10 04:42:19,816 epoch 145 - iter 2385/2650 - loss 0.17287556 throughput (samples/sec): 81.52 -2019-08-10 04:43:57,466 ---------------------------------------------------------------------------------------------------- -2019-08-10 04:43:57,466 EPOCH 145 done: loss 0.1742 - lr 0.0125 -2019-08-10 04:43:57,466 BAD EPOCHS (no improvement): 0 -2019-08-10 04:43:57,466 ---------------------------------------------------------------------------------------------------- -2019-08-10 04:43:57,776 epoch 146 - iter 0/2650 - loss 0.03001368 throughput (samples/sec): 27630.85 -2019-08-10 04:45:45,265 epoch 146 - iter 265/2650 - loss 0.17782751 throughput (samples/sec): 78.92 -2019-08-10 04:47:32,455 epoch 146 - iter 530/2650 - loss 0.17977952 throughput (samples/sec): 79.14 -2019-08-10 04:49:21,059 epoch 146 - iter 795/2650 - loss 0.17583682 throughput (samples/sec): 78.11 -2019-08-10 04:51:06,739 epoch 146 - iter 1060/2650 - loss 0.17278514 throughput (samples/sec): 80.27 -2019-08-10 04:52:53,917 epoch 146 - iter 1325/2650 - loss 0.17405615 throughput (samples/sec): 79.15 -2019-08-10 04:54:44,150 epoch 146 - iter 1590/2650 - loss 0.17519476 throughput (samples/sec): 76.95 -2019-08-10 04:56:34,425 epoch 146 - iter 1855/2650 - loss 0.17558699 throughput (samples/sec): 76.92 -2019-08-10 04:58:15,468 epoch 146 - iter 2120/2650 - loss 0.17741514 throughput (samples/sec): 83.96 -2019-08-10 04:59:56,109 epoch 146 - iter 2385/2650 - loss 0.17871923 throughput (samples/sec): 84.29 -2019-08-10 05:01:41,648 ---------------------------------------------------------------------------------------------------- -2019-08-10 05:01:41,648 EPOCH 146 done: loss 0.1789 - lr 0.0125 -2019-08-10 05:01:41,648 BAD EPOCHS (no improvement): 1 -2019-08-10 05:01:41,648 ---------------------------------------------------------------------------------------------------- -2019-08-10 05:01:42,238 epoch 147 - iter 0/2650 - loss 0.09026635 throughput (samples/sec): 14461.74 -2019-08-10 05:03:28,848 epoch 147 - iter 265/2650 - loss 0.18574277 throughput (samples/sec): 79.57 -2019-08-10 05:05:14,318 epoch 147 - iter 530/2650 - loss 0.17609867 throughput (samples/sec): 80.43 -2019-08-10 05:07:06,098 epoch 147 - iter 795/2650 - loss 0.17796564 throughput (samples/sec): 75.89 -2019-08-10 05:08:53,566 epoch 147 - iter 1060/2650 - loss 0.17530444 throughput (samples/sec): 78.94 -2019-08-10 05:10:39,631 epoch 147 - iter 1325/2650 - loss 0.17593918 throughput (samples/sec): 79.98 -2019-08-10 05:12:28,977 epoch 147 - iter 1590/2650 - loss 0.17679133 throughput (samples/sec): 77.58 -2019-08-10 05:14:03,971 epoch 147 - iter 1855/2650 - loss 0.17557958 throughput (samples/sec): 89.30 -2019-08-10 05:15:45,898 epoch 147 - iter 2120/2650 - loss 0.17360490 throughput (samples/sec): 83.23 -2019-08-10 05:17:34,012 epoch 147 - iter 2385/2650 - loss 0.17358304 throughput (samples/sec): 78.46 -2019-08-10 05:19:19,787 ---------------------------------------------------------------------------------------------------- -2019-08-10 05:19:19,787 EPOCH 147 done: loss 0.1726 - lr 0.0125 -2019-08-10 05:19:19,787 BAD EPOCHS (no improvement): 0 -2019-08-10 05:19:19,788 ---------------------------------------------------------------------------------------------------- -2019-08-10 05:19:20,158 epoch 148 - iter 0/2650 - loss 0.10176063 throughput (samples/sec): 23080.47 -2019-08-10 05:21:08,066 epoch 148 - iter 265/2650 - loss 0.19260470 throughput (samples/sec): 78.61 -2019-08-10 05:22:55,928 epoch 148 - iter 530/2650 - loss 0.18968114 throughput (samples/sec): 78.65 -2019-08-10 05:24:42,094 epoch 148 - iter 795/2650 - loss 0.17941401 throughput (samples/sec): 79.91 -2019-08-10 05:26:26,338 epoch 148 - iter 1060/2650 - loss 0.17974233 throughput (samples/sec): 81.38 -2019-08-10 05:28:12,305 epoch 148 - iter 1325/2650 - loss 0.17760838 throughput (samples/sec): 80.05 -2019-08-10 05:29:48,328 epoch 148 - iter 1590/2650 - loss 0.17524619 throughput (samples/sec): 88.35 -2019-08-10 05:31:39,556 epoch 148 - iter 1855/2650 - loss 0.17642495 throughput (samples/sec): 76.27 -2019-08-10 05:33:27,279 epoch 148 - iter 2120/2650 - loss 0.17516272 throughput (samples/sec): 78.75 -2019-08-10 05:35:24,438 epoch 148 - iter 2385/2650 - loss 0.17443842 throughput (samples/sec): 72.40 -2019-08-10 05:37:09,525 ---------------------------------------------------------------------------------------------------- -2019-08-10 05:37:09,525 EPOCH 148 done: loss 0.1739 - lr 0.0125 -2019-08-10 05:37:09,525 BAD EPOCHS (no improvement): 1 -2019-08-10 05:37:09,526 ---------------------------------------------------------------------------------------------------- -2019-08-10 05:37:09,989 epoch 149 - iter 0/2650 - loss 0.03973123 throughput (samples/sec): 18455.94 -2019-08-10 05:38:59,666 epoch 149 - iter 265/2650 - loss 0.17610629 throughput (samples/sec): 77.35 -2019-08-10 05:40:52,172 epoch 149 - iter 530/2650 - loss 0.17486749 throughput (samples/sec): 75.40 -2019-08-10 05:42:41,126 epoch 149 - iter 795/2650 - loss 0.17536686 throughput (samples/sec): 77.86 -2019-08-10 05:44:20,109 epoch 149 - iter 1060/2650 - loss 0.17368030 throughput (samples/sec): 85.71 -2019-08-10 05:45:56,572 epoch 149 - iter 1325/2650 - loss 0.17618373 throughput (samples/sec): 87.94 -2019-08-10 05:47:43,425 epoch 149 - iter 1590/2650 - loss 0.17475238 throughput (samples/sec): 79.39 -2019-08-10 05:49:29,020 epoch 149 - iter 1855/2650 - loss 0.17484268 throughput (samples/sec): 80.34 -2019-08-10 05:51:14,830 epoch 149 - iter 2120/2650 - loss 0.17398818 throughput (samples/sec): 80.17 -2019-08-10 05:53:01,015 epoch 149 - iter 2385/2650 - loss 0.17336181 throughput (samples/sec): 79.89 -2019-08-10 05:54:47,513 ---------------------------------------------------------------------------------------------------- -2019-08-10 05:54:47,513 EPOCH 149 done: loss 0.1732 - lr 0.0125 -2019-08-10 05:54:47,514 BAD EPOCHS (no improvement): 2 -2019-08-10 05:54:47,514 ---------------------------------------------------------------------------------------------------- -2019-08-10 05:54:47,924 epoch 150 - iter 0/2650 - loss 0.10671207 throughput (samples/sec): 20868.87 -2019-08-10 05:56:31,905 epoch 150 - iter 265/2650 - loss 0.16753308 throughput (samples/sec): 81.58 -2019-08-10 05:58:19,832 epoch 150 - iter 530/2650 - loss 0.16438649 throughput (samples/sec): 78.60 -2019-08-10 06:00:01,083 epoch 150 - iter 795/2650 - loss 0.17087488 throughput (samples/sec): 83.79 -2019-08-10 06:01:43,708 epoch 150 - iter 1060/2650 - loss 0.16698422 throughput (samples/sec): 82.66 -2019-08-10 06:03:31,256 epoch 150 - iter 1325/2650 - loss 0.16843817 throughput (samples/sec): 78.88 -2019-08-10 06:05:17,098 epoch 150 - iter 1590/2650 - loss 0.16949002 throughput (samples/sec): 80.15 -2019-08-10 06:07:03,505 epoch 150 - iter 1855/2650 - loss 0.17115173 throughput (samples/sec): 79.72 -2019-08-10 06:08:47,863 epoch 150 - iter 2120/2650 - loss 0.17045474 throughput (samples/sec): 81.29 -2019-08-10 06:10:35,817 epoch 150 - iter 2385/2650 - loss 0.17136057 throughput (samples/sec): 78.58 -2019-08-10 06:12:22,453 ---------------------------------------------------------------------------------------------------- -2019-08-10 06:12:22,453 EPOCH 150 done: loss 0.1715 - lr 0.0125 -2019-08-10 06:12:22,453 BAD EPOCHS (no improvement): 0 -2019-08-10 06:12:39,109 ---------------------------------------------------------------------------------------------------- -2019-08-10 06:12:39,109 Testing using best model ... -2019-08-10 06:12:39,110 loading file resources/taggers/release-ner-ontonotes-0/best-model.pt -2019-08-10 06:20:44,706 0.0937 0.0311 0.0467 -2019-08-10 06:20:44,706 -MICRO_AVG: acc 0.0239 - f1-score 0.0467 -MACRO_AVG: acc 0.0074 - f1-score 0.013377777777777778 -CARDINAL tp: 1 - fp: 163 - fn: 934 - tn: 1 - precision: 0.0061 - recall: 0.0011 - accuracy: 0.0009 - f1-score: 0.0019 -DATE tp: 0 - fp: 207 - fn: 1602 - tn: 0 - precision: 0.0000 - recall: 0.0000 - accuracy: 0.0000 - f1-score: 0.0000 -EVENT tp: 0 - fp: 0 - fn: 63 - tn: 0 - precision: 0.0000 - recall: 0.0000 - accuracy: 0.0000 - f1-score: 0.0000 -FAC tp: 0 - fp: 1 - fn: 135 - tn: 0 - precision: 0.0000 - recall: 0.0000 - accuracy: 0.0000 - f1-score: 0.0000 -GPE tp: 323 - fp: 477 - fn: 1917 - tn: 323 - precision: 0.4037 - recall: 0.1442 - accuracy: 0.1189 - f1-score: 0.2125 -LANGUAGE tp: 0 - fp: 57 - fn: 22 - tn: 0 - precision: 0.0000 - recall: 0.0000 - accuracy: 0.0000 - f1-score: 0.0000 -LAW tp: 0 - fp: 0 - fn: 40 - tn: 0 - precision: 0.0000 - recall: 0.0000 - accuracy: 0.0000 - f1-score: 0.0000 -LOC tp: 0 - fp: 0 - fn: 179 - tn: 0 - precision: 0.0000 - recall: 0.0000 - accuracy: 0.0000 - f1-score: 0.0000 -MONEY tp: 0 - fp: 187 - fn: 314 - tn: 0 - precision: 0.0000 - recall: 0.0000 - accuracy: 0.0000 - f1-score: 0.0000 -NORP tp: 0 - fp: 330 - fn: 841 - tn: 0 - precision: 0.0000 - recall: 0.0000 - accuracy: 0.0000 - f1-score: 0.0000 -ORDINAL tp: 0 - fp: 384 - fn: 195 - tn: 0 - precision: 0.0000 - recall: 0.0000 - accuracy: 0.0000 - f1-score: 0.0000 -ORG tp: 21 - fp: 409 - fn: 1774 - tn: 21 - precision: 0.0488 - recall: 0.0117 - accuracy: 0.0095 - f1-score: 0.0189 -PERCENT tp: 0 - fp: 42 - fn: 349 - tn: 0 - precision: 0.0000 - recall: 0.0000 - accuracy: 0.0000 - f1-score: 0.0000 -PERSON tp: 2 - fp: 149 - fn: 1986 - tn: 2 - precision: 0.0132 - recall: 0.0010 - accuracy: 0.0009 - f1-score: 0.0019 -PRODUCT tp: 0 - fp: 37 - fn: 76 - tn: 0 - precision: 0.0000 - recall: 0.0000 - accuracy: 0.0000 - f1-score: 0.0000 -QUANTITY tp: 0 - fp: 0 - fn: 105 - tn: 0 - precision: 0.0000 - recall: 0.0000 - accuracy: 0.0000 - f1-score: 0.0000 -TIME tp: 0 - fp: 34 - fn: 212 - tn: 0 - precision: 0.0000 - recall: 0.0000 - accuracy: 0.0000 - f1-score: 0.0000 -WORK_OF_ART tp: 3 - fp: 908 - fn: 163 - tn: 3 - precision: 0.0033 - recall: 0.0181 - accuracy: 0.0028 - f1-score: 0.0056 -2019-08-10 06:20:44,706 ---------------------------------------------------------------------------------------------------- +2023-04-05 22:30:15,038 ---------------------------------------------------------------------------------------------------- +2023-04-05 22:30:15,039 Corpus: "Corpus: 75187 train + 9603 dev + 9479 test sentences" +2023-04-05 22:30:15,039 ---------------------------------------------------------------------------------------------------- +2023-04-05 22:30:15,039 Parameters: +2023-04-05 22:30:15,039 - learning_rate: "0.100000" +2023-04-05 22:30:15,039 - mini_batch_size: "32" +2023-04-05 22:30:15,039 - patience: "3" +2023-04-05 22:30:15,039 - anneal_factor: "0.5" +2023-04-05 22:30:15,039 - max_epochs: "150" +2023-04-05 22:30:15,039 - shuffle: "True" +2023-04-05 22:30:15,039 - train_with_dev: "True" +2023-04-05 22:30:15,039 - batch_growth_annealing: "False" +2023-04-05 22:30:15,039 ---------------------------------------------------------------------------------------------------- +2023-04-05 22:30:15,039 Model training base path: "resources/taggers/release-ner-ontonotes-0" +2023-04-05 22:30:15,039 ---------------------------------------------------------------------------------------------------- +2023-04-05 22:30:15,039 Device: cuda:3 +2023-04-05 22:30:15,039 ---------------------------------------------------------------------------------------------------- +2023-04-05 22:30:15,039 Embeddings storage mode: cpu +2023-04-05 22:30:15,039 ---------------------------------------------------------------------------------------------------- +2023-04-05 22:30:32,814 epoch 1 - iter 265/2650 - loss 0.26753384 - time (sec): 17.77 - samples/sec: 3410.92 - lr: 0.100000 +2023-04-05 22:31:08,483 epoch 1 - iter 530/2650 - loss 0.27294258 - time (sec): 53.44 - samples/sec: 4058.67 - lr: 0.100000 +2023-04-05 22:31:51,964 epoch 1 - iter 795/2650 - loss 0.24279099 - time (sec): 96.93 - samples/sec: 4054.39 - lr: 0.100000 +2023-04-05 22:32:29,163 epoch 1 - iter 1060/2650 - loss 0.22574983 - time (sec): 134.12 - samples/sec: 4104.69 - lr: 0.100000 +2023-04-05 22:32:51,931 epoch 1 - iter 1325/2650 - loss 0.18673350 - time (sec): 156.89 - samples/sec: 4273.29 - lr: 0.100000 +2023-04-05 22:33:21,764 epoch 1 - iter 1590/2650 - loss 0.16883297 - time (sec): 186.72 - samples/sec: 4340.27 - lr: 0.100000 +2023-04-05 22:34:18,793 epoch 1 - iter 1855/2650 - loss 0.16963428 - time (sec): 243.75 - samples/sec: 4205.97 - lr: 0.100000 +2023-04-05 22:34:54,838 epoch 1 - iter 2120/2650 - loss 0.16383173 - time (sec): 279.80 - samples/sec: 4277.99 - lr: 0.100000 +2023-04-05 22:35:24,373 epoch 1 - iter 2385/2650 - loss 0.15943840 - time (sec): 309.33 - samples/sec: 4224.09 - lr: 0.100000 +2023-04-05 22:36:00,651 epoch 1 - iter 2650/2650 - loss 0.15617985 - time (sec): 345.61 - samples/sec: 4231.23 - lr: 0.100000 +2023-04-05 22:36:00,651 ---------------------------------------------------------------------------------------------------- +2023-04-05 22:36:00,651 EPOCH 1 done: loss 0.1562 - lr 0.100000 +2023-04-05 22:36:00,651 BAD EPOCHS (no improvement): 0 +2023-04-05 22:36:00,654 ---------------------------------------------------------------------------------------------------- +2023-04-05 22:36:20,175 epoch 2 - iter 265/2650 - loss 0.11266887 - time (sec): 19.52 - samples/sec: 7514.22 - lr: 0.100000 +2023-04-05 22:36:40,387 epoch 2 - iter 530/2650 - loss 0.10817789 - time (sec): 39.73 - samples/sec: 7381.47 - lr: 0.100000 +2023-04-05 22:37:00,484 epoch 2 - iter 795/2650 - loss 0.10710700 - time (sec): 59.83 - samples/sec: 7365.19 - lr: 0.100000 +2023-04-05 22:37:20,242 epoch 2 - iter 1060/2650 - loss 0.10320501 - time (sec): 79.59 - samples/sec: 7384.58 - lr: 0.100000 +2023-04-05 22:37:39,929 epoch 2 - iter 1325/2650 - loss 0.10145208 - time (sec): 99.27 - samples/sec: 7397.57 - lr: 0.100000 +2023-04-05 22:37:59,130 epoch 2 - iter 1590/2650 - loss 0.09967449 - time (sec): 118.48 - samples/sec: 7419.91 - lr: 0.100000 +2023-04-05 22:38:18,213 epoch 2 - iter 1855/2650 - loss 0.09813847 - time (sec): 137.56 - samples/sec: 7457.22 - lr: 0.100000 +2023-04-05 22:38:37,939 epoch 2 - iter 2120/2650 - loss 0.09664446 - time (sec): 157.28 - samples/sec: 7446.97 - lr: 0.100000 +2023-04-05 22:38:57,208 epoch 2 - iter 2385/2650 - loss 0.09547294 - time (sec): 176.55 - samples/sec: 7453.94 - lr: 0.100000 +2023-04-05 22:39:17,307 epoch 2 - iter 2650/2650 - loss 0.09408016 - time (sec): 196.65 - samples/sec: 7436.28 - lr: 0.100000 +2023-04-05 22:39:17,307 ---------------------------------------------------------------------------------------------------- +2023-04-05 22:39:17,307 EPOCH 2 done: loss 0.0941 - lr 0.100000 +2023-04-05 22:39:17,307 BAD EPOCHS (no improvement): 0 +2023-04-05 22:39:17,310 ---------------------------------------------------------------------------------------------------- +2023-04-05 22:39:37,267 epoch 3 - iter 265/2650 - loss 0.07783923 - time (sec): 19.96 - samples/sec: 7299.54 - lr: 0.100000 +2023-04-05 22:39:57,216 epoch 3 - iter 530/2650 - loss 0.07650488 - time (sec): 39.91 - samples/sec: 7265.92 - lr: 0.100000 +2023-04-05 22:40:16,963 epoch 3 - iter 795/2650 - loss 0.07719409 - time (sec): 59.65 - samples/sec: 7344.12 - lr: 0.100000 +2023-04-05 22:40:36,712 epoch 3 - iter 1060/2650 - loss 0.07616210 - time (sec): 79.40 - samples/sec: 7340.71 - lr: 0.100000 +2023-04-05 22:40:55,833 epoch 3 - iter 1325/2650 - loss 0.07542488 - time (sec): 98.52 - samples/sec: 7400.24 - lr: 0.100000 +2023-04-05 22:41:15,217 epoch 3 - iter 1590/2650 - loss 0.07535956 - time (sec): 117.91 - samples/sec: 7422.77 - lr: 0.100000 +2023-04-05 22:41:35,620 epoch 3 - iter 1855/2650 - loss 0.07497975 - time (sec): 138.31 - samples/sec: 7393.97 - lr: 0.100000 +2023-04-05 22:41:55,694 epoch 3 - iter 2120/2650 - loss 0.07488640 - time (sec): 158.38 - samples/sec: 7387.59 - lr: 0.100000 +2023-04-05 22:42:14,676 epoch 3 - iter 2385/2650 - loss 0.07452064 - time (sec): 177.37 - samples/sec: 7409.65 - lr: 0.100000 +2023-04-05 22:42:34,632 epoch 3 - iter 2650/2650 - loss 0.07399061 - time (sec): 197.32 - samples/sec: 7411.06 - lr: 0.100000 +2023-04-05 22:42:34,633 ---------------------------------------------------------------------------------------------------- +2023-04-05 22:42:34,633 EPOCH 3 done: loss 0.0740 - lr 0.100000 +2023-04-05 22:42:34,633 BAD EPOCHS (no improvement): 0 +2023-04-05 22:42:34,637 ---------------------------------------------------------------------------------------------------- +2023-04-05 22:42:54,041 epoch 4 - iter 265/2650 - loss 0.06719111 - time (sec): 19.40 - samples/sec: 7442.48 - lr: 0.100000 +2023-04-05 22:43:13,462 epoch 4 - iter 530/2650 - loss 0.06563034 - time (sec): 38.83 - samples/sec: 7441.37 - lr: 0.100000 +2023-04-05 22:43:33,226 epoch 4 - iter 795/2650 - loss 0.06592207 - time (sec): 58.59 - samples/sec: 7433.62 - lr: 0.100000 +2023-04-05 22:43:53,627 epoch 4 - iter 1060/2650 - loss 0.06555259 - time (sec): 78.99 - samples/sec: 7398.78 - lr: 0.100000 +2023-04-05 22:44:12,939 epoch 4 - iter 1325/2650 - loss 0.06575556 - time (sec): 98.30 - samples/sec: 7430.50 - lr: 0.100000 +2023-04-05 22:44:32,656 epoch 4 - iter 1590/2650 - loss 0.06516319 - time (sec): 118.02 - samples/sec: 7431.80 - lr: 0.100000 +2023-04-05 22:44:52,404 epoch 4 - iter 1855/2650 - loss 0.06536955 - time (sec): 137.77 - samples/sec: 7422.69 - lr: 0.100000 +2023-04-05 22:45:12,221 epoch 4 - iter 2120/2650 - loss 0.06486299 - time (sec): 157.58 - samples/sec: 7425.58 - lr: 0.100000 +2023-04-05 22:45:31,977 epoch 4 - iter 2385/2650 - loss 0.06478095 - time (sec): 177.34 - samples/sec: 7418.20 - lr: 0.100000 +2023-04-05 22:45:52,125 epoch 4 - iter 2650/2650 - loss 0.06459631 - time (sec): 197.49 - samples/sec: 7404.83 - lr: 0.100000 +2023-04-05 22:45:52,125 ---------------------------------------------------------------------------------------------------- +2023-04-05 22:45:52,125 EPOCH 4 done: loss 0.0646 - lr 0.100000 +2023-04-05 22:45:52,125 BAD EPOCHS (no improvement): 0 +2023-04-05 22:45:52,129 ---------------------------------------------------------------------------------------------------- +2023-04-05 22:46:11,939 epoch 5 - iter 265/2650 - loss 0.05973687 - time (sec): 19.81 - samples/sec: 7357.18 - lr: 0.100000 +2023-04-05 22:46:31,940 epoch 5 - iter 530/2650 - loss 0.05917111 - time (sec): 39.81 - samples/sec: 7354.57 - lr: 0.100000 +2023-04-05 22:46:50,759 epoch 5 - iter 795/2650 - loss 0.05935966 - time (sec): 58.63 - samples/sec: 7461.84 - lr: 0.100000 +2023-04-05 22:47:10,249 epoch 5 - iter 1060/2650 - loss 0.05946565 - time (sec): 78.12 - samples/sec: 7461.49 - lr: 0.100000 +2023-04-05 22:47:29,535 epoch 5 - iter 1325/2650 - loss 0.05923236 - time (sec): 97.41 - samples/sec: 7475.72 - lr: 0.100000 +2023-04-05 22:47:49,495 epoch 5 - iter 1590/2650 - loss 0.05918268 - time (sec): 117.37 - samples/sec: 7445.03 - lr: 0.100000 +2023-04-05 22:48:09,579 epoch 5 - iter 1855/2650 - loss 0.05875262 - time (sec): 137.45 - samples/sec: 7424.07 - lr: 0.100000 +2023-04-05 22:48:30,187 epoch 5 - iter 2120/2650 - loss 0.05927092 - time (sec): 158.06 - samples/sec: 7393.11 - lr: 0.100000 +2023-04-05 22:48:50,165 epoch 5 - iter 2385/2650 - loss 0.05920544 - time (sec): 178.04 - samples/sec: 7394.84 - lr: 0.100000 +2023-04-05 22:49:09,896 epoch 5 - iter 2650/2650 - loss 0.05907764 - time (sec): 197.77 - samples/sec: 7394.37 - lr: 0.100000 +2023-04-05 22:49:09,897 ---------------------------------------------------------------------------------------------------- +2023-04-05 22:49:09,897 EPOCH 5 done: loss 0.0591 - lr 0.100000 +2023-04-05 22:49:09,897 BAD EPOCHS (no improvement): 0 +2023-04-05 22:49:09,900 ---------------------------------------------------------------------------------------------------- +2023-04-05 22:49:29,334 epoch 6 - iter 265/2650 - loss 0.05432288 - time (sec): 19.43 - samples/sec: 7516.43 - lr: 0.100000 +2023-04-05 22:49:49,597 epoch 6 - iter 530/2650 - loss 0.05452878 - time (sec): 39.70 - samples/sec: 7356.38 - lr: 0.100000 +2023-04-05 22:50:09,358 epoch 6 - iter 795/2650 - loss 0.05516482 - time (sec): 59.46 - samples/sec: 7374.86 - lr: 0.100000 +2023-04-05 22:50:29,035 epoch 6 - iter 1060/2650 - loss 0.05541375 - time (sec): 79.14 - samples/sec: 7376.45 - lr: 0.100000 +2023-04-05 22:50:49,221 epoch 6 - iter 1325/2650 - loss 0.05551200 - time (sec): 99.32 - samples/sec: 7349.54 - lr: 0.100000 +2023-04-05 22:51:08,701 epoch 6 - iter 1590/2650 - loss 0.05539049 - time (sec): 118.80 - samples/sec: 7362.18 - lr: 0.100000 +2023-04-05 22:51:28,697 epoch 6 - iter 1855/2650 - loss 0.05542507 - time (sec): 138.80 - samples/sec: 7373.95 - lr: 0.100000 +2023-04-05 22:51:48,548 epoch 6 - iter 2120/2650 - loss 0.05541067 - time (sec): 158.65 - samples/sec: 7371.34 - lr: 0.100000 +2023-04-05 22:52:08,340 epoch 6 - iter 2385/2650 - loss 0.05545153 - time (sec): 178.44 - samples/sec: 7376.38 - lr: 0.100000 +2023-04-05 22:52:27,814 epoch 6 - iter 2650/2650 - loss 0.05526669 - time (sec): 197.91 - samples/sec: 7388.86 - lr: 0.100000 +2023-04-05 22:52:27,815 ---------------------------------------------------------------------------------------------------- +2023-04-05 22:52:27,815 EPOCH 6 done: loss 0.0553 - lr 0.100000 +2023-04-05 22:52:27,815 BAD EPOCHS (no improvement): 0 +2023-04-05 22:52:27,818 ---------------------------------------------------------------------------------------------------- +2023-04-05 22:52:47,338 epoch 7 - iter 265/2650 - loss 0.04891490 - time (sec): 19.52 - samples/sec: 7429.35 - lr: 0.100000 +2023-04-05 22:53:06,924 epoch 7 - iter 530/2650 - loss 0.05120080 - time (sec): 39.11 - samples/sec: 7420.36 - lr: 0.100000 +2023-04-05 22:53:27,114 epoch 7 - iter 795/2650 - loss 0.05129684 - time (sec): 59.30 - samples/sec: 7359.66 - lr: 0.100000 +2023-04-05 22:53:46,768 epoch 7 - iter 1060/2650 - loss 0.05161041 - time (sec): 78.95 - samples/sec: 7380.19 - lr: 0.100000 +2023-04-05 22:54:07,000 epoch 7 - iter 1325/2650 - loss 0.05165356 - time (sec): 99.18 - samples/sec: 7363.82 - lr: 0.100000 +2023-04-05 22:54:27,113 epoch 7 - iter 1590/2650 - loss 0.05159275 - time (sec): 119.29 - samples/sec: 7357.10 - lr: 0.100000 +2023-04-05 22:54:47,334 epoch 7 - iter 1855/2650 - loss 0.05192562 - time (sec): 139.52 - samples/sec: 7341.50 - lr: 0.100000 +2023-04-05 22:55:07,101 epoch 7 - iter 2120/2650 - loss 0.05203989 - time (sec): 159.28 - samples/sec: 7353.59 - lr: 0.100000 +2023-04-05 22:55:26,223 epoch 7 - iter 2385/2650 - loss 0.05204132 - time (sec): 178.40 - samples/sec: 7377.60 - lr: 0.100000 +2023-04-05 22:55:45,962 epoch 7 - iter 2650/2650 - loss 0.05201672 - time (sec): 198.14 - samples/sec: 7380.33 - lr: 0.100000 +2023-04-05 22:55:45,962 ---------------------------------------------------------------------------------------------------- +2023-04-05 22:55:45,962 EPOCH 7 done: loss 0.0520 - lr 0.100000 +2023-04-05 22:55:45,962 BAD EPOCHS (no improvement): 0 +2023-04-05 22:55:45,966 ---------------------------------------------------------------------------------------------------- +2023-04-05 22:56:05,316 epoch 8 - iter 265/2650 - loss 0.04853580 - time (sec): 19.35 - samples/sec: 7511.67 - lr: 0.100000 +2023-04-05 22:56:25,019 epoch 8 - iter 530/2650 - loss 0.04745612 - time (sec): 39.05 - samples/sec: 7443.61 - lr: 0.100000 +2023-04-05 22:56:44,649 epoch 8 - iter 795/2650 - loss 0.04766666 - time (sec): 58.68 - samples/sec: 7445.38 - lr: 0.100000 +2023-04-05 22:57:03,853 epoch 8 - iter 1060/2650 - loss 0.04851233 - time (sec): 77.89 - samples/sec: 7495.21 - lr: 0.100000 +2023-04-05 22:57:24,061 epoch 8 - iter 1325/2650 - loss 0.04905184 - time (sec): 98.09 - samples/sec: 7448.51 - lr: 0.100000 +2023-04-05 22:57:44,701 epoch 8 - iter 1590/2650 - loss 0.04925669 - time (sec): 118.73 - samples/sec: 7396.58 - lr: 0.100000 +2023-04-05 22:58:04,165 epoch 8 - iter 1855/2650 - loss 0.04955004 - time (sec): 138.20 - samples/sec: 7410.96 - lr: 0.100000 +2023-04-05 22:58:24,256 epoch 8 - iter 2120/2650 - loss 0.04949264 - time (sec): 158.29 - samples/sec: 7399.93 - lr: 0.100000 +2023-04-05 22:58:44,417 epoch 8 - iter 2385/2650 - loss 0.04950536 - time (sec): 178.45 - samples/sec: 7383.48 - lr: 0.100000 +2023-04-05 22:59:03,464 epoch 8 - iter 2650/2650 - loss 0.04943978 - time (sec): 197.50 - samples/sec: 7404.46 - lr: 0.100000 +2023-04-05 22:59:03,464 ---------------------------------------------------------------------------------------------------- +2023-04-05 22:59:03,464 EPOCH 8 done: loss 0.0494 - lr 0.100000 +2023-04-05 22:59:03,464 BAD EPOCHS (no improvement): 0 +2023-04-05 22:59:03,467 ---------------------------------------------------------------------------------------------------- +2023-04-05 22:59:23,247 epoch 9 - iter 265/2650 - loss 0.04629974 - time (sec): 19.78 - samples/sec: 7400.70 - lr: 0.100000 +2023-04-05 22:59:42,953 epoch 9 - iter 530/2650 - loss 0.04662181 - time (sec): 39.49 - samples/sec: 7356.32 - lr: 0.100000 +2023-04-05 23:00:02,695 epoch 9 - iter 795/2650 - loss 0.04730929 - time (sec): 59.23 - samples/sec: 7378.40 - lr: 0.100000 +2023-04-05 23:00:22,037 epoch 9 - iter 1060/2650 - loss 0.04736771 - time (sec): 78.57 - samples/sec: 7395.22 - lr: 0.100000 +2023-04-05 23:00:42,649 epoch 9 - iter 1325/2650 - loss 0.04760472 - time (sec): 99.18 - samples/sec: 7359.11 - lr: 0.100000 +2023-04-05 23:01:02,282 epoch 9 - iter 1590/2650 - loss 0.04773742 - time (sec): 118.82 - samples/sec: 7380.24 - lr: 0.100000 +2023-04-05 23:01:21,265 epoch 9 - iter 1855/2650 - loss 0.04813461 - time (sec): 137.80 - samples/sec: 7415.81 - lr: 0.100000 +2023-04-05 23:01:41,073 epoch 9 - iter 2120/2650 - loss 0.04796157 - time (sec): 157.61 - samples/sec: 7404.29 - lr: 0.100000 +2023-04-05 23:02:01,310 epoch 9 - iter 2385/2650 - loss 0.04766473 - time (sec): 177.84 - samples/sec: 7394.19 - lr: 0.100000 +2023-04-05 23:02:21,121 epoch 9 - iter 2650/2650 - loss 0.04761529 - time (sec): 197.65 - samples/sec: 7398.59 - lr: 0.100000 +2023-04-05 23:02:21,122 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:02:21,122 EPOCH 9 done: loss 0.0476 - lr 0.100000 +2023-04-05 23:02:21,122 BAD EPOCHS (no improvement): 0 +2023-04-05 23:02:21,126 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:02:40,052 epoch 10 - iter 265/2650 - loss 0.04401852 - time (sec): 18.93 - samples/sec: 7641.22 - lr: 0.100000 +2023-04-05 23:03:00,049 epoch 10 - iter 530/2650 - loss 0.04465764 - time (sec): 38.92 - samples/sec: 7511.87 - lr: 0.100000 +2023-04-05 23:03:20,403 epoch 10 - iter 795/2650 - loss 0.04494720 - time (sec): 59.28 - samples/sec: 7419.15 - lr: 0.100000 +2023-04-05 23:03:40,295 epoch 10 - iter 1060/2650 - loss 0.04523321 - time (sec): 79.17 - samples/sec: 7386.01 - lr: 0.100000 +2023-04-05 23:04:00,351 epoch 10 - iter 1325/2650 - loss 0.04516569 - time (sec): 99.22 - samples/sec: 7370.28 - lr: 0.100000 +2023-04-05 23:04:20,180 epoch 10 - iter 1590/2650 - loss 0.04527092 - time (sec): 119.05 - samples/sec: 7384.36 - lr: 0.100000 +2023-04-05 23:04:39,938 epoch 10 - iter 1855/2650 - loss 0.04589615 - time (sec): 138.81 - samples/sec: 7389.48 - lr: 0.100000 +2023-04-05 23:04:59,296 epoch 10 - iter 2120/2650 - loss 0.04617516 - time (sec): 158.17 - samples/sec: 7404.27 - lr: 0.100000 +2023-04-05 23:05:18,613 epoch 10 - iter 2385/2650 - loss 0.04630414 - time (sec): 177.49 - samples/sec: 7417.67 - lr: 0.100000 +2023-04-05 23:05:38,785 epoch 10 - iter 2650/2650 - loss 0.04598758 - time (sec): 197.66 - samples/sec: 7398.42 - lr: 0.100000 +2023-04-05 23:05:38,785 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:05:38,785 EPOCH 10 done: loss 0.0460 - lr 0.100000 +2023-04-05 23:05:38,786 BAD EPOCHS (no improvement): 0 +2023-04-05 23:05:38,790 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:05:59,245 epoch 11 - iter 265/2650 - loss 0.04308864 - time (sec): 20.46 - samples/sec: 7184.88 - lr: 0.100000 +2023-04-05 23:06:18,165 epoch 11 - iter 530/2650 - loss 0.04341556 - time (sec): 39.38 - samples/sec: 7384.04 - lr: 0.100000 +2023-04-05 23:06:38,033 epoch 11 - iter 795/2650 - loss 0.04383832 - time (sec): 59.24 - samples/sec: 7351.10 - lr: 0.100000 +2023-04-05 23:06:58,051 epoch 11 - iter 1060/2650 - loss 0.04354113 - time (sec): 79.26 - samples/sec: 7357.07 - lr: 0.100000 +2023-04-05 23:07:17,533 epoch 11 - iter 1325/2650 - loss 0.04422198 - time (sec): 98.74 - samples/sec: 7389.02 - lr: 0.100000 +2023-04-05 23:07:37,431 epoch 11 - iter 1590/2650 - loss 0.04468420 - time (sec): 118.64 - samples/sec: 7399.86 - lr: 0.100000 +2023-04-05 23:07:56,955 epoch 11 - iter 1855/2650 - loss 0.04430505 - time (sec): 138.16 - samples/sec: 7403.42 - lr: 0.100000 +2023-04-05 23:08:16,911 epoch 11 - iter 2120/2650 - loss 0.04443916 - time (sec): 158.12 - samples/sec: 7405.10 - lr: 0.100000 +2023-04-05 23:08:36,476 epoch 11 - iter 2385/2650 - loss 0.04487273 - time (sec): 177.69 - samples/sec: 7410.68 - lr: 0.100000 +2023-04-05 23:08:56,565 epoch 11 - iter 2650/2650 - loss 0.04488036 - time (sec): 197.78 - samples/sec: 7394.05 - lr: 0.100000 +2023-04-05 23:08:56,566 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:08:56,566 EPOCH 11 done: loss 0.0449 - lr 0.100000 +2023-04-05 23:08:56,566 BAD EPOCHS (no improvement): 0 +2023-04-05 23:08:56,568 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:09:15,735 epoch 12 - iter 265/2650 - loss 0.04334881 - time (sec): 19.17 - samples/sec: 7616.70 - lr: 0.100000 +2023-04-05 23:09:35,985 epoch 12 - iter 530/2650 - loss 0.04285008 - time (sec): 39.42 - samples/sec: 7405.04 - lr: 0.100000 +2023-04-05 23:09:56,340 epoch 12 - iter 795/2650 - loss 0.04256310 - time (sec): 59.77 - samples/sec: 7346.53 - lr: 0.100000 +2023-04-05 23:10:25,880 epoch 12 - iter 1060/2650 - loss 0.04275866 - time (sec): 89.31 - samples/sec: 6540.63 - lr: 0.100000 +2023-04-05 23:10:45,682 epoch 12 - iter 1325/2650 - loss 0.04238591 - time (sec): 109.11 - samples/sec: 6697.27 - lr: 0.100000 +2023-04-05 23:11:05,621 epoch 12 - iter 1590/2650 - loss 0.04256063 - time (sec): 129.05 - samples/sec: 6790.77 - lr: 0.100000 +2023-04-05 23:11:25,100 epoch 12 - iter 1855/2650 - loss 0.04275237 - time (sec): 148.53 - samples/sec: 6881.81 - lr: 0.100000 +2023-04-05 23:11:45,477 epoch 12 - iter 2120/2650 - loss 0.04285750 - time (sec): 168.91 - samples/sec: 6922.19 - lr: 0.100000 +2023-04-05 23:12:05,261 epoch 12 - iter 2385/2650 - loss 0.04281505 - time (sec): 188.69 - samples/sec: 6971.98 - lr: 0.100000 +2023-04-05 23:12:25,108 epoch 12 - iter 2650/2650 - loss 0.04306715 - time (sec): 208.54 - samples/sec: 7012.39 - lr: 0.100000 +2023-04-05 23:12:25,108 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:12:25,109 EPOCH 12 done: loss 0.0431 - lr 0.100000 +2023-04-05 23:12:25,109 BAD EPOCHS (no improvement): 0 +2023-04-05 23:12:25,111 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:12:44,587 epoch 13 - iter 265/2650 - loss 0.04142773 - time (sec): 19.48 - samples/sec: 7504.99 - lr: 0.100000 +2023-04-05 23:13:04,053 epoch 13 - iter 530/2650 - loss 0.04156061 - time (sec): 38.94 - samples/sec: 7455.74 - lr: 0.100000 +2023-04-05 23:13:24,198 epoch 13 - iter 795/2650 - loss 0.04179977 - time (sec): 59.09 - samples/sec: 7417.48 - lr: 0.100000 +2023-04-05 23:13:44,205 epoch 13 - iter 1060/2650 - loss 0.04148937 - time (sec): 79.09 - samples/sec: 7364.55 - lr: 0.100000 +2023-04-05 23:14:04,428 epoch 13 - iter 1325/2650 - loss 0.04152584 - time (sec): 99.32 - samples/sec: 7355.39 - lr: 0.100000 +2023-04-05 23:14:24,564 epoch 13 - iter 1590/2650 - loss 0.04201696 - time (sec): 119.45 - samples/sec: 7357.53 - lr: 0.100000 +2023-04-05 23:14:44,529 epoch 13 - iter 1855/2650 - loss 0.04233746 - time (sec): 139.42 - samples/sec: 7348.26 - lr: 0.100000 +2023-04-05 23:15:04,002 epoch 13 - iter 2120/2650 - loss 0.04244611 - time (sec): 158.89 - samples/sec: 7359.73 - lr: 0.100000 +2023-04-05 23:15:23,465 epoch 13 - iter 2385/2650 - loss 0.04262677 - time (sec): 178.35 - samples/sec: 7376.37 - lr: 0.100000 +2023-04-05 23:15:43,269 epoch 13 - iter 2650/2650 - loss 0.04272274 - time (sec): 198.16 - samples/sec: 7379.81 - lr: 0.100000 +2023-04-05 23:15:43,269 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:15:43,269 EPOCH 13 done: loss 0.0427 - lr 0.100000 +2023-04-05 23:15:43,269 BAD EPOCHS (no improvement): 0 +2023-04-05 23:15:43,273 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:16:02,785 epoch 14 - iter 265/2650 - loss 0.04040378 - time (sec): 19.51 - samples/sec: 7496.29 - lr: 0.100000 +2023-04-05 23:16:22,612 epoch 14 - iter 530/2650 - loss 0.04051854 - time (sec): 39.34 - samples/sec: 7432.54 - lr: 0.100000 +2023-04-05 23:16:42,152 epoch 14 - iter 795/2650 - loss 0.04045287 - time (sec): 58.88 - samples/sec: 7463.45 - lr: 0.100000 +2023-04-05 23:17:01,779 epoch 14 - iter 1060/2650 - loss 0.04071775 - time (sec): 78.51 - samples/sec: 7444.60 - lr: 0.100000 +2023-04-05 23:17:21,518 epoch 14 - iter 1325/2650 - loss 0.04123238 - time (sec): 98.24 - samples/sec: 7426.64 - lr: 0.100000 +2023-04-05 23:17:41,438 epoch 14 - iter 1590/2650 - loss 0.04129789 - time (sec): 118.16 - samples/sec: 7410.28 - lr: 0.100000 +2023-04-05 23:18:01,440 epoch 14 - iter 1855/2650 - loss 0.04154665 - time (sec): 138.17 - samples/sec: 7389.66 - lr: 0.100000 +2023-04-05 23:18:21,712 epoch 14 - iter 2120/2650 - loss 0.04146642 - time (sec): 158.44 - samples/sec: 7370.57 - lr: 0.100000 +2023-04-05 23:18:41,916 epoch 14 - iter 2385/2650 - loss 0.04167842 - time (sec): 178.64 - samples/sec: 7371.37 - lr: 0.100000 +2023-04-05 23:19:01,361 epoch 14 - iter 2650/2650 - loss 0.04158336 - time (sec): 198.09 - samples/sec: 7382.40 - lr: 0.100000 +2023-04-05 23:19:01,361 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:19:01,362 EPOCH 14 done: loss 0.0416 - lr 0.100000 +2023-04-05 23:19:01,362 BAD EPOCHS (no improvement): 0 +2023-04-05 23:19:01,364 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:19:21,964 epoch 15 - iter 265/2650 - loss 0.04057739 - time (sec): 20.60 - samples/sec: 7215.38 - lr: 0.100000 +2023-04-05 23:19:41,561 epoch 15 - iter 530/2650 - loss 0.04016299 - time (sec): 40.20 - samples/sec: 7292.50 - lr: 0.100000 +2023-04-05 23:20:01,728 epoch 15 - iter 795/2650 - loss 0.04025444 - time (sec): 60.36 - samples/sec: 7290.78 - lr: 0.100000 +2023-04-05 23:20:21,120 epoch 15 - iter 1060/2650 - loss 0.04048143 - time (sec): 79.76 - samples/sec: 7343.57 - lr: 0.100000 +2023-04-05 23:20:40,469 epoch 15 - iter 1325/2650 - loss 0.04087959 - time (sec): 99.10 - samples/sec: 7393.69 - lr: 0.100000 +2023-04-05 23:21:00,293 epoch 15 - iter 1590/2650 - loss 0.04062910 - time (sec): 118.93 - samples/sec: 7378.63 - lr: 0.100000 +2023-04-05 23:21:19,930 epoch 15 - iter 1855/2650 - loss 0.04104456 - time (sec): 138.57 - samples/sec: 7383.22 - lr: 0.100000 +2023-04-05 23:21:39,700 epoch 15 - iter 2120/2650 - loss 0.04109267 - time (sec): 158.34 - samples/sec: 7400.18 - lr: 0.100000 +2023-04-05 23:21:59,117 epoch 15 - iter 2385/2650 - loss 0.04104225 - time (sec): 177.75 - samples/sec: 7413.57 - lr: 0.100000 +2023-04-05 23:22:18,565 epoch 15 - iter 2650/2650 - loss 0.04103241 - time (sec): 197.20 - samples/sec: 7415.62 - lr: 0.100000 +2023-04-05 23:22:18,565 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:22:18,565 EPOCH 15 done: loss 0.0410 - lr 0.100000 +2023-04-05 23:22:18,565 BAD EPOCHS (no improvement): 0 +2023-04-05 23:22:18,568 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:22:38,201 epoch 16 - iter 265/2650 - loss 0.03886402 - time (sec): 19.63 - samples/sec: 7398.21 - lr: 0.100000 +2023-04-05 23:22:58,514 epoch 16 - iter 530/2650 - loss 0.03856798 - time (sec): 39.95 - samples/sec: 7335.67 - lr: 0.100000 +2023-04-05 23:23:17,939 epoch 16 - iter 795/2650 - loss 0.03875860 - time (sec): 59.37 - samples/sec: 7415.29 - lr: 0.100000 +2023-04-05 23:23:37,572 epoch 16 - iter 1060/2650 - loss 0.03930614 - time (sec): 79.00 - samples/sec: 7428.67 - lr: 0.100000 +2023-04-05 23:23:57,815 epoch 16 - iter 1325/2650 - loss 0.03920468 - time (sec): 99.25 - samples/sec: 7404.11 - lr: 0.100000 +2023-04-05 23:24:17,587 epoch 16 - iter 1590/2650 - loss 0.03972817 - time (sec): 119.02 - samples/sec: 7396.41 - lr: 0.100000 +2023-04-05 23:24:37,231 epoch 16 - iter 1855/2650 - loss 0.03969746 - time (sec): 138.66 - samples/sec: 7404.57 - lr: 0.100000 +2023-04-05 23:24:56,968 epoch 16 - iter 2120/2650 - loss 0.03985046 - time (sec): 158.40 - samples/sec: 7401.81 - lr: 0.100000 +2023-04-05 23:25:16,312 epoch 16 - iter 2385/2650 - loss 0.03977147 - time (sec): 177.74 - samples/sec: 7408.41 - lr: 0.100000 +2023-04-05 23:25:36,004 epoch 16 - iter 2650/2650 - loss 0.03978966 - time (sec): 197.44 - samples/sec: 7406.76 - lr: 0.100000 +2023-04-05 23:25:36,005 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:25:36,005 EPOCH 16 done: loss 0.0398 - lr 0.100000 +2023-04-05 23:25:36,005 BAD EPOCHS (no improvement): 0 +2023-04-05 23:25:36,008 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:25:55,680 epoch 17 - iter 265/2650 - loss 0.03893019 - time (sec): 19.67 - samples/sec: 7540.89 - lr: 0.100000 +2023-04-05 23:26:15,159 epoch 17 - iter 530/2650 - loss 0.03896850 - time (sec): 39.15 - samples/sec: 7538.03 - lr: 0.100000 +2023-04-05 23:26:34,992 epoch 17 - iter 795/2650 - loss 0.03868454 - time (sec): 58.98 - samples/sec: 7438.92 - lr: 0.100000 +2023-04-05 23:26:54,357 epoch 17 - iter 1060/2650 - loss 0.03900134 - time (sec): 78.35 - samples/sec: 7468.06 - lr: 0.100000 +2023-04-05 23:27:14,422 epoch 17 - iter 1325/2650 - loss 0.03886878 - time (sec): 98.41 - samples/sec: 7438.71 - lr: 0.100000 +2023-04-05 23:27:34,567 epoch 17 - iter 1590/2650 - loss 0.03908285 - time (sec): 118.56 - samples/sec: 7422.44 - lr: 0.100000 +2023-04-05 23:27:54,046 epoch 17 - iter 1855/2650 - loss 0.03899825 - time (sec): 138.04 - samples/sec: 7426.49 - lr: 0.100000 +2023-04-05 23:28:13,796 epoch 17 - iter 2120/2650 - loss 0.03916759 - time (sec): 157.79 - samples/sec: 7429.28 - lr: 0.100000 +2023-04-05 23:28:33,115 epoch 17 - iter 2385/2650 - loss 0.03939620 - time (sec): 177.11 - samples/sec: 7432.65 - lr: 0.100000 +2023-04-05 23:28:52,933 epoch 17 - iter 2650/2650 - loss 0.03953680 - time (sec): 196.93 - samples/sec: 7425.98 - lr: 0.100000 +2023-04-05 23:28:52,933 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:28:52,933 EPOCH 17 done: loss 0.0395 - lr 0.100000 +2023-04-05 23:28:52,934 BAD EPOCHS (no improvement): 0 +2023-04-05 23:28:52,938 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:29:12,185 epoch 18 - iter 265/2650 - loss 0.03687451 - time (sec): 19.25 - samples/sec: 7619.91 - lr: 0.100000 +2023-04-05 23:29:31,517 epoch 18 - iter 530/2650 - loss 0.03767030 - time (sec): 38.58 - samples/sec: 7536.49 - lr: 0.100000 +2023-04-05 23:29:50,801 epoch 18 - iter 795/2650 - loss 0.03800426 - time (sec): 57.86 - samples/sec: 7543.23 - lr: 0.100000 +2023-04-05 23:30:10,920 epoch 18 - iter 1060/2650 - loss 0.03805599 - time (sec): 77.98 - samples/sec: 7499.18 - lr: 0.100000 +2023-04-05 23:30:30,337 epoch 18 - iter 1325/2650 - loss 0.03840052 - time (sec): 97.40 - samples/sec: 7513.44 - lr: 0.100000 +2023-04-05 23:30:51,052 epoch 18 - iter 1590/2650 - loss 0.03833296 - time (sec): 118.11 - samples/sec: 7421.03 - lr: 0.100000 +2023-04-05 23:31:10,108 epoch 18 - iter 1855/2650 - loss 0.03819256 - time (sec): 137.17 - samples/sec: 7441.23 - lr: 0.100000 +2023-04-05 23:31:29,855 epoch 18 - iter 2120/2650 - loss 0.03839978 - time (sec): 156.92 - samples/sec: 7444.39 - lr: 0.100000 +2023-04-05 23:31:50,005 epoch 18 - iter 2385/2650 - loss 0.03851343 - time (sec): 177.07 - samples/sec: 7429.91 - lr: 0.100000 +2023-04-05 23:32:09,711 epoch 18 - iter 2650/2650 - loss 0.03872445 - time (sec): 196.77 - samples/sec: 7431.71 - lr: 0.100000 +2023-04-05 23:32:09,712 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:32:09,712 EPOCH 18 done: loss 0.0387 - lr 0.100000 +2023-04-05 23:32:09,712 BAD EPOCHS (no improvement): 0 +2023-04-05 23:32:09,715 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:32:30,213 epoch 19 - iter 265/2650 - loss 0.03884484 - time (sec): 20.50 - samples/sec: 7228.96 - lr: 0.100000 +2023-04-05 23:32:50,229 epoch 19 - iter 530/2650 - loss 0.03841242 - time (sec): 40.51 - samples/sec: 7293.71 - lr: 0.100000 +2023-04-05 23:33:10,451 epoch 19 - iter 795/2650 - loss 0.03815781 - time (sec): 60.74 - samples/sec: 7303.40 - lr: 0.100000 +2023-04-05 23:33:30,064 epoch 19 - iter 1060/2650 - loss 0.03750413 - time (sec): 80.35 - samples/sec: 7348.77 - lr: 0.100000 +2023-04-05 23:33:49,691 epoch 19 - iter 1325/2650 - loss 0.03731076 - time (sec): 99.98 - samples/sec: 7362.88 - lr: 0.100000 +2023-04-05 23:34:09,257 epoch 19 - iter 1590/2650 - loss 0.03771377 - time (sec): 119.54 - samples/sec: 7370.16 - lr: 0.100000 +2023-04-05 23:34:28,844 epoch 19 - iter 1855/2650 - loss 0.03810818 - time (sec): 139.13 - samples/sec: 7376.18 - lr: 0.100000 +2023-04-05 23:34:48,041 epoch 19 - iter 2120/2650 - loss 0.03821494 - time (sec): 158.33 - samples/sec: 7397.75 - lr: 0.100000 +2023-04-05 23:35:07,460 epoch 19 - iter 2385/2650 - loss 0.03813717 - time (sec): 177.74 - samples/sec: 7400.15 - lr: 0.100000 +2023-04-05 23:35:26,939 epoch 19 - iter 2650/2650 - loss 0.03823628 - time (sec): 197.22 - samples/sec: 7414.72 - lr: 0.100000 +2023-04-05 23:35:26,940 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:35:26,940 EPOCH 19 done: loss 0.0382 - lr 0.100000 +2023-04-05 23:35:26,940 BAD EPOCHS (no improvement): 0 +2023-04-05 23:35:26,943 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:35:46,625 epoch 20 - iter 265/2650 - loss 0.03559866 - time (sec): 19.68 - samples/sec: 7427.06 - lr: 0.100000 +2023-04-05 23:36:06,472 epoch 20 - iter 530/2650 - loss 0.03592580 - time (sec): 39.53 - samples/sec: 7373.49 - lr: 0.100000 +2023-04-05 23:36:25,896 epoch 20 - iter 795/2650 - loss 0.03698562 - time (sec): 58.95 - samples/sec: 7401.61 - lr: 0.100000 +2023-04-05 23:36:45,925 epoch 20 - iter 1060/2650 - loss 0.03742835 - time (sec): 78.98 - samples/sec: 7369.34 - lr: 0.100000 +2023-04-05 23:37:05,971 epoch 20 - iter 1325/2650 - loss 0.03731818 - time (sec): 99.03 - samples/sec: 7367.01 - lr: 0.100000 +2023-04-05 23:37:25,748 epoch 20 - iter 1590/2650 - loss 0.03746228 - time (sec): 118.80 - samples/sec: 7391.55 - lr: 0.100000 +2023-04-05 23:37:45,220 epoch 20 - iter 1855/2650 - loss 0.03786424 - time (sec): 138.28 - samples/sec: 7404.92 - lr: 0.100000 +2023-04-05 23:38:05,059 epoch 20 - iter 2120/2650 - loss 0.03780190 - time (sec): 158.12 - samples/sec: 7403.73 - lr: 0.100000 +2023-04-05 23:38:24,656 epoch 20 - iter 2385/2650 - loss 0.03783936 - time (sec): 177.71 - samples/sec: 7407.09 - lr: 0.100000 +2023-04-05 23:38:44,500 epoch 20 - iter 2650/2650 - loss 0.03785266 - time (sec): 197.56 - samples/sec: 7402.23 - lr: 0.100000 +2023-04-05 23:38:44,500 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:38:44,500 EPOCH 20 done: loss 0.0379 - lr 0.100000 +2023-04-05 23:38:44,501 BAD EPOCHS (no improvement): 0 +2023-04-05 23:38:44,504 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:39:04,676 epoch 21 - iter 265/2650 - loss 0.03780550 - time (sec): 20.17 - samples/sec: 7322.75 - lr: 0.100000 +2023-04-05 23:39:24,449 epoch 21 - iter 530/2650 - loss 0.03773684 - time (sec): 39.95 - samples/sec: 7384.12 - lr: 0.100000 +2023-04-05 23:39:43,861 epoch 21 - iter 795/2650 - loss 0.03737256 - time (sec): 59.36 - samples/sec: 7420.77 - lr: 0.100000 +2023-04-05 23:40:03,746 epoch 21 - iter 1060/2650 - loss 0.03715455 - time (sec): 79.24 - samples/sec: 7376.67 - lr: 0.100000 +2023-04-05 23:40:23,344 epoch 21 - iter 1325/2650 - loss 0.03741216 - time (sec): 98.84 - samples/sec: 7389.94 - lr: 0.100000 +2023-04-05 23:40:43,239 epoch 21 - iter 1590/2650 - loss 0.03731411 - time (sec): 118.74 - samples/sec: 7394.94 - lr: 0.100000 +2023-04-05 23:41:03,529 epoch 21 - iter 1855/2650 - loss 0.03728695 - time (sec): 139.03 - samples/sec: 7374.52 - lr: 0.100000 +2023-04-05 23:41:22,750 epoch 21 - iter 2120/2650 - loss 0.03712129 - time (sec): 158.25 - samples/sec: 7393.62 - lr: 0.100000 +2023-04-05 23:41:42,544 epoch 21 - iter 2385/2650 - loss 0.03749829 - time (sec): 178.04 - samples/sec: 7395.76 - lr: 0.100000 +2023-04-05 23:42:02,045 epoch 21 - iter 2650/2650 - loss 0.03747642 - time (sec): 197.54 - samples/sec: 7402.82 - lr: 0.100000 +2023-04-05 23:42:02,045 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:42:02,046 EPOCH 21 done: loss 0.0375 - lr 0.100000 +2023-04-05 23:42:02,046 BAD EPOCHS (no improvement): 0 +2023-04-05 23:42:02,049 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:42:22,281 epoch 22 - iter 265/2650 - loss 0.03542972 - time (sec): 20.23 - samples/sec: 7319.59 - lr: 0.100000 +2023-04-05 23:42:41,503 epoch 22 - iter 530/2650 - loss 0.03599258 - time (sec): 39.45 - samples/sec: 7424.71 - lr: 0.100000 +2023-04-05 23:43:01,282 epoch 22 - iter 795/2650 - loss 0.03656613 - time (sec): 59.23 - samples/sec: 7434.62 - lr: 0.100000 +2023-04-05 23:43:20,772 epoch 22 - iter 1060/2650 - loss 0.03682889 - time (sec): 78.72 - samples/sec: 7457.28 - lr: 0.100000 +2023-04-05 23:43:40,627 epoch 22 - iter 1325/2650 - loss 0.03685723 - time (sec): 98.58 - samples/sec: 7419.84 - lr: 0.100000 +2023-04-05 23:43:59,838 epoch 22 - iter 1590/2650 - loss 0.03704254 - time (sec): 117.79 - samples/sec: 7440.78 - lr: 0.100000 +2023-04-05 23:44:19,305 epoch 22 - iter 1855/2650 - loss 0.03718383 - time (sec): 137.26 - samples/sec: 7442.92 - lr: 0.100000 +2023-04-05 23:44:40,018 epoch 22 - iter 2120/2650 - loss 0.03723118 - time (sec): 157.97 - samples/sec: 7418.12 - lr: 0.100000 +2023-04-05 23:44:59,794 epoch 22 - iter 2385/2650 - loss 0.03714435 - time (sec): 177.75 - samples/sec: 7410.37 - lr: 0.100000 +2023-04-05 23:45:19,182 epoch 22 - iter 2650/2650 - loss 0.03707664 - time (sec): 197.13 - samples/sec: 7418.17 - lr: 0.100000 +2023-04-05 23:45:19,182 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:45:19,182 EPOCH 22 done: loss 0.0371 - lr 0.100000 +2023-04-05 23:45:19,182 BAD EPOCHS (no improvement): 0 +2023-04-05 23:45:19,185 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:45:38,701 epoch 23 - iter 265/2650 - loss 0.03629860 - time (sec): 19.52 - samples/sec: 7507.41 - lr: 0.100000 +2023-04-05 23:45:58,284 epoch 23 - iter 530/2650 - loss 0.03570194 - time (sec): 39.10 - samples/sec: 7512.79 - lr: 0.100000 +2023-04-05 23:46:18,368 epoch 23 - iter 795/2650 - loss 0.03589799 - time (sec): 59.18 - samples/sec: 7438.25 - lr: 0.100000 +2023-04-05 23:46:37,983 epoch 23 - iter 1060/2650 - loss 0.03606682 - time (sec): 78.80 - samples/sec: 7447.06 - lr: 0.100000 +2023-04-05 23:46:57,667 epoch 23 - iter 1325/2650 - loss 0.03658331 - time (sec): 98.48 - samples/sec: 7453.84 - lr: 0.100000 +2023-04-05 23:47:17,796 epoch 23 - iter 1590/2650 - loss 0.03661517 - time (sec): 118.61 - samples/sec: 7429.45 - lr: 0.100000 +2023-04-05 23:47:37,456 epoch 23 - iter 1855/2650 - loss 0.03669495 - time (sec): 138.27 - samples/sec: 7419.77 - lr: 0.100000 +2023-04-05 23:47:57,066 epoch 23 - iter 2120/2650 - loss 0.03664858 - time (sec): 157.88 - samples/sec: 7419.55 - lr: 0.100000 +2023-04-05 23:48:17,484 epoch 23 - iter 2385/2650 - loss 0.03688217 - time (sec): 178.30 - samples/sec: 7390.99 - lr: 0.100000 +2023-04-05 23:48:36,859 epoch 23 - iter 2650/2650 - loss 0.03685770 - time (sec): 197.67 - samples/sec: 7397.86 - lr: 0.100000 +2023-04-05 23:48:36,859 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:48:36,859 EPOCH 23 done: loss 0.0369 - lr 0.100000 +2023-04-05 23:48:36,859 BAD EPOCHS (no improvement): 0 +2023-04-05 23:48:36,862 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:48:56,710 epoch 24 - iter 265/2650 - loss 0.03582443 - time (sec): 19.85 - samples/sec: 7340.07 - lr: 0.100000 +2023-04-05 23:49:16,397 epoch 24 - iter 530/2650 - loss 0.03522920 - time (sec): 39.54 - samples/sec: 7350.19 - lr: 0.100000 +2023-04-05 23:49:36,260 epoch 24 - iter 795/2650 - loss 0.03538745 - time (sec): 59.40 - samples/sec: 7383.65 - lr: 0.100000 +2023-04-05 23:49:55,638 epoch 24 - iter 1060/2650 - loss 0.03577330 - time (sec): 78.78 - samples/sec: 7421.88 - lr: 0.100000 +2023-04-05 23:50:15,480 epoch 24 - iter 1325/2650 - loss 0.03569175 - time (sec): 98.62 - samples/sec: 7421.43 - lr: 0.100000 +2023-04-05 23:50:35,563 epoch 24 - iter 1590/2650 - loss 0.03568417 - time (sec): 118.70 - samples/sec: 7399.17 - lr: 0.100000 +2023-04-05 23:50:55,454 epoch 24 - iter 1855/2650 - loss 0.03568288 - time (sec): 138.59 - samples/sec: 7399.89 - lr: 0.100000 +2023-04-05 23:51:15,381 epoch 24 - iter 2120/2650 - loss 0.03589099 - time (sec): 158.52 - samples/sec: 7390.31 - lr: 0.100000 +2023-04-05 23:51:35,169 epoch 24 - iter 2385/2650 - loss 0.03586016 - time (sec): 178.31 - samples/sec: 7392.10 - lr: 0.100000 +2023-04-05 23:51:54,542 epoch 24 - iter 2650/2650 - loss 0.03589277 - time (sec): 197.68 - samples/sec: 7397.63 - lr: 0.100000 +2023-04-05 23:51:54,542 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:51:54,542 EPOCH 24 done: loss 0.0359 - lr 0.100000 +2023-04-05 23:51:54,542 BAD EPOCHS (no improvement): 0 +2023-04-05 23:51:54,545 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:52:13,903 epoch 25 - iter 265/2650 - loss 0.03532779 - time (sec): 19.36 - samples/sec: 7481.79 - lr: 0.100000 +2023-04-05 23:52:33,772 epoch 25 - iter 530/2650 - loss 0.03500281 - time (sec): 39.23 - samples/sec: 7403.86 - lr: 0.100000 +2023-04-05 23:52:54,198 epoch 25 - iter 795/2650 - loss 0.03495293 - time (sec): 59.65 - samples/sec: 7327.61 - lr: 0.100000 +2023-04-05 23:53:13,691 epoch 25 - iter 1060/2650 - loss 0.03498747 - time (sec): 79.15 - samples/sec: 7358.93 - lr: 0.100000 +2023-04-05 23:53:33,806 epoch 25 - iter 1325/2650 - loss 0.03532740 - time (sec): 99.26 - samples/sec: 7345.66 - lr: 0.100000 +2023-04-05 23:53:53,645 epoch 25 - iter 1590/2650 - loss 0.03542241 - time (sec): 119.10 - samples/sec: 7362.68 - lr: 0.100000 +2023-04-05 23:54:13,488 epoch 25 - iter 1855/2650 - loss 0.03538326 - time (sec): 138.94 - samples/sec: 7371.29 - lr: 0.100000 +2023-04-05 23:54:33,354 epoch 25 - iter 2120/2650 - loss 0.03549279 - time (sec): 158.81 - samples/sec: 7367.08 - lr: 0.100000 +2023-04-05 23:54:53,339 epoch 25 - iter 2385/2650 - loss 0.03574900 - time (sec): 178.79 - samples/sec: 7362.93 - lr: 0.100000 +2023-04-05 23:55:12,630 epoch 25 - iter 2650/2650 - loss 0.03580619 - time (sec): 198.08 - samples/sec: 7382.53 - lr: 0.100000 +2023-04-05 23:55:12,630 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:55:12,630 EPOCH 25 done: loss 0.0358 - lr 0.100000 +2023-04-05 23:55:12,630 BAD EPOCHS (no improvement): 0 +2023-04-05 23:55:12,637 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:55:31,770 epoch 26 - iter 265/2650 - loss 0.03350377 - time (sec): 19.13 - samples/sec: 7516.35 - lr: 0.100000 +2023-04-05 23:55:52,193 epoch 26 - iter 530/2650 - loss 0.03394008 - time (sec): 39.56 - samples/sec: 7342.59 - lr: 0.100000 +2023-04-05 23:56:11,865 epoch 26 - iter 795/2650 - loss 0.03414596 - time (sec): 59.23 - samples/sec: 7388.13 - lr: 0.100000 +2023-04-05 23:56:31,649 epoch 26 - iter 1060/2650 - loss 0.03446851 - time (sec): 79.01 - samples/sec: 7393.17 - lr: 0.100000 +2023-04-05 23:56:51,450 epoch 26 - iter 1325/2650 - loss 0.03429756 - time (sec): 98.81 - samples/sec: 7400.81 - lr: 0.100000 +2023-04-05 23:57:11,456 epoch 26 - iter 1590/2650 - loss 0.03468016 - time (sec): 118.82 - samples/sec: 7395.33 - lr: 0.100000 +2023-04-05 23:57:30,771 epoch 26 - iter 1855/2650 - loss 0.03473978 - time (sec): 138.13 - samples/sec: 7410.69 - lr: 0.100000 +2023-04-05 23:57:50,563 epoch 26 - iter 2120/2650 - loss 0.03505711 - time (sec): 157.93 - samples/sec: 7404.82 - lr: 0.100000 +2023-04-05 23:58:10,762 epoch 26 - iter 2385/2650 - loss 0.03506223 - time (sec): 178.12 - samples/sec: 7392.84 - lr: 0.100000 +2023-04-05 23:58:30,277 epoch 26 - iter 2650/2650 - loss 0.03529119 - time (sec): 197.64 - samples/sec: 7399.12 - lr: 0.100000 +2023-04-05 23:58:30,278 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:58:30,278 EPOCH 26 done: loss 0.0353 - lr 0.100000 +2023-04-05 23:58:30,278 BAD EPOCHS (no improvement): 0 +2023-04-05 23:58:30,281 ---------------------------------------------------------------------------------------------------- +2023-04-05 23:58:50,314 epoch 27 - iter 265/2650 - loss 0.03362257 - time (sec): 20.03 - samples/sec: 7335.13 - lr: 0.100000 +2023-04-05 23:59:09,741 epoch 27 - iter 530/2650 - loss 0.03399168 - time (sec): 39.46 - samples/sec: 7402.14 - lr: 0.100000 +2023-04-05 23:59:28,948 epoch 27 - iter 795/2650 - loss 0.03460693 - time (sec): 58.67 - samples/sec: 7446.46 - lr: 0.100000 +2023-04-05 23:59:48,994 epoch 27 - iter 1060/2650 - loss 0.03505005 - time (sec): 78.71 - samples/sec: 7412.61 - lr: 0.100000 +2023-04-06 00:00:08,569 epoch 27 - iter 1325/2650 - loss 0.03510471 - time (sec): 98.29 - samples/sec: 7420.29 - lr: 0.100000 +2023-04-06 00:00:28,359 epoch 27 - iter 1590/2650 - loss 0.03527188 - time (sec): 118.08 - samples/sec: 7422.11 - lr: 0.100000 +2023-04-06 00:00:47,938 epoch 27 - iter 1855/2650 - loss 0.03541833 - time (sec): 137.66 - samples/sec: 7426.88 - lr: 0.100000 +2023-04-06 00:01:08,114 epoch 27 - iter 2120/2650 - loss 0.03580167 - time (sec): 157.83 - samples/sec: 7414.12 - lr: 0.100000 +2023-04-06 00:01:28,076 epoch 27 - iter 2385/2650 - loss 0.03578883 - time (sec): 177.79 - samples/sec: 7404.56 - lr: 0.100000 +2023-04-06 00:01:57,476 epoch 27 - iter 2650/2650 - loss 0.03560065 - time (sec): 207.19 - samples/sec: 7057.91 - lr: 0.100000 +2023-04-06 00:01:57,476 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:01:57,476 EPOCH 27 done: loss 0.0356 - lr 0.100000 +2023-04-06 00:01:57,476 BAD EPOCHS (no improvement): 1 +2023-04-06 00:01:57,479 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:02:16,947 epoch 28 - iter 265/2650 - loss 0.03376720 - time (sec): 19.47 - samples/sec: 7429.25 - lr: 0.100000 +2023-04-06 00:02:36,633 epoch 28 - iter 530/2650 - loss 0.03468018 - time (sec): 39.15 - samples/sec: 7448.92 - lr: 0.100000 +2023-04-06 00:02:55,960 epoch 28 - iter 795/2650 - loss 0.03445018 - time (sec): 58.48 - samples/sec: 7474.34 - lr: 0.100000 +2023-04-06 00:03:16,013 epoch 28 - iter 1060/2650 - loss 0.03433266 - time (sec): 78.53 - samples/sec: 7424.46 - lr: 0.100000 +2023-04-06 00:03:35,844 epoch 28 - iter 1325/2650 - loss 0.03452301 - time (sec): 98.36 - samples/sec: 7411.61 - lr: 0.100000 +2023-04-06 00:03:55,088 epoch 28 - iter 1590/2650 - loss 0.03439093 - time (sec): 117.61 - samples/sec: 7437.60 - lr: 0.100000 +2023-04-06 00:04:15,301 epoch 28 - iter 1855/2650 - loss 0.03466075 - time (sec): 137.82 - samples/sec: 7412.01 - lr: 0.100000 +2023-04-06 00:04:34,590 epoch 28 - iter 2120/2650 - loss 0.03459712 - time (sec): 157.11 - samples/sec: 7427.12 - lr: 0.100000 +2023-04-06 00:04:54,572 epoch 28 - iter 2385/2650 - loss 0.03479347 - time (sec): 177.09 - samples/sec: 7422.76 - lr: 0.100000 +2023-04-06 00:05:14,650 epoch 28 - iter 2650/2650 - loss 0.03491241 - time (sec): 197.17 - samples/sec: 7416.73 - lr: 0.100000 +2023-04-06 00:05:14,650 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:05:14,650 EPOCH 28 done: loss 0.0349 - lr 0.100000 +2023-04-06 00:05:14,650 BAD EPOCHS (no improvement): 0 +2023-04-06 00:05:14,657 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:05:34,405 epoch 29 - iter 265/2650 - loss 0.03520691 - time (sec): 19.75 - samples/sec: 7415.80 - lr: 0.100000 +2023-04-06 00:05:54,041 epoch 29 - iter 530/2650 - loss 0.03489647 - time (sec): 39.38 - samples/sec: 7421.36 - lr: 0.100000 +2023-04-06 00:06:13,849 epoch 29 - iter 795/2650 - loss 0.03457302 - time (sec): 59.19 - samples/sec: 7402.64 - lr: 0.100000 +2023-04-06 00:06:33,926 epoch 29 - iter 1060/2650 - loss 0.03435361 - time (sec): 79.27 - samples/sec: 7342.94 - lr: 0.100000 +2023-04-06 00:06:53,579 epoch 29 - iter 1325/2650 - loss 0.03411601 - time (sec): 98.92 - samples/sec: 7378.13 - lr: 0.100000 +2023-04-06 00:07:13,193 epoch 29 - iter 1590/2650 - loss 0.03390079 - time (sec): 118.54 - samples/sec: 7392.69 - lr: 0.100000 +2023-04-06 00:07:33,217 epoch 29 - iter 1855/2650 - loss 0.03380149 - time (sec): 138.56 - samples/sec: 7387.28 - lr: 0.100000 +2023-04-06 00:07:52,877 epoch 29 - iter 2120/2650 - loss 0.03393107 - time (sec): 158.22 - samples/sec: 7394.75 - lr: 0.100000 +2023-04-06 00:08:12,973 epoch 29 - iter 2385/2650 - loss 0.03424095 - time (sec): 178.32 - samples/sec: 7382.56 - lr: 0.100000 +2023-04-06 00:08:32,548 epoch 29 - iter 2650/2650 - loss 0.03451294 - time (sec): 197.89 - samples/sec: 7389.77 - lr: 0.100000 +2023-04-06 00:08:32,548 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:08:32,548 EPOCH 29 done: loss 0.0345 - lr 0.100000 +2023-04-06 00:08:32,548 BAD EPOCHS (no improvement): 0 +2023-04-06 00:08:32,552 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:08:52,996 epoch 30 - iter 265/2650 - loss 0.03395257 - time (sec): 20.44 - samples/sec: 7169.77 - lr: 0.100000 +2023-04-06 00:09:12,646 epoch 30 - iter 530/2650 - loss 0.03399807 - time (sec): 40.09 - samples/sec: 7309.66 - lr: 0.100000 +2023-04-06 00:09:32,149 epoch 30 - iter 795/2650 - loss 0.03387434 - time (sec): 59.60 - samples/sec: 7379.49 - lr: 0.100000 +2023-04-06 00:09:51,642 epoch 30 - iter 1060/2650 - loss 0.03376718 - time (sec): 79.09 - samples/sec: 7394.78 - lr: 0.100000 +2023-04-06 00:10:10,841 epoch 30 - iter 1325/2650 - loss 0.03378417 - time (sec): 98.29 - samples/sec: 7418.95 - lr: 0.100000 +2023-04-06 00:10:30,969 epoch 30 - iter 1590/2650 - loss 0.03420691 - time (sec): 118.42 - samples/sec: 7412.24 - lr: 0.100000 +2023-04-06 00:10:51,481 epoch 30 - iter 1855/2650 - loss 0.03415484 - time (sec): 138.93 - samples/sec: 7380.61 - lr: 0.100000 +2023-04-06 00:11:11,685 epoch 30 - iter 2120/2650 - loss 0.03428628 - time (sec): 159.13 - samples/sec: 7362.62 - lr: 0.100000 +2023-04-06 00:11:30,571 epoch 30 - iter 2385/2650 - loss 0.03438469 - time (sec): 178.02 - samples/sec: 7396.79 - lr: 0.100000 +2023-04-06 00:11:49,934 epoch 30 - iter 2650/2650 - loss 0.03446056 - time (sec): 197.38 - samples/sec: 7408.81 - lr: 0.100000 +2023-04-06 00:11:49,934 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:11:49,934 EPOCH 30 done: loss 0.0345 - lr 0.100000 +2023-04-06 00:11:49,934 BAD EPOCHS (no improvement): 0 +2023-04-06 00:11:49,937 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:12:09,552 epoch 31 - iter 265/2650 - loss 0.03284975 - time (sec): 19.62 - samples/sec: 7446.77 - lr: 0.100000 +2023-04-06 00:12:28,505 epoch 31 - iter 530/2650 - loss 0.03379530 - time (sec): 38.57 - samples/sec: 7525.61 - lr: 0.100000 +2023-04-06 00:12:48,101 epoch 31 - iter 795/2650 - loss 0.03398737 - time (sec): 58.16 - samples/sec: 7500.71 - lr: 0.100000 +2023-04-06 00:13:07,682 epoch 31 - iter 1060/2650 - loss 0.03362497 - time (sec): 77.75 - samples/sec: 7482.14 - lr: 0.100000 +2023-04-06 00:13:27,001 epoch 31 - iter 1325/2650 - loss 0.03324185 - time (sec): 97.06 - samples/sec: 7503.81 - lr: 0.100000 +2023-04-06 00:13:46,356 epoch 31 - iter 1590/2650 - loss 0.03352791 - time (sec): 116.42 - samples/sec: 7511.85 - lr: 0.100000 +2023-04-06 00:14:06,553 epoch 31 - iter 1855/2650 - loss 0.03357960 - time (sec): 136.62 - samples/sec: 7488.90 - lr: 0.100000 +2023-04-06 00:14:26,798 epoch 31 - iter 2120/2650 - loss 0.03383146 - time (sec): 156.86 - samples/sec: 7456.87 - lr: 0.100000 +2023-04-06 00:14:46,232 epoch 31 - iter 2385/2650 - loss 0.03383897 - time (sec): 176.29 - samples/sec: 7458.15 - lr: 0.100000 +2023-04-06 00:15:06,225 epoch 31 - iter 2650/2650 - loss 0.03414900 - time (sec): 196.29 - samples/sec: 7450.11 - lr: 0.100000 +2023-04-06 00:15:06,225 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:15:06,225 EPOCH 31 done: loss 0.0341 - lr 0.100000 +2023-04-06 00:15:06,225 BAD EPOCHS (no improvement): 0 +2023-04-06 00:15:06,228 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:15:26,099 epoch 32 - iter 265/2650 - loss 0.03147212 - time (sec): 19.87 - samples/sec: 7409.54 - lr: 0.100000 +2023-04-06 00:15:45,471 epoch 32 - iter 530/2650 - loss 0.03254038 - time (sec): 39.24 - samples/sec: 7419.60 - lr: 0.100000 +2023-04-06 00:16:05,580 epoch 32 - iter 795/2650 - loss 0.03283877 - time (sec): 59.35 - samples/sec: 7386.18 - lr: 0.100000 +2023-04-06 00:16:25,099 epoch 32 - iter 1060/2650 - loss 0.03341404 - time (sec): 78.87 - samples/sec: 7401.66 - lr: 0.100000 +2023-04-06 00:16:44,253 epoch 32 - iter 1325/2650 - loss 0.03331500 - time (sec): 98.02 - samples/sec: 7437.30 - lr: 0.100000 +2023-04-06 00:17:04,537 epoch 32 - iter 1590/2650 - loss 0.03321410 - time (sec): 118.31 - samples/sec: 7414.28 - lr: 0.100000 +2023-04-06 00:17:24,099 epoch 32 - iter 1855/2650 - loss 0.03327462 - time (sec): 137.87 - samples/sec: 7426.39 - lr: 0.100000 +2023-04-06 00:17:43,875 epoch 32 - iter 2120/2650 - loss 0.03345272 - time (sec): 157.65 - samples/sec: 7427.04 - lr: 0.100000 +2023-04-06 00:18:04,089 epoch 32 - iter 2385/2650 - loss 0.03349502 - time (sec): 177.86 - samples/sec: 7405.32 - lr: 0.100000 +2023-04-06 00:18:23,777 epoch 32 - iter 2650/2650 - loss 0.03352724 - time (sec): 197.55 - samples/sec: 7402.55 - lr: 0.100000 +2023-04-06 00:18:23,777 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:18:23,777 EPOCH 32 done: loss 0.0335 - lr 0.100000 +2023-04-06 00:18:23,777 BAD EPOCHS (no improvement): 0 +2023-04-06 00:18:23,781 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:18:43,620 epoch 33 - iter 265/2650 - loss 0.03293303 - time (sec): 19.84 - samples/sec: 7451.97 - lr: 0.100000 +2023-04-06 00:19:04,013 epoch 33 - iter 530/2650 - loss 0.03251799 - time (sec): 40.23 - samples/sec: 7300.16 - lr: 0.100000 +2023-04-06 00:19:23,642 epoch 33 - iter 795/2650 - loss 0.03294772 - time (sec): 59.86 - samples/sec: 7345.09 - lr: 0.100000 +2023-04-06 00:19:42,895 epoch 33 - iter 1060/2650 - loss 0.03348348 - time (sec): 79.11 - samples/sec: 7409.27 - lr: 0.100000 +2023-04-06 00:20:02,713 epoch 33 - iter 1325/2650 - loss 0.03377057 - time (sec): 98.93 - samples/sec: 7403.47 - lr: 0.100000 +2023-04-06 00:20:21,899 epoch 33 - iter 1590/2650 - loss 0.03371583 - time (sec): 118.12 - samples/sec: 7436.49 - lr: 0.100000 +2023-04-06 00:20:41,457 epoch 33 - iter 1855/2650 - loss 0.03416892 - time (sec): 137.68 - samples/sec: 7427.54 - lr: 0.100000 +2023-04-06 00:21:01,231 epoch 33 - iter 2120/2650 - loss 0.03417072 - time (sec): 157.45 - samples/sec: 7428.38 - lr: 0.100000 +2023-04-06 00:21:21,101 epoch 33 - iter 2385/2650 - loss 0.03407835 - time (sec): 177.32 - samples/sec: 7423.52 - lr: 0.100000 +2023-04-06 00:21:40,710 epoch 33 - iter 2650/2650 - loss 0.03383043 - time (sec): 196.93 - samples/sec: 7425.85 - lr: 0.100000 +2023-04-06 00:21:40,711 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:21:40,711 EPOCH 33 done: loss 0.0338 - lr 0.100000 +2023-04-06 00:21:40,711 BAD EPOCHS (no improvement): 1 +2023-04-06 00:21:40,714 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:22:00,161 epoch 34 - iter 265/2650 - loss 0.03278319 - time (sec): 19.45 - samples/sec: 7497.91 - lr: 0.100000 +2023-04-06 00:22:19,630 epoch 34 - iter 530/2650 - loss 0.03157491 - time (sec): 38.92 - samples/sec: 7545.00 - lr: 0.100000 +2023-04-06 00:22:39,592 epoch 34 - iter 795/2650 - loss 0.03197803 - time (sec): 58.88 - samples/sec: 7480.62 - lr: 0.100000 +2023-04-06 00:22:59,215 epoch 34 - iter 1060/2650 - loss 0.03199495 - time (sec): 78.50 - samples/sec: 7443.87 - lr: 0.100000 +2023-04-06 00:23:19,204 epoch 34 - iter 1325/2650 - loss 0.03200690 - time (sec): 98.49 - samples/sec: 7428.28 - lr: 0.100000 +2023-04-06 00:23:39,422 epoch 34 - iter 1590/2650 - loss 0.03210826 - time (sec): 118.71 - samples/sec: 7404.68 - lr: 0.100000 +2023-04-06 00:23:58,385 epoch 34 - iter 1855/2650 - loss 0.03260764 - time (sec): 137.67 - samples/sec: 7425.00 - lr: 0.100000 +2023-04-06 00:24:17,848 epoch 34 - iter 2120/2650 - loss 0.03303662 - time (sec): 157.13 - samples/sec: 7435.83 - lr: 0.100000 +2023-04-06 00:24:37,227 epoch 34 - iter 2385/2650 - loss 0.03309589 - time (sec): 176.51 - samples/sec: 7454.00 - lr: 0.100000 +2023-04-06 00:24:57,498 epoch 34 - iter 2650/2650 - loss 0.03331709 - time (sec): 196.78 - samples/sec: 7431.32 - lr: 0.100000 +2023-04-06 00:24:57,498 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:24:57,498 EPOCH 34 done: loss 0.0333 - lr 0.100000 +2023-04-06 00:24:57,498 BAD EPOCHS (no improvement): 0 +2023-04-06 00:24:57,502 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:25:16,904 epoch 35 - iter 265/2650 - loss 0.03371517 - time (sec): 19.40 - samples/sec: 7495.97 - lr: 0.100000 +2023-04-06 00:25:36,441 epoch 35 - iter 530/2650 - loss 0.03327525 - time (sec): 38.94 - samples/sec: 7496.87 - lr: 0.100000 +2023-04-06 00:25:56,859 epoch 35 - iter 795/2650 - loss 0.03318869 - time (sec): 59.36 - samples/sec: 7395.84 - lr: 0.100000 +2023-04-06 00:26:15,956 epoch 35 - iter 1060/2650 - loss 0.03318483 - time (sec): 78.45 - samples/sec: 7456.93 - lr: 0.100000 +2023-04-06 00:26:35,646 epoch 35 - iter 1325/2650 - loss 0.03278300 - time (sec): 98.14 - samples/sec: 7448.75 - lr: 0.100000 +2023-04-06 00:26:55,552 epoch 35 - iter 1590/2650 - loss 0.03281379 - time (sec): 118.05 - samples/sec: 7430.99 - lr: 0.100000 +2023-04-06 00:27:15,148 epoch 35 - iter 1855/2650 - loss 0.03312041 - time (sec): 137.65 - samples/sec: 7441.62 - lr: 0.100000 +2023-04-06 00:27:34,639 epoch 35 - iter 2120/2650 - loss 0.03325428 - time (sec): 157.14 - samples/sec: 7452.69 - lr: 0.100000 +2023-04-06 00:27:54,506 epoch 35 - iter 2385/2650 - loss 0.03341533 - time (sec): 177.00 - samples/sec: 7436.04 - lr: 0.100000 +2023-04-06 00:28:14,146 epoch 35 - iter 2650/2650 - loss 0.03334312 - time (sec): 196.64 - samples/sec: 7436.61 - lr: 0.100000 +2023-04-06 00:28:14,146 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:28:14,146 EPOCH 35 done: loss 0.0333 - lr 0.100000 +2023-04-06 00:28:14,146 BAD EPOCHS (no improvement): 1 +2023-04-06 00:28:14,150 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:28:33,897 epoch 36 - iter 265/2650 - loss 0.03222855 - time (sec): 19.75 - samples/sec: 7394.01 - lr: 0.100000 +2023-04-06 00:28:53,926 epoch 36 - iter 530/2650 - loss 0.03294347 - time (sec): 39.78 - samples/sec: 7367.28 - lr: 0.100000 +2023-04-06 00:29:13,800 epoch 36 - iter 795/2650 - loss 0.03294840 - time (sec): 59.65 - samples/sec: 7354.79 - lr: 0.100000 +2023-04-06 00:29:33,708 epoch 36 - iter 1060/2650 - loss 0.03310192 - time (sec): 79.56 - samples/sec: 7363.33 - lr: 0.100000 +2023-04-06 00:29:53,294 epoch 36 - iter 1325/2650 - loss 0.03333328 - time (sec): 99.14 - samples/sec: 7384.62 - lr: 0.100000 +2023-04-06 00:30:13,575 epoch 36 - iter 1590/2650 - loss 0.03332831 - time (sec): 119.42 - samples/sec: 7355.71 - lr: 0.100000 +2023-04-06 00:30:33,209 epoch 36 - iter 1855/2650 - loss 0.03327820 - time (sec): 139.06 - samples/sec: 7379.34 - lr: 0.100000 +2023-04-06 00:30:52,698 epoch 36 - iter 2120/2650 - loss 0.03324384 - time (sec): 158.55 - samples/sec: 7384.65 - lr: 0.100000 +2023-04-06 00:31:12,092 epoch 36 - iter 2385/2650 - loss 0.03315761 - time (sec): 177.94 - samples/sec: 7399.17 - lr: 0.100000 +2023-04-06 00:31:31,774 epoch 36 - iter 2650/2650 - loss 0.03329781 - time (sec): 197.62 - samples/sec: 7399.72 - lr: 0.100000 +2023-04-06 00:31:31,775 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:31:31,775 EPOCH 36 done: loss 0.0333 - lr 0.100000 +2023-04-06 00:31:31,775 BAD EPOCHS (no improvement): 0 +2023-04-06 00:31:31,779 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:31:51,300 epoch 37 - iter 265/2650 - loss 0.03098230 - time (sec): 19.52 - samples/sec: 7518.36 - lr: 0.100000 +2023-04-06 00:32:11,094 epoch 37 - iter 530/2650 - loss 0.03164831 - time (sec): 39.32 - samples/sec: 7465.97 - lr: 0.100000 +2023-04-06 00:32:31,379 epoch 37 - iter 795/2650 - loss 0.03213314 - time (sec): 59.60 - samples/sec: 7383.20 - lr: 0.100000 +2023-04-06 00:32:51,399 epoch 37 - iter 1060/2650 - loss 0.03273908 - time (sec): 79.62 - samples/sec: 7355.85 - lr: 0.100000 +2023-04-06 00:33:10,812 epoch 37 - iter 1325/2650 - loss 0.03233362 - time (sec): 99.03 - samples/sec: 7380.96 - lr: 0.100000 +2023-04-06 00:33:30,381 epoch 37 - iter 1590/2650 - loss 0.03244750 - time (sec): 118.60 - samples/sec: 7388.45 - lr: 0.100000 +2023-04-06 00:33:50,354 epoch 37 - iter 1855/2650 - loss 0.03242242 - time (sec): 138.58 - samples/sec: 7385.99 - lr: 0.100000 +2023-04-06 00:34:10,547 epoch 37 - iter 2120/2650 - loss 0.03220163 - time (sec): 158.77 - samples/sec: 7379.11 - lr: 0.100000 +2023-04-06 00:34:29,902 epoch 37 - iter 2385/2650 - loss 0.03234543 - time (sec): 178.12 - samples/sec: 7393.21 - lr: 0.100000 +2023-04-06 00:34:49,528 epoch 37 - iter 2650/2650 - loss 0.03254981 - time (sec): 197.75 - samples/sec: 7395.03 - lr: 0.100000 +2023-04-06 00:34:49,529 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:34:49,529 EPOCH 37 done: loss 0.0325 - lr 0.100000 +2023-04-06 00:34:49,529 BAD EPOCHS (no improvement): 0 +2023-04-06 00:34:49,532 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:35:09,720 epoch 38 - iter 265/2650 - loss 0.03299786 - time (sec): 20.19 - samples/sec: 7313.39 - lr: 0.100000 +2023-04-06 00:35:29,227 epoch 38 - iter 530/2650 - loss 0.03246811 - time (sec): 39.70 - samples/sec: 7404.89 - lr: 0.100000 +2023-04-06 00:35:49,251 epoch 38 - iter 795/2650 - loss 0.03282325 - time (sec): 59.72 - samples/sec: 7357.62 - lr: 0.100000 +2023-04-06 00:36:08,965 epoch 38 - iter 1060/2650 - loss 0.03258656 - time (sec): 79.43 - samples/sec: 7367.71 - lr: 0.100000 +2023-04-06 00:36:28,845 epoch 38 - iter 1325/2650 - loss 0.03257285 - time (sec): 99.31 - samples/sec: 7374.48 - lr: 0.100000 +2023-04-06 00:36:48,700 epoch 38 - iter 1590/2650 - loss 0.03260684 - time (sec): 119.17 - samples/sec: 7375.71 - lr: 0.100000 +2023-04-06 00:37:08,370 epoch 38 - iter 1855/2650 - loss 0.03263233 - time (sec): 138.84 - samples/sec: 7379.81 - lr: 0.100000 +2023-04-06 00:37:27,968 epoch 38 - iter 2120/2650 - loss 0.03250047 - time (sec): 158.44 - samples/sec: 7385.57 - lr: 0.100000 +2023-04-06 00:37:47,872 epoch 38 - iter 2385/2650 - loss 0.03254518 - time (sec): 178.34 - samples/sec: 7383.94 - lr: 0.100000 +2023-04-06 00:38:07,359 epoch 38 - iter 2650/2650 - loss 0.03256946 - time (sec): 197.83 - samples/sec: 7392.10 - lr: 0.100000 +2023-04-06 00:38:07,360 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:38:07,360 EPOCH 38 done: loss 0.0326 - lr 0.100000 +2023-04-06 00:38:07,360 BAD EPOCHS (no improvement): 1 +2023-04-06 00:38:07,363 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:38:27,051 epoch 39 - iter 265/2650 - loss 0.03232815 - time (sec): 19.69 - samples/sec: 7345.86 - lr: 0.100000 +2023-04-06 00:38:46,782 epoch 39 - iter 530/2650 - loss 0.03211567 - time (sec): 39.42 - samples/sec: 7403.54 - lr: 0.100000 +2023-04-06 00:39:06,599 epoch 39 - iter 795/2650 - loss 0.03195153 - time (sec): 59.24 - samples/sec: 7409.57 - lr: 0.100000 +2023-04-06 00:39:26,775 epoch 39 - iter 1060/2650 - loss 0.03162712 - time (sec): 79.41 - samples/sec: 7379.61 - lr: 0.100000 +2023-04-06 00:39:46,523 epoch 39 - iter 1325/2650 - loss 0.03230874 - time (sec): 99.16 - samples/sec: 7379.12 - lr: 0.100000 +2023-04-06 00:40:06,130 epoch 39 - iter 1590/2650 - loss 0.03233712 - time (sec): 118.77 - samples/sec: 7393.02 - lr: 0.100000 +2023-04-06 00:40:25,864 epoch 39 - iter 1855/2650 - loss 0.03245259 - time (sec): 138.50 - samples/sec: 7394.45 - lr: 0.100000 +2023-04-06 00:40:45,769 epoch 39 - iter 2120/2650 - loss 0.03263103 - time (sec): 158.41 - samples/sec: 7388.52 - lr: 0.100000 +2023-04-06 00:41:05,497 epoch 39 - iter 2385/2650 - loss 0.03265201 - time (sec): 178.13 - samples/sec: 7398.60 - lr: 0.100000 +2023-04-06 00:41:24,989 epoch 39 - iter 2650/2650 - loss 0.03264164 - time (sec): 197.63 - samples/sec: 7399.66 - lr: 0.100000 +2023-04-06 00:41:24,989 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:41:24,989 EPOCH 39 done: loss 0.0326 - lr 0.100000 +2023-04-06 00:41:24,990 BAD EPOCHS (no improvement): 2 +2023-04-06 00:41:24,993 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:41:45,177 epoch 40 - iter 265/2650 - loss 0.03287872 - time (sec): 20.18 - samples/sec: 7383.20 - lr: 0.100000 +2023-04-06 00:42:04,779 epoch 40 - iter 530/2650 - loss 0.03217006 - time (sec): 39.79 - samples/sec: 7402.31 - lr: 0.100000 +2023-04-06 00:42:24,709 epoch 40 - iter 795/2650 - loss 0.03147888 - time (sec): 59.72 - samples/sec: 7373.96 - lr: 0.100000 +2023-04-06 00:42:44,139 epoch 40 - iter 1060/2650 - loss 0.03181766 - time (sec): 79.15 - samples/sec: 7401.65 - lr: 0.100000 +2023-04-06 00:43:03,362 epoch 40 - iter 1325/2650 - loss 0.03176037 - time (sec): 98.37 - samples/sec: 7429.62 - lr: 0.100000 +2023-04-06 00:43:22,956 epoch 40 - iter 1590/2650 - loss 0.03192259 - time (sec): 117.96 - samples/sec: 7431.03 - lr: 0.100000 +2023-04-06 00:43:42,668 epoch 40 - iter 1855/2650 - loss 0.03229649 - time (sec): 137.68 - samples/sec: 7434.31 - lr: 0.100000 +2023-04-06 00:44:01,895 epoch 40 - iter 2120/2650 - loss 0.03235237 - time (sec): 156.90 - samples/sec: 7453.33 - lr: 0.100000 +2023-04-06 00:44:21,789 epoch 40 - iter 2385/2650 - loss 0.03268056 - time (sec): 176.80 - samples/sec: 7449.19 - lr: 0.100000 +2023-04-06 00:44:41,159 epoch 40 - iter 2650/2650 - loss 0.03280627 - time (sec): 196.17 - samples/sec: 7454.72 - lr: 0.100000 +2023-04-06 00:44:41,160 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:44:41,160 EPOCH 40 done: loss 0.0328 - lr 0.100000 +2023-04-06 00:44:41,160 BAD EPOCHS (no improvement): 3 +2023-04-06 00:44:41,163 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:45:00,702 epoch 41 - iter 265/2650 - loss 0.03174940 - time (sec): 19.54 - samples/sec: 7506.79 - lr: 0.100000 +2023-04-06 00:45:19,887 epoch 41 - iter 530/2650 - loss 0.03177356 - time (sec): 38.72 - samples/sec: 7538.45 - lr: 0.100000 +2023-04-06 00:45:39,151 epoch 41 - iter 795/2650 - loss 0.03247711 - time (sec): 57.99 - samples/sec: 7542.75 - lr: 0.100000 +2023-04-06 00:45:58,892 epoch 41 - iter 1060/2650 - loss 0.03228117 - time (sec): 77.73 - samples/sec: 7519.18 - lr: 0.100000 +2023-04-06 00:46:18,378 epoch 41 - iter 1325/2650 - loss 0.03205756 - time (sec): 97.21 - samples/sec: 7512.14 - lr: 0.100000 +2023-04-06 00:46:37,887 epoch 41 - iter 1590/2650 - loss 0.03237677 - time (sec): 116.72 - samples/sec: 7510.67 - lr: 0.100000 +2023-04-06 00:46:57,176 epoch 41 - iter 1855/2650 - loss 0.03213207 - time (sec): 136.01 - samples/sec: 7512.22 - lr: 0.100000 +2023-04-06 00:47:17,212 epoch 41 - iter 2120/2650 - loss 0.03251258 - time (sec): 156.05 - samples/sec: 7503.62 - lr: 0.100000 +2023-04-06 00:47:37,218 epoch 41 - iter 2385/2650 - loss 0.03257332 - time (sec): 176.05 - samples/sec: 7483.69 - lr: 0.100000 +2023-04-06 00:47:56,229 epoch 41 - iter 2650/2650 - loss 0.03272240 - time (sec): 195.07 - samples/sec: 7496.76 - lr: 0.100000 +2023-04-06 00:47:56,229 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:47:56,229 EPOCH 41 done: loss 0.0327 - lr 0.100000 +2023-04-06 00:47:56,229 Epoch 41: reducing learning rate of group 0 to 5.0000e-02. +2023-04-06 00:47:56,229 BAD EPOCHS (no improvement): 4 +2023-04-06 00:47:56,232 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:48:15,885 epoch 42 - iter 265/2650 - loss 0.02955627 - time (sec): 19.65 - samples/sec: 7414.30 - lr: 0.050000 +2023-04-06 00:48:35,659 epoch 42 - iter 530/2650 - loss 0.03067219 - time (sec): 39.43 - samples/sec: 7497.40 - lr: 0.050000 +2023-04-06 00:48:54,990 epoch 42 - iter 795/2650 - loss 0.03056294 - time (sec): 58.76 - samples/sec: 7471.31 - lr: 0.050000 +2023-04-06 00:49:14,285 epoch 42 - iter 1060/2650 - loss 0.03019372 - time (sec): 78.05 - samples/sec: 7505.97 - lr: 0.050000 +2023-04-06 00:49:33,798 epoch 42 - iter 1325/2650 - loss 0.03022652 - time (sec): 97.57 - samples/sec: 7504.12 - lr: 0.050000 +2023-04-06 00:49:53,249 epoch 42 - iter 1590/2650 - loss 0.02997870 - time (sec): 117.02 - samples/sec: 7509.38 - lr: 0.050000 +2023-04-06 00:50:12,663 epoch 42 - iter 1855/2650 - loss 0.02969903 - time (sec): 136.43 - samples/sec: 7508.86 - lr: 0.050000 +2023-04-06 00:50:32,607 epoch 42 - iter 2120/2650 - loss 0.02975692 - time (sec): 156.37 - samples/sec: 7490.84 - lr: 0.050000 +2023-04-06 00:50:52,034 epoch 42 - iter 2385/2650 - loss 0.02977858 - time (sec): 175.80 - samples/sec: 7493.21 - lr: 0.050000 +2023-04-06 00:51:10,965 epoch 42 - iter 2650/2650 - loss 0.02985402 - time (sec): 194.73 - samples/sec: 7509.59 - lr: 0.050000 +2023-04-06 00:51:10,965 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:51:10,965 EPOCH 42 done: loss 0.0299 - lr 0.050000 +2023-04-06 00:51:10,965 BAD EPOCHS (no improvement): 0 +2023-04-06 00:51:10,968 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:51:31,043 epoch 43 - iter 265/2650 - loss 0.02799119 - time (sec): 20.07 - samples/sec: 7386.23 - lr: 0.050000 +2023-04-06 00:51:50,322 epoch 43 - iter 530/2650 - loss 0.02850278 - time (sec): 39.35 - samples/sec: 7450.60 - lr: 0.050000 +2023-04-06 00:52:09,860 epoch 43 - iter 795/2650 - loss 0.02804902 - time (sec): 58.89 - samples/sec: 7485.08 - lr: 0.050000 +2023-04-06 00:52:28,808 epoch 43 - iter 1060/2650 - loss 0.02836221 - time (sec): 77.84 - samples/sec: 7556.55 - lr: 0.050000 +2023-04-06 00:52:48,170 epoch 43 - iter 1325/2650 - loss 0.02851280 - time (sec): 97.20 - samples/sec: 7541.96 - lr: 0.050000 +2023-04-06 00:53:17,979 epoch 43 - iter 1590/2650 - loss 0.02869553 - time (sec): 127.01 - samples/sec: 6931.99 - lr: 0.050000 +2023-04-06 00:53:37,000 epoch 43 - iter 1855/2650 - loss 0.02883675 - time (sec): 146.03 - samples/sec: 7008.85 - lr: 0.050000 +2023-04-06 00:53:56,381 epoch 43 - iter 2120/2650 - loss 0.02869713 - time (sec): 165.41 - samples/sec: 7080.72 - lr: 0.050000 +2023-04-06 00:54:15,961 epoch 43 - iter 2385/2650 - loss 0.02862479 - time (sec): 184.99 - samples/sec: 7117.62 - lr: 0.050000 +2023-04-06 00:54:35,447 epoch 43 - iter 2650/2650 - loss 0.02866556 - time (sec): 204.48 - samples/sec: 7151.67 - lr: 0.050000 +2023-04-06 00:54:35,447 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:54:35,447 EPOCH 43 done: loss 0.0287 - lr 0.050000 +2023-04-06 00:54:35,447 BAD EPOCHS (no improvement): 0 +2023-04-06 00:54:35,451 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:54:55,598 epoch 44 - iter 265/2650 - loss 0.02710923 - time (sec): 20.15 - samples/sec: 7285.25 - lr: 0.050000 +2023-04-06 00:55:14,932 epoch 44 - iter 530/2650 - loss 0.02736684 - time (sec): 39.48 - samples/sec: 7439.46 - lr: 0.050000 +2023-04-06 00:55:34,411 epoch 44 - iter 795/2650 - loss 0.02717180 - time (sec): 58.96 - samples/sec: 7460.04 - lr: 0.050000 +2023-04-06 00:55:53,601 epoch 44 - iter 1060/2650 - loss 0.02729847 - time (sec): 78.15 - samples/sec: 7485.47 - lr: 0.050000 +2023-04-06 00:56:12,925 epoch 44 - iter 1325/2650 - loss 0.02746751 - time (sec): 97.47 - samples/sec: 7509.87 - lr: 0.050000 +2023-04-06 00:56:32,029 epoch 44 - iter 1590/2650 - loss 0.02758190 - time (sec): 116.58 - samples/sec: 7531.09 - lr: 0.050000 +2023-04-06 00:56:51,588 epoch 44 - iter 1855/2650 - loss 0.02744225 - time (sec): 136.14 - samples/sec: 7534.10 - lr: 0.050000 +2023-04-06 00:57:11,142 epoch 44 - iter 2120/2650 - loss 0.02742070 - time (sec): 155.69 - samples/sec: 7536.47 - lr: 0.050000 +2023-04-06 00:57:30,320 epoch 44 - iter 2385/2650 - loss 0.02746320 - time (sec): 174.87 - samples/sec: 7537.48 - lr: 0.050000 +2023-04-06 00:57:49,294 epoch 44 - iter 2650/2650 - loss 0.02770175 - time (sec): 193.84 - samples/sec: 7544.07 - lr: 0.050000 +2023-04-06 00:57:49,294 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:57:49,294 EPOCH 44 done: loss 0.0277 - lr 0.050000 +2023-04-06 00:57:49,294 BAD EPOCHS (no improvement): 0 +2023-04-06 00:57:49,298 ---------------------------------------------------------------------------------------------------- +2023-04-06 00:58:08,191 epoch 45 - iter 265/2650 - loss 0.02509799 - time (sec): 18.89 - samples/sec: 7671.46 - lr: 0.050000 +2023-04-06 00:58:27,340 epoch 45 - iter 530/2650 - loss 0.02702074 - time (sec): 38.04 - samples/sec: 7632.51 - lr: 0.050000 +2023-04-06 00:58:46,386 epoch 45 - iter 795/2650 - loss 0.02733058 - time (sec): 57.09 - samples/sec: 7633.16 - lr: 0.050000 +2023-04-06 00:59:05,973 epoch 45 - iter 1060/2650 - loss 0.02741913 - time (sec): 76.68 - samples/sec: 7591.64 - lr: 0.050000 +2023-04-06 00:59:25,313 epoch 45 - iter 1325/2650 - loss 0.02708325 - time (sec): 96.02 - samples/sec: 7580.69 - lr: 0.050000 +2023-04-06 00:59:44,651 epoch 45 - iter 1590/2650 - loss 0.02708799 - time (sec): 115.35 - samples/sec: 7581.25 - lr: 0.050000 +2023-04-06 01:00:04,840 epoch 45 - iter 1855/2650 - loss 0.02726109 - time (sec): 135.54 - samples/sec: 7542.93 - lr: 0.050000 +2023-04-06 01:00:24,277 epoch 45 - iter 2120/2650 - loss 0.02740109 - time (sec): 154.98 - samples/sec: 7540.46 - lr: 0.050000 +2023-04-06 01:00:43,609 epoch 45 - iter 2385/2650 - loss 0.02735535 - time (sec): 174.31 - samples/sec: 7545.51 - lr: 0.050000 +2023-04-06 01:01:03,274 epoch 45 - iter 2650/2650 - loss 0.02734510 - time (sec): 193.98 - samples/sec: 7538.87 - lr: 0.050000 +2023-04-06 01:01:03,274 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:01:03,275 EPOCH 45 done: loss 0.0273 - lr 0.050000 +2023-04-06 01:01:03,275 BAD EPOCHS (no improvement): 0 +2023-04-06 01:01:03,290 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:01:22,877 epoch 46 - iter 265/2650 - loss 0.02775340 - time (sec): 19.59 - samples/sec: 7494.71 - lr: 0.050000 +2023-04-06 01:01:42,020 epoch 46 - iter 530/2650 - loss 0.02753420 - time (sec): 38.73 - samples/sec: 7580.22 - lr: 0.050000 +2023-04-06 01:02:01,173 epoch 46 - iter 795/2650 - loss 0.02683500 - time (sec): 57.88 - samples/sec: 7583.53 - lr: 0.050000 +2023-04-06 01:02:21,033 epoch 46 - iter 1060/2650 - loss 0.02685330 - time (sec): 77.74 - samples/sec: 7518.09 - lr: 0.050000 +2023-04-06 01:02:40,432 epoch 46 - iter 1325/2650 - loss 0.02686319 - time (sec): 97.14 - samples/sec: 7516.76 - lr: 0.050000 +2023-04-06 01:03:00,209 epoch 46 - iter 1590/2650 - loss 0.02686952 - time (sec): 116.92 - samples/sec: 7510.60 - lr: 0.050000 +2023-04-06 01:03:20,298 epoch 46 - iter 1855/2650 - loss 0.02696233 - time (sec): 137.01 - samples/sec: 7487.66 - lr: 0.050000 +2023-04-06 01:03:39,539 epoch 46 - iter 2120/2650 - loss 0.02709771 - time (sec): 156.25 - samples/sec: 7503.20 - lr: 0.050000 +2023-04-06 01:03:58,387 epoch 46 - iter 2385/2650 - loss 0.02721047 - time (sec): 175.10 - samples/sec: 7516.19 - lr: 0.050000 +2023-04-06 01:04:17,792 epoch 46 - iter 2650/2650 - loss 0.02726884 - time (sec): 194.50 - samples/sec: 7518.52 - lr: 0.050000 +2023-04-06 01:04:17,792 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:04:17,792 EPOCH 46 done: loss 0.0273 - lr 0.050000 +2023-04-06 01:04:17,792 BAD EPOCHS (no improvement): 0 +2023-04-06 01:04:17,796 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:04:37,761 epoch 47 - iter 265/2650 - loss 0.02579254 - time (sec): 19.96 - samples/sec: 7396.54 - lr: 0.050000 +2023-04-06 01:04:56,809 epoch 47 - iter 530/2650 - loss 0.02520486 - time (sec): 39.01 - samples/sec: 7504.27 - lr: 0.050000 +2023-04-06 01:05:16,166 epoch 47 - iter 795/2650 - loss 0.02535124 - time (sec): 58.37 - samples/sec: 7510.62 - lr: 0.050000 +2023-04-06 01:05:35,787 epoch 47 - iter 1060/2650 - loss 0.02555169 - time (sec): 77.99 - samples/sec: 7503.14 - lr: 0.050000 +2023-04-06 01:05:55,087 epoch 47 - iter 1325/2650 - loss 0.02568268 - time (sec): 97.29 - samples/sec: 7504.14 - lr: 0.050000 +2023-04-06 01:06:14,578 epoch 47 - iter 1590/2650 - loss 0.02589613 - time (sec): 116.78 - samples/sec: 7517.83 - lr: 0.050000 +2023-04-06 01:06:33,942 epoch 47 - iter 1855/2650 - loss 0.02605782 - time (sec): 136.15 - samples/sec: 7524.67 - lr: 0.050000 +2023-04-06 01:06:53,258 epoch 47 - iter 2120/2650 - loss 0.02630314 - time (sec): 155.46 - samples/sec: 7519.38 - lr: 0.050000 +2023-04-06 01:07:12,382 epoch 47 - iter 2385/2650 - loss 0.02634488 - time (sec): 174.59 - samples/sec: 7530.39 - lr: 0.050000 +2023-04-06 01:07:32,130 epoch 47 - iter 2650/2650 - loss 0.02638097 - time (sec): 194.33 - samples/sec: 7525.04 - lr: 0.050000 +2023-04-06 01:07:32,130 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:07:32,130 EPOCH 47 done: loss 0.0264 - lr 0.050000 +2023-04-06 01:07:32,130 BAD EPOCHS (no improvement): 0 +2023-04-06 01:07:32,134 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:07:51,165 epoch 48 - iter 265/2650 - loss 0.02497006 - time (sec): 19.03 - samples/sec: 7708.24 - lr: 0.050000 +2023-04-06 01:08:10,521 epoch 48 - iter 530/2650 - loss 0.02537864 - time (sec): 38.39 - samples/sec: 7652.81 - lr: 0.050000 +2023-04-06 01:08:30,134 epoch 48 - iter 795/2650 - loss 0.02586341 - time (sec): 58.00 - samples/sec: 7601.50 - lr: 0.050000 +2023-04-06 01:08:49,049 epoch 48 - iter 1060/2650 - loss 0.02610405 - time (sec): 76.91 - samples/sec: 7624.61 - lr: 0.050000 +2023-04-06 01:09:08,782 epoch 48 - iter 1325/2650 - loss 0.02613025 - time (sec): 96.65 - samples/sec: 7585.54 - lr: 0.050000 +2023-04-06 01:09:27,998 epoch 48 - iter 1590/2650 - loss 0.02639868 - time (sec): 115.86 - samples/sec: 7587.82 - lr: 0.050000 +2023-04-06 01:09:47,645 epoch 48 - iter 1855/2650 - loss 0.02665686 - time (sec): 135.51 - samples/sec: 7557.65 - lr: 0.050000 +2023-04-06 01:10:07,062 epoch 48 - iter 2120/2650 - loss 0.02648754 - time (sec): 154.93 - samples/sec: 7560.05 - lr: 0.050000 +2023-04-06 01:10:26,239 epoch 48 - iter 2385/2650 - loss 0.02640973 - time (sec): 174.10 - samples/sec: 7562.91 - lr: 0.050000 +2023-04-06 01:10:45,825 epoch 48 - iter 2650/2650 - loss 0.02644546 - time (sec): 193.69 - samples/sec: 7549.98 - lr: 0.050000 +2023-04-06 01:10:45,825 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:10:45,825 EPOCH 48 done: loss 0.0264 - lr 0.050000 +2023-04-06 01:10:45,825 BAD EPOCHS (no improvement): 1 +2023-04-06 01:10:45,828 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:11:04,470 epoch 49 - iter 265/2650 - loss 0.02572595 - time (sec): 18.64 - samples/sec: 7716.66 - lr: 0.050000 +2023-04-06 01:11:24,007 epoch 49 - iter 530/2650 - loss 0.02552120 - time (sec): 38.18 - samples/sec: 7602.09 - lr: 0.050000 +2023-04-06 01:11:43,480 epoch 49 - iter 795/2650 - loss 0.02633131 - time (sec): 57.65 - samples/sec: 7576.99 - lr: 0.050000 +2023-04-06 01:12:02,339 epoch 49 - iter 1060/2650 - loss 0.02598872 - time (sec): 76.51 - samples/sec: 7590.27 - lr: 0.050000 +2023-04-06 01:12:22,289 epoch 49 - iter 1325/2650 - loss 0.02601439 - time (sec): 96.46 - samples/sec: 7541.19 - lr: 0.050000 +2023-04-06 01:12:42,730 epoch 49 - iter 1590/2650 - loss 0.02620471 - time (sec): 116.90 - samples/sec: 7492.66 - lr: 0.050000 +2023-04-06 01:13:01,883 epoch 49 - iter 1855/2650 - loss 0.02615302 - time (sec): 136.05 - samples/sec: 7516.21 - lr: 0.050000 +2023-04-06 01:13:20,819 epoch 49 - iter 2120/2650 - loss 0.02615157 - time (sec): 154.99 - samples/sec: 7522.12 - lr: 0.050000 +2023-04-06 01:13:40,282 epoch 49 - iter 2385/2650 - loss 0.02609305 - time (sec): 174.45 - samples/sec: 7535.30 - lr: 0.050000 +2023-04-06 01:13:59,805 epoch 49 - iter 2650/2650 - loss 0.02602727 - time (sec): 193.98 - samples/sec: 7538.88 - lr: 0.050000 +2023-04-06 01:13:59,805 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:13:59,805 EPOCH 49 done: loss 0.0260 - lr 0.050000 +2023-04-06 01:13:59,805 BAD EPOCHS (no improvement): 0 +2023-04-06 01:13:59,808 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:14:19,314 epoch 50 - iter 265/2650 - loss 0.02565035 - time (sec): 19.51 - samples/sec: 7508.88 - lr: 0.050000 +2023-04-06 01:14:38,162 epoch 50 - iter 530/2650 - loss 0.02543204 - time (sec): 38.35 - samples/sec: 7571.96 - lr: 0.050000 +2023-04-06 01:14:57,197 epoch 50 - iter 795/2650 - loss 0.02555477 - time (sec): 57.39 - samples/sec: 7615.21 - lr: 0.050000 +2023-04-06 01:15:16,424 epoch 50 - iter 1060/2650 - loss 0.02503155 - time (sec): 76.62 - samples/sec: 7592.32 - lr: 0.050000 +2023-04-06 01:15:35,860 epoch 50 - iter 1325/2650 - loss 0.02525104 - time (sec): 96.05 - samples/sec: 7584.93 - lr: 0.050000 +2023-04-06 01:15:55,505 epoch 50 - iter 1590/2650 - loss 0.02528522 - time (sec): 115.70 - samples/sec: 7579.38 - lr: 0.050000 +2023-04-06 01:16:14,798 epoch 50 - iter 1855/2650 - loss 0.02549004 - time (sec): 134.99 - samples/sec: 7577.29 - lr: 0.050000 +2023-04-06 01:16:34,439 epoch 50 - iter 2120/2650 - loss 0.02573239 - time (sec): 154.63 - samples/sec: 7560.74 - lr: 0.050000 +2023-04-06 01:16:54,084 epoch 50 - iter 2385/2650 - loss 0.02561036 - time (sec): 174.28 - samples/sec: 7552.73 - lr: 0.050000 +2023-04-06 01:17:13,721 epoch 50 - iter 2650/2650 - loss 0.02588396 - time (sec): 193.91 - samples/sec: 7541.35 - lr: 0.050000 +2023-04-06 01:17:13,722 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:17:13,722 EPOCH 50 done: loss 0.0259 - lr 0.050000 +2023-04-06 01:17:13,722 BAD EPOCHS (no improvement): 0 +2023-04-06 01:17:13,725 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:17:33,203 epoch 51 - iter 265/2650 - loss 0.02476935 - time (sec): 19.48 - samples/sec: 7500.10 - lr: 0.050000 +2023-04-06 01:17:52,079 epoch 51 - iter 530/2650 - loss 0.02463422 - time (sec): 38.35 - samples/sec: 7586.37 - lr: 0.050000 +2023-04-06 01:18:11,377 epoch 51 - iter 795/2650 - loss 0.02502662 - time (sec): 57.65 - samples/sec: 7590.55 - lr: 0.050000 +2023-04-06 01:18:30,412 epoch 51 - iter 1060/2650 - loss 0.02513068 - time (sec): 76.69 - samples/sec: 7601.60 - lr: 0.050000 +2023-04-06 01:18:49,768 epoch 51 - iter 1325/2650 - loss 0.02536481 - time (sec): 96.04 - samples/sec: 7604.77 - lr: 0.050000 +2023-04-06 01:19:08,895 epoch 51 - iter 1590/2650 - loss 0.02530856 - time (sec): 115.17 - samples/sec: 7607.85 - lr: 0.050000 +2023-04-06 01:19:28,314 epoch 51 - iter 1855/2650 - loss 0.02515549 - time (sec): 134.59 - samples/sec: 7599.49 - lr: 0.050000 +2023-04-06 01:19:48,204 epoch 51 - iter 2120/2650 - loss 0.02537275 - time (sec): 154.48 - samples/sec: 7572.89 - lr: 0.050000 +2023-04-06 01:20:07,558 epoch 51 - iter 2385/2650 - loss 0.02531388 - time (sec): 173.83 - samples/sec: 7571.59 - lr: 0.050000 +2023-04-06 01:20:26,705 epoch 51 - iter 2650/2650 - loss 0.02558449 - time (sec): 192.98 - samples/sec: 7577.82 - lr: 0.050000 +2023-04-06 01:20:26,705 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:20:26,705 EPOCH 51 done: loss 0.0256 - lr 0.050000 +2023-04-06 01:20:26,705 BAD EPOCHS (no improvement): 0 +2023-04-06 01:20:26,708 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:20:46,533 epoch 52 - iter 265/2650 - loss 0.02428667 - time (sec): 19.82 - samples/sec: 7498.55 - lr: 0.050000 +2023-04-06 01:21:06,088 epoch 52 - iter 530/2650 - loss 0.02445563 - time (sec): 39.38 - samples/sec: 7479.28 - lr: 0.050000 +2023-04-06 01:21:25,191 epoch 52 - iter 795/2650 - loss 0.02421567 - time (sec): 58.48 - samples/sec: 7523.45 - lr: 0.050000 +2023-04-06 01:21:44,634 epoch 52 - iter 1060/2650 - loss 0.02474226 - time (sec): 77.93 - samples/sec: 7506.65 - lr: 0.050000 +2023-04-06 01:22:03,898 epoch 52 - iter 1325/2650 - loss 0.02506947 - time (sec): 97.19 - samples/sec: 7544.89 - lr: 0.050000 +2023-04-06 01:22:23,454 epoch 52 - iter 1590/2650 - loss 0.02522818 - time (sec): 116.75 - samples/sec: 7548.89 - lr: 0.050000 +2023-04-06 01:22:43,024 epoch 52 - iter 1855/2650 - loss 0.02536071 - time (sec): 136.32 - samples/sec: 7535.44 - lr: 0.050000 +2023-04-06 01:23:02,131 epoch 52 - iter 2120/2650 - loss 0.02545367 - time (sec): 155.42 - samples/sec: 7557.21 - lr: 0.050000 +2023-04-06 01:23:20,797 epoch 52 - iter 2385/2650 - loss 0.02536263 - time (sec): 174.09 - samples/sec: 7577.26 - lr: 0.050000 +2023-04-06 01:23:39,861 epoch 52 - iter 2650/2650 - loss 0.02535702 - time (sec): 193.15 - samples/sec: 7571.02 - lr: 0.050000 +2023-04-06 01:23:39,861 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:23:39,861 EPOCH 52 done: loss 0.0254 - lr 0.050000 +2023-04-06 01:23:39,861 BAD EPOCHS (no improvement): 0 +2023-04-06 01:23:39,864 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:23:59,168 epoch 53 - iter 265/2650 - loss 0.02384415 - time (sec): 19.30 - samples/sec: 7587.55 - lr: 0.050000 +2023-04-06 01:24:18,424 epoch 53 - iter 530/2650 - loss 0.02477392 - time (sec): 38.56 - samples/sec: 7568.35 - lr: 0.050000 +2023-04-06 01:24:37,042 epoch 53 - iter 795/2650 - loss 0.02478839 - time (sec): 57.18 - samples/sec: 7644.22 - lr: 0.050000 +2023-04-06 01:24:56,776 epoch 53 - iter 1060/2650 - loss 0.02494889 - time (sec): 76.91 - samples/sec: 7597.85 - lr: 0.050000 +2023-04-06 01:25:16,271 epoch 53 - iter 1325/2650 - loss 0.02480454 - time (sec): 96.41 - samples/sec: 7601.60 - lr: 0.050000 +2023-04-06 01:25:35,661 epoch 53 - iter 1590/2650 - loss 0.02468777 - time (sec): 115.80 - samples/sec: 7580.97 - lr: 0.050000 +2023-04-06 01:25:54,928 epoch 53 - iter 1855/2650 - loss 0.02499293 - time (sec): 135.06 - samples/sec: 7572.97 - lr: 0.050000 +2023-04-06 01:26:13,712 epoch 53 - iter 2120/2650 - loss 0.02510099 - time (sec): 153.85 - samples/sec: 7593.36 - lr: 0.050000 +2023-04-06 01:26:33,163 epoch 53 - iter 2385/2650 - loss 0.02489719 - time (sec): 173.30 - samples/sec: 7587.98 - lr: 0.050000 +2023-04-06 01:26:53,182 epoch 53 - iter 2650/2650 - loss 0.02507869 - time (sec): 193.32 - samples/sec: 7564.54 - lr: 0.050000 +2023-04-06 01:26:53,183 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:26:53,183 EPOCH 53 done: loss 0.0251 - lr 0.050000 +2023-04-06 01:26:53,183 BAD EPOCHS (no improvement): 0 +2023-04-06 01:26:53,186 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:27:12,263 epoch 54 - iter 265/2650 - loss 0.02404935 - time (sec): 19.08 - samples/sec: 7668.36 - lr: 0.050000 +2023-04-06 01:27:31,619 epoch 54 - iter 530/2650 - loss 0.02523240 - time (sec): 38.43 - samples/sec: 7617.33 - lr: 0.050000 +2023-04-06 01:27:51,094 epoch 54 - iter 795/2650 - loss 0.02507307 - time (sec): 57.91 - samples/sec: 7607.61 - lr: 0.050000 +2023-04-06 01:28:11,262 epoch 54 - iter 1060/2650 - loss 0.02508579 - time (sec): 78.08 - samples/sec: 7537.86 - lr: 0.050000 +2023-04-06 01:28:30,719 epoch 54 - iter 1325/2650 - loss 0.02516602 - time (sec): 97.53 - samples/sec: 7549.15 - lr: 0.050000 +2023-04-06 01:28:50,363 epoch 54 - iter 1590/2650 - loss 0.02526335 - time (sec): 117.18 - samples/sec: 7526.76 - lr: 0.050000 +2023-04-06 01:29:08,929 epoch 54 - iter 1855/2650 - loss 0.02520349 - time (sec): 135.74 - samples/sec: 7550.96 - lr: 0.050000 +2023-04-06 01:29:28,607 epoch 54 - iter 2120/2650 - loss 0.02535713 - time (sec): 155.42 - samples/sec: 7542.01 - lr: 0.050000 +2023-04-06 01:29:47,436 epoch 54 - iter 2385/2650 - loss 0.02533769 - time (sec): 174.25 - samples/sec: 7550.47 - lr: 0.050000 +2023-04-06 01:30:06,963 epoch 54 - iter 2650/2650 - loss 0.02533762 - time (sec): 193.78 - samples/sec: 7546.64 - lr: 0.050000 +2023-04-06 01:30:06,964 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:30:06,964 EPOCH 54 done: loss 0.0253 - lr 0.050000 +2023-04-06 01:30:06,964 BAD EPOCHS (no improvement): 1 +2023-04-06 01:30:06,968 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:30:25,678 epoch 55 - iter 265/2650 - loss 0.02445691 - time (sec): 18.71 - samples/sec: 7748.94 - lr: 0.050000 +2023-04-06 01:30:44,548 epoch 55 - iter 530/2650 - loss 0.02469012 - time (sec): 37.58 - samples/sec: 7732.49 - lr: 0.050000 +2023-04-06 01:31:04,063 epoch 55 - iter 795/2650 - loss 0.02431063 - time (sec): 57.10 - samples/sec: 7675.71 - lr: 0.050000 +2023-04-06 01:31:24,143 epoch 55 - iter 1060/2650 - loss 0.02403691 - time (sec): 77.18 - samples/sec: 7587.05 - lr: 0.050000 +2023-04-06 01:31:43,149 epoch 55 - iter 1325/2650 - loss 0.02393999 - time (sec): 96.18 - samples/sec: 7591.61 - lr: 0.050000 +2023-04-06 01:32:02,452 epoch 55 - iter 1590/2650 - loss 0.02432887 - time (sec): 115.48 - samples/sec: 7597.23 - lr: 0.050000 +2023-04-06 01:32:22,099 epoch 55 - iter 1855/2650 - loss 0.02429997 - time (sec): 135.13 - samples/sec: 7571.78 - lr: 0.050000 +2023-04-06 01:32:40,968 epoch 55 - iter 2120/2650 - loss 0.02442207 - time (sec): 154.00 - samples/sec: 7583.90 - lr: 0.050000 +2023-04-06 01:33:00,509 epoch 55 - iter 2385/2650 - loss 0.02432777 - time (sec): 173.54 - samples/sec: 7574.46 - lr: 0.050000 +2023-04-06 01:33:20,420 epoch 55 - iter 2650/2650 - loss 0.02436127 - time (sec): 193.45 - samples/sec: 7559.28 - lr: 0.050000 +2023-04-06 01:33:20,421 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:33:20,421 EPOCH 55 done: loss 0.0244 - lr 0.050000 +2023-04-06 01:33:20,421 BAD EPOCHS (no improvement): 0 +2023-04-06 01:33:20,425 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:33:39,910 epoch 56 - iter 265/2650 - loss 0.02377505 - time (sec): 19.49 - samples/sec: 7489.99 - lr: 0.050000 +2023-04-06 01:33:59,324 epoch 56 - iter 530/2650 - loss 0.02438565 - time (sec): 38.90 - samples/sec: 7519.72 - lr: 0.050000 +2023-04-06 01:34:18,821 epoch 56 - iter 795/2650 - loss 0.02383171 - time (sec): 58.40 - samples/sec: 7519.05 - lr: 0.050000 +2023-04-06 01:34:38,703 epoch 56 - iter 1060/2650 - loss 0.02403599 - time (sec): 78.28 - samples/sec: 7485.78 - lr: 0.050000 +2023-04-06 01:34:57,585 epoch 56 - iter 1325/2650 - loss 0.02387954 - time (sec): 97.16 - samples/sec: 7515.97 - lr: 0.050000 +2023-04-06 01:35:17,090 epoch 56 - iter 1590/2650 - loss 0.02397118 - time (sec): 116.67 - samples/sec: 7514.80 - lr: 0.050000 +2023-04-06 01:35:36,055 epoch 56 - iter 1855/2650 - loss 0.02403955 - time (sec): 135.63 - samples/sec: 7542.35 - lr: 0.050000 +2023-04-06 01:35:55,238 epoch 56 - iter 2120/2650 - loss 0.02403829 - time (sec): 154.81 - samples/sec: 7555.59 - lr: 0.050000 +2023-04-06 01:36:14,399 epoch 56 - iter 2385/2650 - loss 0.02412982 - time (sec): 173.97 - samples/sec: 7557.59 - lr: 0.050000 +2023-04-06 01:36:33,828 epoch 56 - iter 2650/2650 - loss 0.02428701 - time (sec): 193.40 - samples/sec: 7561.22 - lr: 0.050000 +2023-04-06 01:36:33,828 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:36:33,828 EPOCH 56 done: loss 0.0243 - lr 0.050000 +2023-04-06 01:36:33,828 BAD EPOCHS (no improvement): 0 +2023-04-06 01:36:33,832 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:36:53,152 epoch 57 - iter 265/2650 - loss 0.02398013 - time (sec): 19.32 - samples/sec: 7533.07 - lr: 0.050000 +2023-04-06 01:37:12,591 epoch 57 - iter 530/2650 - loss 0.02429248 - time (sec): 38.76 - samples/sec: 7542.41 - lr: 0.050000 +2023-04-06 01:37:32,172 epoch 57 - iter 795/2650 - loss 0.02418072 - time (sec): 58.34 - samples/sec: 7538.34 - lr: 0.050000 +2023-04-06 01:37:51,594 epoch 57 - iter 1060/2650 - loss 0.02418512 - time (sec): 77.76 - samples/sec: 7538.48 - lr: 0.050000 +2023-04-06 01:38:10,575 epoch 57 - iter 1325/2650 - loss 0.02406297 - time (sec): 96.74 - samples/sec: 7565.41 - lr: 0.050000 +2023-04-06 01:38:29,560 epoch 57 - iter 1590/2650 - loss 0.02409748 - time (sec): 115.73 - samples/sec: 7583.74 - lr: 0.050000 +2023-04-06 01:38:48,964 epoch 57 - iter 1855/2650 - loss 0.02398304 - time (sec): 135.13 - samples/sec: 7579.53 - lr: 0.050000 +2023-04-06 01:39:08,450 epoch 57 - iter 2120/2650 - loss 0.02405014 - time (sec): 154.62 - samples/sec: 7571.11 - lr: 0.050000 +2023-04-06 01:39:27,959 epoch 57 - iter 2385/2650 - loss 0.02400264 - time (sec): 174.13 - samples/sec: 7564.21 - lr: 0.050000 +2023-04-06 01:39:46,995 epoch 57 - iter 2650/2650 - loss 0.02417812 - time (sec): 193.16 - samples/sec: 7570.62 - lr: 0.050000 +2023-04-06 01:39:46,995 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:39:46,995 EPOCH 57 done: loss 0.0242 - lr 0.050000 +2023-04-06 01:39:46,995 BAD EPOCHS (no improvement): 0 +2023-04-06 01:39:46,998 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:40:06,059 epoch 58 - iter 265/2650 - loss 0.02391883 - time (sec): 19.06 - samples/sec: 7554.10 - lr: 0.050000 +2023-04-06 01:40:25,476 epoch 58 - iter 530/2650 - loss 0.02445235 - time (sec): 38.48 - samples/sec: 7534.71 - lr: 0.050000 +2023-04-06 01:40:44,829 epoch 58 - iter 795/2650 - loss 0.02420618 - time (sec): 57.83 - samples/sec: 7572.99 - lr: 0.050000 +2023-04-06 01:41:03,885 epoch 58 - iter 1060/2650 - loss 0.02416510 - time (sec): 76.89 - samples/sec: 7586.44 - lr: 0.050000 +2023-04-06 01:41:23,497 epoch 58 - iter 1325/2650 - loss 0.02420534 - time (sec): 96.50 - samples/sec: 7549.23 - lr: 0.050000 +2023-04-06 01:41:43,225 epoch 58 - iter 1590/2650 - loss 0.02406354 - time (sec): 116.23 - samples/sec: 7528.95 - lr: 0.050000 +2023-04-06 01:42:03,252 epoch 58 - iter 1855/2650 - loss 0.02407472 - time (sec): 136.25 - samples/sec: 7512.06 - lr: 0.050000 +2023-04-06 01:42:22,191 epoch 58 - iter 2120/2650 - loss 0.02412140 - time (sec): 155.19 - samples/sec: 7537.83 - lr: 0.050000 +2023-04-06 01:42:41,533 epoch 58 - iter 2385/2650 - loss 0.02397507 - time (sec): 174.53 - samples/sec: 7544.20 - lr: 0.050000 +2023-04-06 01:43:00,508 epoch 58 - iter 2650/2650 - loss 0.02401095 - time (sec): 193.51 - samples/sec: 7557.06 - lr: 0.050000 +2023-04-06 01:43:00,508 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:43:00,508 EPOCH 58 done: loss 0.0240 - lr 0.050000 +2023-04-06 01:43:00,508 BAD EPOCHS (no improvement): 0 +2023-04-06 01:43:00,511 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:43:29,743 epoch 59 - iter 265/2650 - loss 0.02401676 - time (sec): 29.23 - samples/sec: 4985.83 - lr: 0.050000 +2023-04-06 01:43:49,665 epoch 59 - iter 530/2650 - loss 0.02373717 - time (sec): 49.15 - samples/sec: 5958.01 - lr: 0.050000 +2023-04-06 01:44:08,998 epoch 59 - iter 795/2650 - loss 0.02367060 - time (sec): 68.49 - samples/sec: 6416.11 - lr: 0.050000 +2023-04-06 01:44:27,974 epoch 59 - iter 1060/2650 - loss 0.02394443 - time (sec): 87.46 - samples/sec: 6707.21 - lr: 0.050000 +2023-04-06 01:44:47,346 epoch 59 - iter 1325/2650 - loss 0.02376119 - time (sec): 106.83 - samples/sec: 6875.43 - lr: 0.050000 +2023-04-06 01:45:06,237 epoch 59 - iter 1590/2650 - loss 0.02397139 - time (sec): 125.73 - samples/sec: 6993.14 - lr: 0.050000 +2023-04-06 01:45:25,520 epoch 59 - iter 1855/2650 - loss 0.02410068 - time (sec): 145.01 - samples/sec: 7072.06 - lr: 0.050000 +2023-04-06 01:45:44,796 epoch 59 - iter 2120/2650 - loss 0.02416227 - time (sec): 164.28 - samples/sec: 7131.06 - lr: 0.050000 +2023-04-06 01:46:04,055 epoch 59 - iter 2385/2650 - loss 0.02427166 - time (sec): 183.54 - samples/sec: 7171.22 - lr: 0.050000 +2023-04-06 01:46:23,607 epoch 59 - iter 2650/2650 - loss 0.02429694 - time (sec): 203.10 - samples/sec: 7200.36 - lr: 0.050000 +2023-04-06 01:46:23,608 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:46:23,608 EPOCH 59 done: loss 0.0243 - lr 0.050000 +2023-04-06 01:46:23,608 BAD EPOCHS (no improvement): 1 +2023-04-06 01:46:23,612 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:46:43,440 epoch 60 - iter 265/2650 - loss 0.02377375 - time (sec): 19.83 - samples/sec: 7434.15 - lr: 0.050000 +2023-04-06 01:47:02,502 epoch 60 - iter 530/2650 - loss 0.02425963 - time (sec): 38.89 - samples/sec: 7541.74 - lr: 0.050000 +2023-04-06 01:47:21,936 epoch 60 - iter 795/2650 - loss 0.02365385 - time (sec): 58.32 - samples/sec: 7510.84 - lr: 0.050000 +2023-04-06 01:47:41,656 epoch 60 - iter 1060/2650 - loss 0.02378961 - time (sec): 78.04 - samples/sec: 7487.93 - lr: 0.050000 +2023-04-06 01:48:01,510 epoch 60 - iter 1325/2650 - loss 0.02388184 - time (sec): 97.90 - samples/sec: 7474.98 - lr: 0.050000 +2023-04-06 01:48:20,827 epoch 60 - iter 1590/2650 - loss 0.02398835 - time (sec): 117.22 - samples/sec: 7487.91 - lr: 0.050000 +2023-04-06 01:48:39,680 epoch 60 - iter 1855/2650 - loss 0.02396476 - time (sec): 136.07 - samples/sec: 7523.92 - lr: 0.050000 +2023-04-06 01:48:59,119 epoch 60 - iter 2120/2650 - loss 0.02391949 - time (sec): 155.51 - samples/sec: 7528.10 - lr: 0.050000 +2023-04-06 01:49:18,645 epoch 60 - iter 2385/2650 - loss 0.02394978 - time (sec): 175.03 - samples/sec: 7521.83 - lr: 0.050000 +2023-04-06 01:49:37,311 epoch 60 - iter 2650/2650 - loss 0.02405185 - time (sec): 193.70 - samples/sec: 7549.66 - lr: 0.050000 +2023-04-06 01:49:37,311 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:49:37,311 EPOCH 60 done: loss 0.0241 - lr 0.050000 +2023-04-06 01:49:37,311 BAD EPOCHS (no improvement): 2 +2023-04-06 01:49:37,314 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:49:57,331 epoch 61 - iter 265/2650 - loss 0.02314493 - time (sec): 20.02 - samples/sec: 7346.36 - lr: 0.050000 +2023-04-06 01:50:16,962 epoch 61 - iter 530/2650 - loss 0.02354502 - time (sec): 39.65 - samples/sec: 7428.09 - lr: 0.050000 +2023-04-06 01:50:36,953 epoch 61 - iter 795/2650 - loss 0.02334702 - time (sec): 59.64 - samples/sec: 7399.68 - lr: 0.050000 +2023-04-06 01:50:55,747 epoch 61 - iter 1060/2650 - loss 0.02314119 - time (sec): 78.43 - samples/sec: 7481.04 - lr: 0.050000 +2023-04-06 01:51:14,671 epoch 61 - iter 1325/2650 - loss 0.02323366 - time (sec): 97.36 - samples/sec: 7519.98 - lr: 0.050000 +2023-04-06 01:51:33,426 epoch 61 - iter 1590/2650 - loss 0.02328936 - time (sec): 116.11 - samples/sec: 7552.74 - lr: 0.050000 +2023-04-06 01:51:52,857 epoch 61 - iter 1855/2650 - loss 0.02346059 - time (sec): 135.54 - samples/sec: 7560.67 - lr: 0.050000 +2023-04-06 01:52:11,964 epoch 61 - iter 2120/2650 - loss 0.02365344 - time (sec): 154.65 - samples/sec: 7564.04 - lr: 0.050000 +2023-04-06 01:52:31,516 epoch 61 - iter 2385/2650 - loss 0.02360404 - time (sec): 174.20 - samples/sec: 7562.99 - lr: 0.050000 +2023-04-06 01:52:50,450 epoch 61 - iter 2650/2650 - loss 0.02365696 - time (sec): 193.14 - samples/sec: 7571.68 - lr: 0.050000 +2023-04-06 01:52:50,451 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:52:50,451 EPOCH 61 done: loss 0.0237 - lr 0.050000 +2023-04-06 01:52:50,451 BAD EPOCHS (no improvement): 0 +2023-04-06 01:52:50,454 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:53:09,375 epoch 62 - iter 265/2650 - loss 0.02199520 - time (sec): 18.92 - samples/sec: 7697.59 - lr: 0.050000 +2023-04-06 01:53:28,458 epoch 62 - iter 530/2650 - loss 0.02213204 - time (sec): 38.00 - samples/sec: 7643.91 - lr: 0.050000 +2023-04-06 01:53:48,180 epoch 62 - iter 795/2650 - loss 0.02257149 - time (sec): 57.73 - samples/sec: 7583.14 - lr: 0.050000 +2023-04-06 01:54:07,794 epoch 62 - iter 1060/2650 - loss 0.02305612 - time (sec): 77.34 - samples/sec: 7560.76 - lr: 0.050000 +2023-04-06 01:54:27,055 epoch 62 - iter 1325/2650 - loss 0.02306570 - time (sec): 96.60 - samples/sec: 7567.68 - lr: 0.050000 +2023-04-06 01:54:46,278 epoch 62 - iter 1590/2650 - loss 0.02325935 - time (sec): 115.82 - samples/sec: 7570.73 - lr: 0.050000 +2023-04-06 01:55:05,033 epoch 62 - iter 1855/2650 - loss 0.02333108 - time (sec): 134.58 - samples/sec: 7591.17 - lr: 0.050000 +2023-04-06 01:55:24,646 epoch 62 - iter 2120/2650 - loss 0.02324183 - time (sec): 154.19 - samples/sec: 7580.73 - lr: 0.050000 +2023-04-06 01:55:43,810 epoch 62 - iter 2385/2650 - loss 0.02313471 - time (sec): 173.36 - samples/sec: 7586.10 - lr: 0.050000 +2023-04-06 01:56:03,592 epoch 62 - iter 2650/2650 - loss 0.02312860 - time (sec): 193.14 - samples/sec: 7571.58 - lr: 0.050000 +2023-04-06 01:56:03,593 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:56:03,593 EPOCH 62 done: loss 0.0231 - lr 0.050000 +2023-04-06 01:56:03,593 BAD EPOCHS (no improvement): 0 +2023-04-06 01:56:03,596 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:56:22,959 epoch 63 - iter 265/2650 - loss 0.02258374 - time (sec): 19.36 - samples/sec: 7544.21 - lr: 0.050000 +2023-04-06 01:56:41,606 epoch 63 - iter 530/2650 - loss 0.02268069 - time (sec): 38.01 - samples/sec: 7580.64 - lr: 0.050000 +2023-04-06 01:57:00,821 epoch 63 - iter 795/2650 - loss 0.02266222 - time (sec): 57.22 - samples/sec: 7611.11 - lr: 0.050000 +2023-04-06 01:57:19,730 epoch 63 - iter 1060/2650 - loss 0.02299915 - time (sec): 76.13 - samples/sec: 7638.57 - lr: 0.050000 +2023-04-06 01:57:39,117 epoch 63 - iter 1325/2650 - loss 0.02301035 - time (sec): 95.52 - samples/sec: 7620.75 - lr: 0.050000 +2023-04-06 01:57:59,259 epoch 63 - iter 1590/2650 - loss 0.02327957 - time (sec): 115.66 - samples/sec: 7567.01 - lr: 0.050000 +2023-04-06 01:58:18,795 epoch 63 - iter 1855/2650 - loss 0.02326396 - time (sec): 135.20 - samples/sec: 7564.16 - lr: 0.050000 +2023-04-06 01:58:38,026 epoch 63 - iter 2120/2650 - loss 0.02342097 - time (sec): 154.43 - samples/sec: 7575.37 - lr: 0.050000 +2023-04-06 01:58:57,439 epoch 63 - iter 2385/2650 - loss 0.02347558 - time (sec): 173.84 - samples/sec: 7573.20 - lr: 0.050000 +2023-04-06 01:59:16,838 epoch 63 - iter 2650/2650 - loss 0.02347955 - time (sec): 193.24 - samples/sec: 7567.53 - lr: 0.050000 +2023-04-06 01:59:16,838 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:59:16,838 EPOCH 63 done: loss 0.0235 - lr 0.050000 +2023-04-06 01:59:16,838 BAD EPOCHS (no improvement): 1 +2023-04-06 01:59:16,842 ---------------------------------------------------------------------------------------------------- +2023-04-06 01:59:35,954 epoch 64 - iter 265/2650 - loss 0.02286926 - time (sec): 19.11 - samples/sec: 7552.47 - lr: 0.050000 +2023-04-06 01:59:55,675 epoch 64 - iter 530/2650 - loss 0.02258219 - time (sec): 38.83 - samples/sec: 7523.03 - lr: 0.050000 +2023-04-06 02:00:15,374 epoch 64 - iter 795/2650 - loss 0.02226003 - time (sec): 58.53 - samples/sec: 7498.28 - lr: 0.050000 +2023-04-06 02:00:34,600 epoch 64 - iter 1060/2650 - loss 0.02266443 - time (sec): 77.76 - samples/sec: 7534.54 - lr: 0.050000 +2023-04-06 02:00:53,993 epoch 64 - iter 1325/2650 - loss 0.02277547 - time (sec): 97.15 - samples/sec: 7517.59 - lr: 0.050000 +2023-04-06 02:01:13,129 epoch 64 - iter 1590/2650 - loss 0.02285390 - time (sec): 116.29 - samples/sec: 7538.17 - lr: 0.050000 +2023-04-06 02:01:32,920 epoch 64 - iter 1855/2650 - loss 0.02273884 - time (sec): 136.08 - samples/sec: 7528.09 - lr: 0.050000 +2023-04-06 02:01:52,455 epoch 64 - iter 2120/2650 - loss 0.02292576 - time (sec): 155.61 - samples/sec: 7523.95 - lr: 0.050000 +2023-04-06 02:02:11,476 epoch 64 - iter 2385/2650 - loss 0.02302581 - time (sec): 174.63 - samples/sec: 7537.45 - lr: 0.050000 +2023-04-06 02:02:30,604 epoch 64 - iter 2650/2650 - loss 0.02311827 - time (sec): 193.76 - samples/sec: 7547.21 - lr: 0.050000 +2023-04-06 02:02:30,605 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:02:30,605 EPOCH 64 done: loss 0.0231 - lr 0.050000 +2023-04-06 02:02:30,605 BAD EPOCHS (no improvement): 0 +2023-04-06 02:02:30,608 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:02:49,959 epoch 65 - iter 265/2650 - loss 0.02145897 - time (sec): 19.35 - samples/sec: 7592.50 - lr: 0.050000 +2023-04-06 02:03:09,235 epoch 65 - iter 530/2650 - loss 0.02177615 - time (sec): 38.63 - samples/sec: 7632.40 - lr: 0.050000 +2023-04-06 02:03:28,707 epoch 65 - iter 795/2650 - loss 0.02203147 - time (sec): 58.10 - samples/sec: 7592.61 - lr: 0.050000 +2023-04-06 02:03:48,187 epoch 65 - iter 1060/2650 - loss 0.02216671 - time (sec): 77.58 - samples/sec: 7582.59 - lr: 0.050000 +2023-04-06 02:04:07,463 epoch 65 - iter 1325/2650 - loss 0.02224406 - time (sec): 96.85 - samples/sec: 7574.96 - lr: 0.050000 +2023-04-06 02:04:27,519 epoch 65 - iter 1590/2650 - loss 0.02235511 - time (sec): 116.91 - samples/sec: 7541.14 - lr: 0.050000 +2023-04-06 02:04:46,972 epoch 65 - iter 1855/2650 - loss 0.02269270 - time (sec): 136.36 - samples/sec: 7535.08 - lr: 0.050000 +2023-04-06 02:05:05,650 epoch 65 - iter 2120/2650 - loss 0.02296573 - time (sec): 155.04 - samples/sec: 7553.61 - lr: 0.050000 +2023-04-06 02:05:24,696 epoch 65 - iter 2385/2650 - loss 0.02303537 - time (sec): 174.09 - samples/sec: 7561.03 - lr: 0.050000 +2023-04-06 02:05:44,097 epoch 65 - iter 2650/2650 - loss 0.02305247 - time (sec): 193.49 - samples/sec: 7557.88 - lr: 0.050000 +2023-04-06 02:05:44,097 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:05:44,098 EPOCH 65 done: loss 0.0231 - lr 0.050000 +2023-04-06 02:05:44,098 BAD EPOCHS (no improvement): 0 +2023-04-06 02:05:44,104 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:06:03,358 epoch 66 - iter 265/2650 - loss 0.02208292 - time (sec): 19.25 - samples/sec: 7588.07 - lr: 0.050000 +2023-04-06 02:06:22,953 epoch 66 - iter 530/2650 - loss 0.02263528 - time (sec): 38.85 - samples/sec: 7542.83 - lr: 0.050000 +2023-04-06 02:06:42,879 epoch 66 - iter 795/2650 - loss 0.02226817 - time (sec): 58.77 - samples/sec: 7504.66 - lr: 0.050000 +2023-04-06 02:07:02,304 epoch 66 - iter 1060/2650 - loss 0.02280661 - time (sec): 78.20 - samples/sec: 7498.00 - lr: 0.050000 +2023-04-06 02:07:21,646 epoch 66 - iter 1325/2650 - loss 0.02293911 - time (sec): 97.54 - samples/sec: 7509.08 - lr: 0.050000 +2023-04-06 02:07:41,504 epoch 66 - iter 1590/2650 - loss 0.02291120 - time (sec): 117.40 - samples/sec: 7479.78 - lr: 0.050000 +2023-04-06 02:08:00,381 epoch 66 - iter 1855/2650 - loss 0.02294978 - time (sec): 136.28 - samples/sec: 7515.20 - lr: 0.050000 +2023-04-06 02:08:19,847 epoch 66 - iter 2120/2650 - loss 0.02298986 - time (sec): 155.74 - samples/sec: 7508.62 - lr: 0.050000 +2023-04-06 02:08:39,638 epoch 66 - iter 2385/2650 - loss 0.02288823 - time (sec): 175.53 - samples/sec: 7504.41 - lr: 0.050000 +2023-04-06 02:08:58,978 epoch 66 - iter 2650/2650 - loss 0.02295924 - time (sec): 194.87 - samples/sec: 7504.13 - lr: 0.050000 +2023-04-06 02:08:58,979 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:08:58,979 EPOCH 66 done: loss 0.0230 - lr 0.050000 +2023-04-06 02:08:58,979 BAD EPOCHS (no improvement): 0 +2023-04-06 02:08:58,983 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:09:18,543 epoch 67 - iter 265/2650 - loss 0.02270088 - time (sec): 19.56 - samples/sec: 7542.19 - lr: 0.050000 +2023-04-06 02:09:38,184 epoch 67 - iter 530/2650 - loss 0.02266399 - time (sec): 39.20 - samples/sec: 7515.29 - lr: 0.050000 +2023-04-06 02:09:57,194 epoch 67 - iter 795/2650 - loss 0.02250087 - time (sec): 58.21 - samples/sec: 7568.40 - lr: 0.050000 +2023-04-06 02:10:16,038 epoch 67 - iter 1060/2650 - loss 0.02244498 - time (sec): 77.06 - samples/sec: 7594.56 - lr: 0.050000 +2023-04-06 02:10:35,481 epoch 67 - iter 1325/2650 - loss 0.02244627 - time (sec): 96.50 - samples/sec: 7570.32 - lr: 0.050000 +2023-04-06 02:10:54,900 epoch 67 - iter 1590/2650 - loss 0.02243636 - time (sec): 115.92 - samples/sec: 7551.17 - lr: 0.050000 +2023-04-06 02:11:14,566 epoch 67 - iter 1855/2650 - loss 0.02249549 - time (sec): 135.58 - samples/sec: 7534.42 - lr: 0.050000 +2023-04-06 02:11:34,013 epoch 67 - iter 2120/2650 - loss 0.02240109 - time (sec): 155.03 - samples/sec: 7534.93 - lr: 0.050000 +2023-04-06 02:11:53,475 epoch 67 - iter 2385/2650 - loss 0.02255590 - time (sec): 174.49 - samples/sec: 7539.04 - lr: 0.050000 +2023-04-06 02:12:13,168 epoch 67 - iter 2650/2650 - loss 0.02262329 - time (sec): 194.18 - samples/sec: 7530.77 - lr: 0.050000 +2023-04-06 02:12:13,168 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:12:13,168 EPOCH 67 done: loss 0.0226 - lr 0.050000 +2023-04-06 02:12:13,168 BAD EPOCHS (no improvement): 0 +2023-04-06 02:12:13,172 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:12:32,814 epoch 68 - iter 265/2650 - loss 0.02206876 - time (sec): 19.64 - samples/sec: 7495.31 - lr: 0.050000 +2023-04-06 02:12:52,286 epoch 68 - iter 530/2650 - loss 0.02203861 - time (sec): 39.11 - samples/sec: 7500.05 - lr: 0.050000 +2023-04-06 02:13:12,383 epoch 68 - iter 795/2650 - loss 0.02227440 - time (sec): 59.21 - samples/sec: 7442.11 - lr: 0.050000 +2023-04-06 02:13:31,791 epoch 68 - iter 1060/2650 - loss 0.02262573 - time (sec): 78.62 - samples/sec: 7470.98 - lr: 0.050000 +2023-04-06 02:13:51,208 epoch 68 - iter 1325/2650 - loss 0.02273658 - time (sec): 98.04 - samples/sec: 7491.21 - lr: 0.050000 +2023-04-06 02:14:10,333 epoch 68 - iter 1590/2650 - loss 0.02261569 - time (sec): 117.16 - samples/sec: 7496.80 - lr: 0.050000 +2023-04-06 02:14:29,564 epoch 68 - iter 1855/2650 - loss 0.02274152 - time (sec): 136.39 - samples/sec: 7508.86 - lr: 0.050000 +2023-04-06 02:14:48,371 epoch 68 - iter 2120/2650 - loss 0.02262592 - time (sec): 155.20 - samples/sec: 7519.42 - lr: 0.050000 +2023-04-06 02:15:08,258 epoch 68 - iter 2385/2650 - loss 0.02274996 - time (sec): 175.09 - samples/sec: 7505.90 - lr: 0.050000 +2023-04-06 02:15:27,863 epoch 68 - iter 2650/2650 - loss 0.02265242 - time (sec): 194.69 - samples/sec: 7511.21 - lr: 0.050000 +2023-04-06 02:15:27,863 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:15:27,863 EPOCH 68 done: loss 0.0227 - lr 0.050000 +2023-04-06 02:15:27,863 BAD EPOCHS (no improvement): 1 +2023-04-06 02:15:27,868 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:15:47,380 epoch 69 - iter 265/2650 - loss 0.02158817 - time (sec): 19.51 - samples/sec: 7505.22 - lr: 0.050000 +2023-04-06 02:16:06,515 epoch 69 - iter 530/2650 - loss 0.02168226 - time (sec): 38.65 - samples/sec: 7531.70 - lr: 0.050000 +2023-04-06 02:16:26,586 epoch 69 - iter 795/2650 - loss 0.02192219 - time (sec): 58.72 - samples/sec: 7484.84 - lr: 0.050000 +2023-04-06 02:16:45,822 epoch 69 - iter 1060/2650 - loss 0.02191979 - time (sec): 77.95 - samples/sec: 7515.55 - lr: 0.050000 +2023-04-06 02:17:05,411 epoch 69 - iter 1325/2650 - loss 0.02210794 - time (sec): 97.54 - samples/sec: 7511.52 - lr: 0.050000 +2023-04-06 02:17:24,756 epoch 69 - iter 1590/2650 - loss 0.02218762 - time (sec): 116.89 - samples/sec: 7524.19 - lr: 0.050000 +2023-04-06 02:17:44,480 epoch 69 - iter 1855/2650 - loss 0.02234665 - time (sec): 136.61 - samples/sec: 7505.18 - lr: 0.050000 +2023-04-06 02:18:03,276 epoch 69 - iter 2120/2650 - loss 0.02240301 - time (sec): 155.41 - samples/sec: 7527.95 - lr: 0.050000 +2023-04-06 02:18:22,368 epoch 69 - iter 2385/2650 - loss 0.02257441 - time (sec): 174.50 - samples/sec: 7541.12 - lr: 0.050000 +2023-04-06 02:18:42,046 epoch 69 - iter 2650/2650 - loss 0.02257588 - time (sec): 194.18 - samples/sec: 7531.03 - lr: 0.050000 +2023-04-06 02:18:42,046 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:18:42,047 EPOCH 69 done: loss 0.0226 - lr 0.050000 +2023-04-06 02:18:42,047 BAD EPOCHS (no improvement): 0 +2023-04-06 02:18:42,050 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:19:01,031 epoch 70 - iter 265/2650 - loss 0.02203687 - time (sec): 18.98 - samples/sec: 7696.80 - lr: 0.050000 +2023-04-06 02:19:20,687 epoch 70 - iter 530/2650 - loss 0.02185210 - time (sec): 38.64 - samples/sec: 7574.17 - lr: 0.050000 +2023-04-06 02:19:39,553 epoch 70 - iter 795/2650 - loss 0.02205071 - time (sec): 57.50 - samples/sec: 7618.20 - lr: 0.050000 +2023-04-06 02:19:59,726 epoch 70 - iter 1060/2650 - loss 0.02188608 - time (sec): 77.68 - samples/sec: 7535.11 - lr: 0.050000 +2023-04-06 02:20:19,575 epoch 70 - iter 1325/2650 - loss 0.02202391 - time (sec): 97.52 - samples/sec: 7516.88 - lr: 0.050000 +2023-04-06 02:20:39,578 epoch 70 - iter 1590/2650 - loss 0.02203704 - time (sec): 117.53 - samples/sec: 7483.12 - lr: 0.050000 +2023-04-06 02:20:59,101 epoch 70 - iter 1855/2650 - loss 0.02213297 - time (sec): 137.05 - samples/sec: 7482.42 - lr: 0.050000 +2023-04-06 02:21:17,841 epoch 70 - iter 2120/2650 - loss 0.02231277 - time (sec): 155.79 - samples/sec: 7514.31 - lr: 0.050000 +2023-04-06 02:21:36,651 epoch 70 - iter 2385/2650 - loss 0.02240361 - time (sec): 174.60 - samples/sec: 7536.55 - lr: 0.050000 +2023-04-06 02:21:56,093 epoch 70 - iter 2650/2650 - loss 0.02241748 - time (sec): 194.04 - samples/sec: 7536.27 - lr: 0.050000 +2023-04-06 02:21:56,094 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:21:56,094 EPOCH 70 done: loss 0.0224 - lr 0.050000 +2023-04-06 02:21:56,094 BAD EPOCHS (no improvement): 0 +2023-04-06 02:21:56,097 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:22:14,933 epoch 71 - iter 265/2650 - loss 0.02190180 - time (sec): 18.84 - samples/sec: 7672.98 - lr: 0.050000 +2023-04-06 02:22:34,378 epoch 71 - iter 530/2650 - loss 0.02177919 - time (sec): 38.28 - samples/sec: 7597.54 - lr: 0.050000 +2023-04-06 02:22:53,376 epoch 71 - iter 795/2650 - loss 0.02250363 - time (sec): 57.28 - samples/sec: 7622.24 - lr: 0.050000 +2023-04-06 02:23:12,966 epoch 71 - iter 1060/2650 - loss 0.02258949 - time (sec): 76.87 - samples/sec: 7565.81 - lr: 0.050000 +2023-04-06 02:23:32,920 epoch 71 - iter 1325/2650 - loss 0.02256175 - time (sec): 96.82 - samples/sec: 7543.42 - lr: 0.050000 +2023-04-06 02:23:52,879 epoch 71 - iter 1590/2650 - loss 0.02268694 - time (sec): 116.78 - samples/sec: 7522.15 - lr: 0.050000 +2023-04-06 02:24:11,933 epoch 71 - iter 1855/2650 - loss 0.02257947 - time (sec): 135.84 - samples/sec: 7542.70 - lr: 0.050000 +2023-04-06 02:24:31,288 epoch 71 - iter 2120/2650 - loss 0.02260316 - time (sec): 155.19 - samples/sec: 7552.96 - lr: 0.050000 +2023-04-06 02:24:50,876 epoch 71 - iter 2385/2650 - loss 0.02261346 - time (sec): 174.78 - samples/sec: 7542.28 - lr: 0.050000 +2023-04-06 02:25:10,271 epoch 71 - iter 2650/2650 - loss 0.02253409 - time (sec): 194.17 - samples/sec: 7531.20 - lr: 0.050000 +2023-04-06 02:25:10,272 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:25:10,272 EPOCH 71 done: loss 0.0225 - lr 0.050000 +2023-04-06 02:25:10,272 BAD EPOCHS (no improvement): 1 +2023-04-06 02:25:10,275 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:25:29,751 epoch 72 - iter 265/2650 - loss 0.02058375 - time (sec): 19.48 - samples/sec: 7532.05 - lr: 0.050000 +2023-04-06 02:25:49,234 epoch 72 - iter 530/2650 - loss 0.02161829 - time (sec): 38.96 - samples/sec: 7529.28 - lr: 0.050000 +2023-04-06 02:26:08,907 epoch 72 - iter 795/2650 - loss 0.02180041 - time (sec): 58.63 - samples/sec: 7512.36 - lr: 0.050000 +2023-04-06 02:26:28,079 epoch 72 - iter 1060/2650 - loss 0.02164555 - time (sec): 77.80 - samples/sec: 7543.19 - lr: 0.050000 +2023-04-06 02:26:47,524 epoch 72 - iter 1325/2650 - loss 0.02125576 - time (sec): 97.25 - samples/sec: 7538.35 - lr: 0.050000 +2023-04-06 02:27:06,980 epoch 72 - iter 1590/2650 - loss 0.02137661 - time (sec): 116.71 - samples/sec: 7540.21 - lr: 0.050000 +2023-04-06 02:27:25,804 epoch 72 - iter 1855/2650 - loss 0.02146511 - time (sec): 135.53 - samples/sec: 7564.82 - lr: 0.050000 +2023-04-06 02:27:45,028 epoch 72 - iter 2120/2650 - loss 0.02164974 - time (sec): 154.75 - samples/sec: 7559.42 - lr: 0.050000 +2023-04-06 02:28:04,262 epoch 72 - iter 2385/2650 - loss 0.02186554 - time (sec): 173.99 - samples/sec: 7557.59 - lr: 0.050000 +2023-04-06 02:28:23,415 epoch 72 - iter 2650/2650 - loss 0.02192431 - time (sec): 193.14 - samples/sec: 7571.54 - lr: 0.050000 +2023-04-06 02:28:23,415 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:28:23,415 EPOCH 72 done: loss 0.0219 - lr 0.050000 +2023-04-06 02:28:23,415 BAD EPOCHS (no improvement): 0 +2023-04-06 02:28:23,418 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:28:42,660 epoch 73 - iter 265/2650 - loss 0.02040867 - time (sec): 19.24 - samples/sec: 7601.41 - lr: 0.050000 +2023-04-06 02:29:02,420 epoch 73 - iter 530/2650 - loss 0.02108392 - time (sec): 39.00 - samples/sec: 7541.29 - lr: 0.050000 +2023-04-06 02:29:22,037 epoch 73 - iter 795/2650 - loss 0.02132792 - time (sec): 58.62 - samples/sec: 7506.55 - lr: 0.050000 +2023-04-06 02:29:41,838 epoch 73 - iter 1060/2650 - loss 0.02141061 - time (sec): 78.42 - samples/sec: 7494.64 - lr: 0.050000 +2023-04-06 02:30:01,037 epoch 73 - iter 1325/2650 - loss 0.02164467 - time (sec): 97.62 - samples/sec: 7518.71 - lr: 0.050000 +2023-04-06 02:30:20,164 epoch 73 - iter 1590/2650 - loss 0.02182246 - time (sec): 116.75 - samples/sec: 7524.69 - lr: 0.050000 +2023-04-06 02:30:39,222 epoch 73 - iter 1855/2650 - loss 0.02194189 - time (sec): 135.80 - samples/sec: 7542.48 - lr: 0.050000 +2023-04-06 02:30:58,066 epoch 73 - iter 2120/2650 - loss 0.02203676 - time (sec): 154.65 - samples/sec: 7567.84 - lr: 0.050000 +2023-04-06 02:31:17,264 epoch 73 - iter 2385/2650 - loss 0.02213209 - time (sec): 173.85 - samples/sec: 7572.98 - lr: 0.050000 +2023-04-06 02:31:36,473 epoch 73 - iter 2650/2650 - loss 0.02218015 - time (sec): 193.05 - samples/sec: 7574.87 - lr: 0.050000 +2023-04-06 02:31:36,473 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:31:36,473 EPOCH 73 done: loss 0.0222 - lr 0.050000 +2023-04-06 02:31:36,473 BAD EPOCHS (no improvement): 1 +2023-04-06 02:31:36,476 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:31:56,197 epoch 74 - iter 265/2650 - loss 0.02288612 - time (sec): 19.72 - samples/sec: 7437.45 - lr: 0.050000 +2023-04-06 02:32:15,648 epoch 74 - iter 530/2650 - loss 0.02176070 - time (sec): 39.17 - samples/sec: 7491.16 - lr: 0.050000 +2023-04-06 02:32:35,321 epoch 74 - iter 795/2650 - loss 0.02135439 - time (sec): 58.84 - samples/sec: 7462.87 - lr: 0.050000 +2023-04-06 02:32:54,653 epoch 74 - iter 1060/2650 - loss 0.02141306 - time (sec): 78.18 - samples/sec: 7500.81 - lr: 0.050000 +2023-04-06 02:33:14,067 epoch 74 - iter 1325/2650 - loss 0.02122902 - time (sec): 97.59 - samples/sec: 7505.46 - lr: 0.050000 +2023-04-06 02:33:43,049 epoch 74 - iter 1590/2650 - loss 0.02158316 - time (sec): 126.57 - samples/sec: 6956.66 - lr: 0.050000 +2023-04-06 02:34:01,816 epoch 74 - iter 1855/2650 - loss 0.02152591 - time (sec): 145.34 - samples/sec: 7056.11 - lr: 0.050000 +2023-04-06 02:34:20,988 epoch 74 - iter 2120/2650 - loss 0.02162005 - time (sec): 164.51 - samples/sec: 7117.86 - lr: 0.050000 +2023-04-06 02:34:40,162 epoch 74 - iter 2385/2650 - loss 0.02176786 - time (sec): 183.69 - samples/sec: 7170.50 - lr: 0.050000 +2023-04-06 02:34:59,047 epoch 74 - iter 2650/2650 - loss 0.02169257 - time (sec): 202.57 - samples/sec: 7219.02 - lr: 0.050000 +2023-04-06 02:34:59,047 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:34:59,047 EPOCH 74 done: loss 0.0217 - lr 0.050000 +2023-04-06 02:34:59,047 BAD EPOCHS (no improvement): 0 +2023-04-06 02:34:59,051 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:35:18,418 epoch 75 - iter 265/2650 - loss 0.02188341 - time (sec): 19.37 - samples/sec: 7538.19 - lr: 0.050000 +2023-04-06 02:35:38,179 epoch 75 - iter 530/2650 - loss 0.02203009 - time (sec): 39.13 - samples/sec: 7491.93 - lr: 0.050000 +2023-04-06 02:35:57,305 epoch 75 - iter 795/2650 - loss 0.02187496 - time (sec): 58.25 - samples/sec: 7523.01 - lr: 0.050000 +2023-04-06 02:36:16,041 epoch 75 - iter 1060/2650 - loss 0.02193217 - time (sec): 76.99 - samples/sec: 7576.77 - lr: 0.050000 +2023-04-06 02:36:35,088 epoch 75 - iter 1325/2650 - loss 0.02178260 - time (sec): 96.04 - samples/sec: 7587.68 - lr: 0.050000 +2023-04-06 02:36:54,778 epoch 75 - iter 1590/2650 - loss 0.02194509 - time (sec): 115.73 - samples/sec: 7571.82 - lr: 0.050000 +2023-04-06 02:37:13,715 epoch 75 - iter 1855/2650 - loss 0.02176340 - time (sec): 134.66 - samples/sec: 7592.99 - lr: 0.050000 +2023-04-06 02:37:33,973 epoch 75 - iter 2120/2650 - loss 0.02173343 - time (sec): 154.92 - samples/sec: 7556.28 - lr: 0.050000 +2023-04-06 02:37:52,839 epoch 75 - iter 2385/2650 - loss 0.02170370 - time (sec): 173.79 - samples/sec: 7567.58 - lr: 0.050000 +2023-04-06 02:38:12,708 epoch 75 - iter 2650/2650 - loss 0.02190977 - time (sec): 193.66 - samples/sec: 7551.32 - lr: 0.050000 +2023-04-06 02:38:12,708 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:38:12,708 EPOCH 75 done: loss 0.0219 - lr 0.050000 +2023-04-06 02:38:12,709 BAD EPOCHS (no improvement): 1 +2023-04-06 02:38:12,712 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:38:31,731 epoch 76 - iter 265/2650 - loss 0.02082060 - time (sec): 19.02 - samples/sec: 7695.36 - lr: 0.050000 +2023-04-06 02:38:50,963 epoch 76 - iter 530/2650 - loss 0.02118057 - time (sec): 38.25 - samples/sec: 7584.77 - lr: 0.050000 +2023-04-06 02:39:10,148 epoch 76 - iter 795/2650 - loss 0.02085589 - time (sec): 57.44 - samples/sec: 7594.63 - lr: 0.050000 +2023-04-06 02:39:29,430 epoch 76 - iter 1060/2650 - loss 0.02099816 - time (sec): 76.72 - samples/sec: 7619.33 - lr: 0.050000 +2023-04-06 02:39:49,204 epoch 76 - iter 1325/2650 - loss 0.02113610 - time (sec): 96.49 - samples/sec: 7593.02 - lr: 0.050000 +2023-04-06 02:40:08,216 epoch 76 - iter 1590/2650 - loss 0.02113944 - time (sec): 115.50 - samples/sec: 7601.32 - lr: 0.050000 +2023-04-06 02:40:27,793 epoch 76 - iter 1855/2650 - loss 0.02116299 - time (sec): 135.08 - samples/sec: 7587.09 - lr: 0.050000 +2023-04-06 02:40:46,902 epoch 76 - iter 2120/2650 - loss 0.02112250 - time (sec): 154.19 - samples/sec: 7582.46 - lr: 0.050000 +2023-04-06 02:41:05,938 epoch 76 - iter 2385/2650 - loss 0.02119870 - time (sec): 173.23 - samples/sec: 7591.27 - lr: 0.050000 +2023-04-06 02:41:25,549 epoch 76 - iter 2650/2650 - loss 0.02131471 - time (sec): 192.84 - samples/sec: 7583.44 - lr: 0.050000 +2023-04-06 02:41:25,549 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:41:25,549 EPOCH 76 done: loss 0.0213 - lr 0.050000 +2023-04-06 02:41:25,549 BAD EPOCHS (no improvement): 0 +2023-04-06 02:41:25,553 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:41:44,038 epoch 77 - iter 265/2650 - loss 0.02037441 - time (sec): 18.48 - samples/sec: 7805.79 - lr: 0.050000 +2023-04-06 02:42:03,501 epoch 77 - iter 530/2650 - loss 0.02150523 - time (sec): 37.95 - samples/sec: 7681.25 - lr: 0.050000 +2023-04-06 02:42:22,702 epoch 77 - iter 795/2650 - loss 0.02170566 - time (sec): 57.15 - samples/sec: 7641.01 - lr: 0.050000 +2023-04-06 02:42:41,801 epoch 77 - iter 1060/2650 - loss 0.02184497 - time (sec): 76.25 - samples/sec: 7637.36 - lr: 0.050000 +2023-04-06 02:43:01,022 epoch 77 - iter 1325/2650 - loss 0.02182261 - time (sec): 95.47 - samples/sec: 7639.35 - lr: 0.050000 +2023-04-06 02:43:20,771 epoch 77 - iter 1590/2650 - loss 0.02190412 - time (sec): 115.22 - samples/sec: 7610.74 - lr: 0.050000 +2023-04-06 02:43:40,245 epoch 77 - iter 1855/2650 - loss 0.02186369 - time (sec): 134.69 - samples/sec: 7596.49 - lr: 0.050000 +2023-04-06 02:43:59,443 epoch 77 - iter 2120/2650 - loss 0.02182253 - time (sec): 153.89 - samples/sec: 7604.75 - lr: 0.050000 +2023-04-06 02:44:18,788 epoch 77 - iter 2385/2650 - loss 0.02178251 - time (sec): 173.23 - samples/sec: 7592.76 - lr: 0.050000 +2023-04-06 02:44:38,653 epoch 77 - iter 2650/2650 - loss 0.02176863 - time (sec): 193.10 - samples/sec: 7573.12 - lr: 0.050000 +2023-04-06 02:44:38,653 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:44:38,653 EPOCH 77 done: loss 0.0218 - lr 0.050000 +2023-04-06 02:44:38,653 BAD EPOCHS (no improvement): 1 +2023-04-06 02:44:38,657 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:44:57,786 epoch 78 - iter 265/2650 - loss 0.02005819 - time (sec): 19.13 - samples/sec: 7634.22 - lr: 0.050000 +2023-04-06 02:45:17,192 epoch 78 - iter 530/2650 - loss 0.02070203 - time (sec): 38.53 - samples/sec: 7620.82 - lr: 0.050000 +2023-04-06 02:45:36,732 epoch 78 - iter 795/2650 - loss 0.02121885 - time (sec): 58.08 - samples/sec: 7586.78 - lr: 0.050000 +2023-04-06 02:45:56,151 epoch 78 - iter 1060/2650 - loss 0.02145587 - time (sec): 77.49 - samples/sec: 7571.92 - lr: 0.050000 +2023-04-06 02:46:16,077 epoch 78 - iter 1325/2650 - loss 0.02159165 - time (sec): 97.42 - samples/sec: 7535.74 - lr: 0.050000 +2023-04-06 02:46:35,260 epoch 78 - iter 1590/2650 - loss 0.02140849 - time (sec): 116.60 - samples/sec: 7542.94 - lr: 0.050000 +2023-04-06 02:46:54,581 epoch 78 - iter 1855/2650 - loss 0.02138362 - time (sec): 135.92 - samples/sec: 7552.01 - lr: 0.050000 +2023-04-06 02:47:13,846 epoch 78 - iter 2120/2650 - loss 0.02128844 - time (sec): 155.19 - samples/sec: 7555.89 - lr: 0.050000 +2023-04-06 02:47:33,078 epoch 78 - iter 2385/2650 - loss 0.02125868 - time (sec): 174.42 - samples/sec: 7556.21 - lr: 0.050000 +2023-04-06 02:47:52,259 epoch 78 - iter 2650/2650 - loss 0.02144732 - time (sec): 193.60 - samples/sec: 7553.46 - lr: 0.050000 +2023-04-06 02:47:52,259 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:47:52,259 EPOCH 78 done: loss 0.0214 - lr 0.050000 +2023-04-06 02:47:52,259 BAD EPOCHS (no improvement): 2 +2023-04-06 02:47:52,263 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:48:11,542 epoch 79 - iter 265/2650 - loss 0.02137987 - time (sec): 19.28 - samples/sec: 7635.29 - lr: 0.050000 +2023-04-06 02:48:30,890 epoch 79 - iter 530/2650 - loss 0.02108487 - time (sec): 38.63 - samples/sec: 7573.68 - lr: 0.050000 +2023-04-06 02:48:49,807 epoch 79 - iter 795/2650 - loss 0.02117952 - time (sec): 57.54 - samples/sec: 7637.53 - lr: 0.050000 +2023-04-06 02:49:08,729 epoch 79 - iter 1060/2650 - loss 0.02127776 - time (sec): 76.47 - samples/sec: 7645.05 - lr: 0.050000 +2023-04-06 02:49:28,292 epoch 79 - iter 1325/2650 - loss 0.02148286 - time (sec): 96.03 - samples/sec: 7610.92 - lr: 0.050000 +2023-04-06 02:49:47,474 epoch 79 - iter 1590/2650 - loss 0.02128983 - time (sec): 115.21 - samples/sec: 7600.67 - lr: 0.050000 +2023-04-06 02:50:07,477 epoch 79 - iter 1855/2650 - loss 0.02132846 - time (sec): 135.21 - samples/sec: 7570.59 - lr: 0.050000 +2023-04-06 02:50:26,920 epoch 79 - iter 2120/2650 - loss 0.02132384 - time (sec): 154.66 - samples/sec: 7560.13 - lr: 0.050000 +2023-04-06 02:50:46,565 epoch 79 - iter 2385/2650 - loss 0.02136009 - time (sec): 174.30 - samples/sec: 7555.75 - lr: 0.050000 +2023-04-06 02:51:05,749 epoch 79 - iter 2650/2650 - loss 0.02138881 - time (sec): 193.49 - samples/sec: 7557.98 - lr: 0.050000 +2023-04-06 02:51:05,749 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:51:05,749 EPOCH 79 done: loss 0.0214 - lr 0.050000 +2023-04-06 02:51:05,749 BAD EPOCHS (no improvement): 3 +2023-04-06 02:51:05,752 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:51:25,370 epoch 80 - iter 265/2650 - loss 0.02085673 - time (sec): 19.62 - samples/sec: 7574.79 - lr: 0.050000 +2023-04-06 02:51:45,238 epoch 80 - iter 530/2650 - loss 0.02161601 - time (sec): 39.49 - samples/sec: 7481.45 - lr: 0.050000 +2023-04-06 02:52:04,892 epoch 80 - iter 795/2650 - loss 0.02164308 - time (sec): 59.14 - samples/sec: 7509.44 - lr: 0.050000 +2023-04-06 02:52:23,525 epoch 80 - iter 1060/2650 - loss 0.02155891 - time (sec): 77.77 - samples/sec: 7570.04 - lr: 0.050000 +2023-04-06 02:52:43,442 epoch 80 - iter 1325/2650 - loss 0.02139747 - time (sec): 97.69 - samples/sec: 7524.85 - lr: 0.050000 +2023-04-06 02:53:02,386 epoch 80 - iter 1590/2650 - loss 0.02128583 - time (sec): 116.63 - samples/sec: 7542.75 - lr: 0.050000 +2023-04-06 02:53:21,223 epoch 80 - iter 1855/2650 - loss 0.02123327 - time (sec): 135.47 - samples/sec: 7568.87 - lr: 0.050000 +2023-04-06 02:53:39,954 epoch 80 - iter 2120/2650 - loss 0.02121860 - time (sec): 154.20 - samples/sec: 7579.95 - lr: 0.050000 +2023-04-06 02:53:59,345 epoch 80 - iter 2385/2650 - loss 0.02114601 - time (sec): 173.59 - samples/sec: 7582.08 - lr: 0.050000 +2023-04-06 02:54:18,721 epoch 80 - iter 2650/2650 - loss 0.02113247 - time (sec): 192.97 - samples/sec: 7578.26 - lr: 0.050000 +2023-04-06 02:54:18,721 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:54:18,721 EPOCH 80 done: loss 0.0211 - lr 0.050000 +2023-04-06 02:54:18,721 BAD EPOCHS (no improvement): 0 +2023-04-06 02:54:18,724 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:54:37,875 epoch 81 - iter 265/2650 - loss 0.02031509 - time (sec): 19.15 - samples/sec: 7562.46 - lr: 0.050000 +2023-04-06 02:54:57,385 epoch 81 - iter 530/2650 - loss 0.02033203 - time (sec): 38.66 - samples/sec: 7545.89 - lr: 0.050000 +2023-04-06 02:55:17,035 epoch 81 - iter 795/2650 - loss 0.02023107 - time (sec): 58.31 - samples/sec: 7509.93 - lr: 0.050000 +2023-04-06 02:55:36,125 epoch 81 - iter 1060/2650 - loss 0.02027924 - time (sec): 77.40 - samples/sec: 7547.45 - lr: 0.050000 +2023-04-06 02:55:55,550 epoch 81 - iter 1325/2650 - loss 0.02043279 - time (sec): 96.83 - samples/sec: 7555.71 - lr: 0.050000 +2023-04-06 02:56:15,178 epoch 81 - iter 1590/2650 - loss 0.02074000 - time (sec): 116.45 - samples/sec: 7537.63 - lr: 0.050000 +2023-04-06 02:56:34,127 epoch 81 - iter 1855/2650 - loss 0.02089810 - time (sec): 135.40 - samples/sec: 7567.10 - lr: 0.050000 +2023-04-06 02:56:53,871 epoch 81 - iter 2120/2650 - loss 0.02085589 - time (sec): 155.15 - samples/sec: 7543.74 - lr: 0.050000 +2023-04-06 02:57:12,906 epoch 81 - iter 2385/2650 - loss 0.02076801 - time (sec): 174.18 - samples/sec: 7559.36 - lr: 0.050000 +2023-04-06 02:57:32,010 epoch 81 - iter 2650/2650 - loss 0.02096402 - time (sec): 193.29 - samples/sec: 7565.82 - lr: 0.050000 +2023-04-06 02:57:32,010 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:57:32,010 EPOCH 81 done: loss 0.0210 - lr 0.050000 +2023-04-06 02:57:32,010 BAD EPOCHS (no improvement): 0 +2023-04-06 02:57:32,013 ---------------------------------------------------------------------------------------------------- +2023-04-06 02:57:51,491 epoch 82 - iter 265/2650 - loss 0.02072531 - time (sec): 19.48 - samples/sec: 7520.93 - lr: 0.050000 +2023-04-06 02:58:11,046 epoch 82 - iter 530/2650 - loss 0.02115192 - time (sec): 39.03 - samples/sec: 7508.94 - lr: 0.050000 +2023-04-06 02:58:29,977 epoch 82 - iter 795/2650 - loss 0.02117868 - time (sec): 57.96 - samples/sec: 7557.58 - lr: 0.050000 +2023-04-06 02:58:49,769 epoch 82 - iter 1060/2650 - loss 0.02084953 - time (sec): 77.75 - samples/sec: 7527.91 - lr: 0.050000 +2023-04-06 02:59:09,113 epoch 82 - iter 1325/2650 - loss 0.02079207 - time (sec): 97.10 - samples/sec: 7547.26 - lr: 0.050000 +2023-04-06 02:59:28,544 epoch 82 - iter 1590/2650 - loss 0.02084338 - time (sec): 116.53 - samples/sec: 7540.04 - lr: 0.050000 +2023-04-06 02:59:47,806 epoch 82 - iter 1855/2650 - loss 0.02089967 - time (sec): 135.79 - samples/sec: 7541.97 - lr: 0.050000 +2023-04-06 03:00:06,825 epoch 82 - iter 2120/2650 - loss 0.02095215 - time (sec): 154.81 - samples/sec: 7553.08 - lr: 0.050000 +2023-04-06 03:00:26,343 epoch 82 - iter 2385/2650 - loss 0.02084949 - time (sec): 174.33 - samples/sec: 7553.22 - lr: 0.050000 +2023-04-06 03:00:45,472 epoch 82 - iter 2650/2650 - loss 0.02068391 - time (sec): 193.46 - samples/sec: 7559.05 - lr: 0.050000 +2023-04-06 03:00:45,472 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:00:45,472 EPOCH 82 done: loss 0.0207 - lr 0.050000 +2023-04-06 03:00:45,472 BAD EPOCHS (no improvement): 0 +2023-04-06 03:00:45,476 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:01:05,218 epoch 83 - iter 265/2650 - loss 0.02074123 - time (sec): 19.74 - samples/sec: 7448.19 - lr: 0.050000 +2023-04-06 03:01:24,444 epoch 83 - iter 530/2650 - loss 0.02023541 - time (sec): 38.97 - samples/sec: 7524.14 - lr: 0.050000 +2023-04-06 03:01:43,599 epoch 83 - iter 795/2650 - loss 0.02037469 - time (sec): 58.12 - samples/sec: 7540.36 - lr: 0.050000 +2023-04-06 03:02:02,843 epoch 83 - iter 1060/2650 - loss 0.02079845 - time (sec): 77.37 - samples/sec: 7552.81 - lr: 0.050000 +2023-04-06 03:02:22,320 epoch 83 - iter 1325/2650 - loss 0.02110778 - time (sec): 96.84 - samples/sec: 7558.98 - lr: 0.050000 +2023-04-06 03:02:41,801 epoch 83 - iter 1590/2650 - loss 0.02082870 - time (sec): 116.33 - samples/sec: 7566.04 - lr: 0.050000 +2023-04-06 03:03:00,465 epoch 83 - iter 1855/2650 - loss 0.02085920 - time (sec): 134.99 - samples/sec: 7600.02 - lr: 0.050000 +2023-04-06 03:03:19,890 epoch 83 - iter 2120/2650 - loss 0.02093997 - time (sec): 154.41 - samples/sec: 7587.51 - lr: 0.050000 +2023-04-06 03:03:39,317 epoch 83 - iter 2385/2650 - loss 0.02100696 - time (sec): 173.84 - samples/sec: 7577.72 - lr: 0.050000 +2023-04-06 03:03:59,329 epoch 83 - iter 2650/2650 - loss 0.02104342 - time (sec): 193.85 - samples/sec: 7543.66 - lr: 0.050000 +2023-04-06 03:03:59,330 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:03:59,330 EPOCH 83 done: loss 0.0210 - lr 0.050000 +2023-04-06 03:03:59,330 BAD EPOCHS (no improvement): 1 +2023-04-06 03:03:59,334 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:04:19,034 epoch 84 - iter 265/2650 - loss 0.02098481 - time (sec): 19.70 - samples/sec: 7441.69 - lr: 0.050000 +2023-04-06 03:04:38,111 epoch 84 - iter 530/2650 - loss 0.02085077 - time (sec): 38.78 - samples/sec: 7507.39 - lr: 0.050000 +2023-04-06 03:04:57,534 epoch 84 - iter 795/2650 - loss 0.02060763 - time (sec): 58.20 - samples/sec: 7508.78 - lr: 0.050000 +2023-04-06 03:05:16,653 epoch 84 - iter 1060/2650 - loss 0.02075731 - time (sec): 77.32 - samples/sec: 7538.07 - lr: 0.050000 +2023-04-06 03:05:36,033 epoch 84 - iter 1325/2650 - loss 0.02108550 - time (sec): 96.70 - samples/sec: 7528.45 - lr: 0.050000 +2023-04-06 03:05:55,244 epoch 84 - iter 1590/2650 - loss 0.02114228 - time (sec): 115.91 - samples/sec: 7545.31 - lr: 0.050000 +2023-04-06 03:06:15,177 epoch 84 - iter 1855/2650 - loss 0.02101618 - time (sec): 135.84 - samples/sec: 7522.49 - lr: 0.050000 +2023-04-06 03:06:34,475 epoch 84 - iter 2120/2650 - loss 0.02116557 - time (sec): 155.14 - samples/sec: 7525.41 - lr: 0.050000 +2023-04-06 03:06:53,707 epoch 84 - iter 2385/2650 - loss 0.02113085 - time (sec): 174.37 - samples/sec: 7535.89 - lr: 0.050000 +2023-04-06 03:07:13,304 epoch 84 - iter 2650/2650 - loss 0.02118390 - time (sec): 193.97 - samples/sec: 7539.13 - lr: 0.050000 +2023-04-06 03:07:13,304 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:07:13,304 EPOCH 84 done: loss 0.0212 - lr 0.050000 +2023-04-06 03:07:13,305 BAD EPOCHS (no improvement): 2 +2023-04-06 03:07:13,308 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:07:33,233 epoch 85 - iter 265/2650 - loss 0.02052031 - time (sec): 19.92 - samples/sec: 7392.80 - lr: 0.050000 +2023-04-06 03:07:52,779 epoch 85 - iter 530/2650 - loss 0.02058148 - time (sec): 39.47 - samples/sec: 7432.20 - lr: 0.050000 +2023-04-06 03:08:11,945 epoch 85 - iter 795/2650 - loss 0.02101608 - time (sec): 58.64 - samples/sec: 7476.27 - lr: 0.050000 +2023-04-06 03:08:31,032 epoch 85 - iter 1060/2650 - loss 0.02106849 - time (sec): 77.72 - samples/sec: 7528.62 - lr: 0.050000 +2023-04-06 03:08:49,824 epoch 85 - iter 1325/2650 - loss 0.02110864 - time (sec): 96.52 - samples/sec: 7553.03 - lr: 0.050000 +2023-04-06 03:09:09,204 epoch 85 - iter 1590/2650 - loss 0.02122742 - time (sec): 115.90 - samples/sec: 7560.96 - lr: 0.050000 +2023-04-06 03:09:28,800 epoch 85 - iter 1855/2650 - loss 0.02098129 - time (sec): 135.49 - samples/sec: 7548.34 - lr: 0.050000 +2023-04-06 03:09:48,358 epoch 85 - iter 2120/2650 - loss 0.02098534 - time (sec): 155.05 - samples/sec: 7542.51 - lr: 0.050000 +2023-04-06 03:10:07,365 epoch 85 - iter 2385/2650 - loss 0.02101951 - time (sec): 174.06 - samples/sec: 7558.47 - lr: 0.050000 +2023-04-06 03:10:27,024 epoch 85 - iter 2650/2650 - loss 0.02098455 - time (sec): 193.72 - samples/sec: 7549.02 - lr: 0.050000 +2023-04-06 03:10:27,025 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:10:27,025 EPOCH 85 done: loss 0.0210 - lr 0.050000 +2023-04-06 03:10:27,025 BAD EPOCHS (no improvement): 3 +2023-04-06 03:10:27,029 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:10:46,114 epoch 86 - iter 265/2650 - loss 0.02016689 - time (sec): 19.08 - samples/sec: 7618.50 - lr: 0.050000 +2023-04-06 03:11:05,378 epoch 86 - iter 530/2650 - loss 0.02002309 - time (sec): 38.35 - samples/sec: 7595.69 - lr: 0.050000 +2023-04-06 03:11:25,165 epoch 86 - iter 795/2650 - loss 0.02004330 - time (sec): 58.14 - samples/sec: 7552.04 - lr: 0.050000 +2023-04-06 03:11:44,889 epoch 86 - iter 1060/2650 - loss 0.02052691 - time (sec): 77.86 - samples/sec: 7516.91 - lr: 0.050000 +2023-04-06 03:12:04,291 epoch 86 - iter 1325/2650 - loss 0.02051491 - time (sec): 97.26 - samples/sec: 7532.71 - lr: 0.050000 +2023-04-06 03:12:23,376 epoch 86 - iter 1590/2650 - loss 0.02042649 - time (sec): 116.35 - samples/sec: 7560.88 - lr: 0.050000 +2023-04-06 03:12:42,975 epoch 86 - iter 1855/2650 - loss 0.02071259 - time (sec): 135.95 - samples/sec: 7558.47 - lr: 0.050000 +2023-04-06 03:13:02,008 epoch 86 - iter 2120/2650 - loss 0.02079442 - time (sec): 154.98 - samples/sec: 7563.74 - lr: 0.050000 +2023-04-06 03:13:20,729 epoch 86 - iter 2385/2650 - loss 0.02077335 - time (sec): 173.70 - samples/sec: 7590.87 - lr: 0.050000 +2023-04-06 03:13:39,908 epoch 86 - iter 2650/2650 - loss 0.02087374 - time (sec): 192.88 - samples/sec: 7581.76 - lr: 0.050000 +2023-04-06 03:13:39,908 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:13:39,909 EPOCH 86 done: loss 0.0209 - lr 0.050000 +2023-04-06 03:13:39,909 Epoch 86: reducing learning rate of group 0 to 2.5000e-02. +2023-04-06 03:13:39,909 BAD EPOCHS (no improvement): 4 +2023-04-06 03:13:39,912 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:13:59,244 epoch 87 - iter 265/2650 - loss 0.01972096 - time (sec): 19.33 - samples/sec: 7599.16 - lr: 0.025000 +2023-04-06 03:14:18,836 epoch 87 - iter 530/2650 - loss 0.02021924 - time (sec): 38.92 - samples/sec: 7532.11 - lr: 0.025000 +2023-04-06 03:14:38,724 epoch 87 - iter 795/2650 - loss 0.02025133 - time (sec): 58.81 - samples/sec: 7452.60 - lr: 0.025000 +2023-04-06 03:14:57,783 epoch 87 - iter 1060/2650 - loss 0.01983906 - time (sec): 77.87 - samples/sec: 7500.80 - lr: 0.025000 +2023-04-06 03:15:17,445 epoch 87 - iter 1325/2650 - loss 0.01993750 - time (sec): 97.53 - samples/sec: 7511.42 - lr: 0.025000 +2023-04-06 03:15:36,633 epoch 87 - iter 1590/2650 - loss 0.01973408 - time (sec): 116.72 - samples/sec: 7518.21 - lr: 0.025000 +2023-04-06 03:15:55,856 epoch 87 - iter 1855/2650 - loss 0.01967572 - time (sec): 135.94 - samples/sec: 7520.00 - lr: 0.025000 +2023-04-06 03:16:15,446 epoch 87 - iter 2120/2650 - loss 0.01976136 - time (sec): 155.53 - samples/sec: 7517.87 - lr: 0.025000 +2023-04-06 03:16:34,635 epoch 87 - iter 2385/2650 - loss 0.01959570 - time (sec): 174.72 - samples/sec: 7532.82 - lr: 0.025000 +2023-04-06 03:16:54,224 epoch 87 - iter 2650/2650 - loss 0.01960481 - time (sec): 194.31 - samples/sec: 7525.85 - lr: 0.025000 +2023-04-06 03:16:54,224 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:16:54,224 EPOCH 87 done: loss 0.0196 - lr 0.025000 +2023-04-06 03:16:54,224 BAD EPOCHS (no improvement): 0 +2023-04-06 03:16:54,228 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:17:13,682 epoch 88 - iter 265/2650 - loss 0.01854281 - time (sec): 19.45 - samples/sec: 7533.88 - lr: 0.025000 +2023-04-06 03:17:33,143 epoch 88 - iter 530/2650 - loss 0.01889028 - time (sec): 38.92 - samples/sec: 7549.68 - lr: 0.025000 +2023-04-06 03:17:51,920 epoch 88 - iter 795/2650 - loss 0.01915780 - time (sec): 57.69 - samples/sec: 7628.89 - lr: 0.025000 +2023-04-06 03:18:11,425 epoch 88 - iter 1060/2650 - loss 0.01896526 - time (sec): 77.20 - samples/sec: 7602.05 - lr: 0.025000 +2023-04-06 03:18:30,447 epoch 88 - iter 1325/2650 - loss 0.01900077 - time (sec): 96.22 - samples/sec: 7617.11 - lr: 0.025000 +2023-04-06 03:18:49,519 epoch 88 - iter 1590/2650 - loss 0.01920954 - time (sec): 115.29 - samples/sec: 7615.15 - lr: 0.025000 +2023-04-06 03:19:09,761 epoch 88 - iter 1855/2650 - loss 0.01920469 - time (sec): 135.53 - samples/sec: 7570.49 - lr: 0.025000 +2023-04-06 03:19:28,581 epoch 88 - iter 2120/2650 - loss 0.01913455 - time (sec): 154.35 - samples/sec: 7588.94 - lr: 0.025000 +2023-04-06 03:19:48,277 epoch 88 - iter 2385/2650 - loss 0.01914383 - time (sec): 174.05 - samples/sec: 7568.17 - lr: 0.025000 +2023-04-06 03:20:07,844 epoch 88 - iter 2650/2650 - loss 0.01906583 - time (sec): 193.62 - samples/sec: 7552.90 - lr: 0.025000 +2023-04-06 03:20:07,844 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:20:07,844 EPOCH 88 done: loss 0.0191 - lr 0.025000 +2023-04-06 03:20:07,844 BAD EPOCHS (no improvement): 0 +2023-04-06 03:20:07,848 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:20:27,876 epoch 89 - iter 265/2650 - loss 0.01783701 - time (sec): 20.03 - samples/sec: 7318.19 - lr: 0.025000 +2023-04-06 03:20:47,167 epoch 89 - iter 530/2650 - loss 0.01839823 - time (sec): 39.32 - samples/sec: 7421.99 - lr: 0.025000 +2023-04-06 03:21:06,504 epoch 89 - iter 795/2650 - loss 0.01853782 - time (sec): 58.66 - samples/sec: 7469.32 - lr: 0.025000 +2023-04-06 03:21:25,597 epoch 89 - iter 1060/2650 - loss 0.01832282 - time (sec): 77.75 - samples/sec: 7524.75 - lr: 0.025000 +2023-04-06 03:21:45,013 epoch 89 - iter 1325/2650 - loss 0.01843820 - time (sec): 97.16 - samples/sec: 7510.41 - lr: 0.025000 +2023-04-06 03:22:04,519 epoch 89 - iter 1590/2650 - loss 0.01826992 - time (sec): 116.67 - samples/sec: 7519.06 - lr: 0.025000 +2023-04-06 03:22:24,043 epoch 89 - iter 1855/2650 - loss 0.01829987 - time (sec): 136.20 - samples/sec: 7512.48 - lr: 0.025000 +2023-04-06 03:22:43,445 epoch 89 - iter 2120/2650 - loss 0.01844779 - time (sec): 155.60 - samples/sec: 7523.58 - lr: 0.025000 +2023-04-06 03:23:02,101 epoch 89 - iter 2385/2650 - loss 0.01843164 - time (sec): 174.25 - samples/sec: 7559.16 - lr: 0.025000 +2023-04-06 03:23:21,038 epoch 89 - iter 2650/2650 - loss 0.01851785 - time (sec): 193.19 - samples/sec: 7569.59 - lr: 0.025000 +2023-04-06 03:23:21,038 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:23:21,038 EPOCH 89 done: loss 0.0185 - lr 0.025000 +2023-04-06 03:23:21,038 BAD EPOCHS (no improvement): 0 +2023-04-06 03:23:21,041 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:23:39,416 epoch 90 - iter 265/2650 - loss 0.01791392 - time (sec): 18.37 - samples/sec: 7864.03 - lr: 0.025000 +2023-04-06 03:24:08,280 epoch 90 - iter 530/2650 - loss 0.01830173 - time (sec): 47.24 - samples/sec: 6156.15 - lr: 0.025000 +2023-04-06 03:24:27,807 epoch 90 - iter 795/2650 - loss 0.01866672 - time (sec): 66.77 - samples/sec: 6558.85 - lr: 0.025000 +2023-04-06 03:24:47,135 epoch 90 - iter 1060/2650 - loss 0.01888757 - time (sec): 86.09 - samples/sec: 6790.83 - lr: 0.025000 +2023-04-06 03:25:07,035 epoch 90 - iter 1325/2650 - loss 0.01931051 - time (sec): 105.99 - samples/sec: 6916.52 - lr: 0.025000 +2023-04-06 03:25:26,306 epoch 90 - iter 1590/2650 - loss 0.01911919 - time (sec): 125.26 - samples/sec: 7020.37 - lr: 0.025000 +2023-04-06 03:25:45,105 epoch 90 - iter 1855/2650 - loss 0.01899358 - time (sec): 144.06 - samples/sec: 7098.02 - lr: 0.025000 +2023-04-06 03:26:04,431 epoch 90 - iter 2120/2650 - loss 0.01896251 - time (sec): 163.39 - samples/sec: 7155.28 - lr: 0.025000 +2023-04-06 03:26:24,084 epoch 90 - iter 2385/2650 - loss 0.01893267 - time (sec): 183.04 - samples/sec: 7184.12 - lr: 0.025000 +2023-04-06 03:26:43,438 epoch 90 - iter 2650/2650 - loss 0.01876960 - time (sec): 202.40 - samples/sec: 7225.24 - lr: 0.025000 +2023-04-06 03:26:43,438 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:26:43,438 EPOCH 90 done: loss 0.0188 - lr 0.025000 +2023-04-06 03:26:43,438 BAD EPOCHS (no improvement): 1 +2023-04-06 03:26:43,441 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:27:02,338 epoch 91 - iter 265/2650 - loss 0.01871084 - time (sec): 18.90 - samples/sec: 7678.69 - lr: 0.025000 +2023-04-06 03:27:20,944 epoch 91 - iter 530/2650 - loss 0.01844487 - time (sec): 37.50 - samples/sec: 7710.32 - lr: 0.025000 +2023-04-06 03:27:40,106 epoch 91 - iter 795/2650 - loss 0.01826494 - time (sec): 56.66 - samples/sec: 7679.37 - lr: 0.025000 +2023-04-06 03:27:59,168 epoch 91 - iter 1060/2650 - loss 0.01803990 - time (sec): 75.73 - samples/sec: 7678.00 - lr: 0.025000 +2023-04-06 03:28:18,968 epoch 91 - iter 1325/2650 - loss 0.01825044 - time (sec): 95.53 - samples/sec: 7627.99 - lr: 0.025000 +2023-04-06 03:28:38,079 epoch 91 - iter 1590/2650 - loss 0.01821903 - time (sec): 114.64 - samples/sec: 7620.24 - lr: 0.025000 +2023-04-06 03:28:57,989 epoch 91 - iter 1855/2650 - loss 0.01843527 - time (sec): 134.55 - samples/sec: 7603.36 - lr: 0.025000 +2023-04-06 03:29:17,613 epoch 91 - iter 2120/2650 - loss 0.01848703 - time (sec): 154.17 - samples/sec: 7593.27 - lr: 0.025000 +2023-04-06 03:29:37,045 epoch 91 - iter 2385/2650 - loss 0.01854293 - time (sec): 173.60 - samples/sec: 7590.28 - lr: 0.025000 +2023-04-06 03:29:56,019 epoch 91 - iter 2650/2650 - loss 0.01852900 - time (sec): 192.58 - samples/sec: 7593.64 - lr: 0.025000 +2023-04-06 03:29:56,019 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:29:56,019 EPOCH 91 done: loss 0.0185 - lr 0.025000 +2023-04-06 03:29:56,019 BAD EPOCHS (no improvement): 2 +2023-04-06 03:29:56,023 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:30:15,675 epoch 92 - iter 265/2650 - loss 0.01765611 - time (sec): 19.65 - samples/sec: 7349.68 - lr: 0.025000 +2023-04-06 03:30:35,010 epoch 92 - iter 530/2650 - loss 0.01807907 - time (sec): 38.99 - samples/sec: 7476.03 - lr: 0.025000 +2023-04-06 03:30:54,183 epoch 92 - iter 795/2650 - loss 0.01799083 - time (sec): 58.16 - samples/sec: 7540.31 - lr: 0.025000 +2023-04-06 03:31:14,016 epoch 92 - iter 1060/2650 - loss 0.01819708 - time (sec): 77.99 - samples/sec: 7506.73 - lr: 0.025000 +2023-04-06 03:31:33,486 epoch 92 - iter 1325/2650 - loss 0.01842859 - time (sec): 97.46 - samples/sec: 7504.91 - lr: 0.025000 +2023-04-06 03:31:52,733 epoch 92 - iter 1590/2650 - loss 0.01829982 - time (sec): 116.71 - samples/sec: 7524.04 - lr: 0.025000 +2023-04-06 03:32:11,655 epoch 92 - iter 1855/2650 - loss 0.01844895 - time (sec): 135.63 - samples/sec: 7543.81 - lr: 0.025000 +2023-04-06 03:32:30,757 epoch 92 - iter 2120/2650 - loss 0.01833490 - time (sec): 154.73 - samples/sec: 7557.65 - lr: 0.025000 +2023-04-06 03:32:50,151 epoch 92 - iter 2385/2650 - loss 0.01825138 - time (sec): 174.13 - samples/sec: 7561.44 - lr: 0.025000 +2023-04-06 03:33:09,239 epoch 92 - iter 2650/2650 - loss 0.01821018 - time (sec): 193.22 - samples/sec: 7568.56 - lr: 0.025000 +2023-04-06 03:33:09,239 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:33:09,239 EPOCH 92 done: loss 0.0182 - lr 0.025000 +2023-04-06 03:33:09,239 BAD EPOCHS (no improvement): 0 +2023-04-06 03:33:09,243 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:33:28,395 epoch 93 - iter 265/2650 - loss 0.01813219 - time (sec): 19.15 - samples/sec: 7659.04 - lr: 0.025000 +2023-04-06 03:33:47,818 epoch 93 - iter 530/2650 - loss 0.01819734 - time (sec): 38.57 - samples/sec: 7615.66 - lr: 0.025000 +2023-04-06 03:34:07,376 epoch 93 - iter 795/2650 - loss 0.01843689 - time (sec): 58.13 - samples/sec: 7577.98 - lr: 0.025000 +2023-04-06 03:34:26,191 epoch 93 - iter 1060/2650 - loss 0.01808521 - time (sec): 76.95 - samples/sec: 7591.28 - lr: 0.025000 +2023-04-06 03:34:45,098 epoch 93 - iter 1325/2650 - loss 0.01813144 - time (sec): 95.85 - samples/sec: 7621.03 - lr: 0.025000 +2023-04-06 03:35:04,413 epoch 93 - iter 1590/2650 - loss 0.01802458 - time (sec): 115.17 - samples/sec: 7615.69 - lr: 0.025000 +2023-04-06 03:35:23,887 epoch 93 - iter 1855/2650 - loss 0.01805462 - time (sec): 134.64 - samples/sec: 7608.42 - lr: 0.025000 +2023-04-06 03:35:43,266 epoch 93 - iter 2120/2650 - loss 0.01814312 - time (sec): 154.02 - samples/sec: 7602.00 - lr: 0.025000 +2023-04-06 03:36:02,471 epoch 93 - iter 2385/2650 - loss 0.01831666 - time (sec): 173.23 - samples/sec: 7594.17 - lr: 0.025000 +2023-04-06 03:36:22,116 epoch 93 - iter 2650/2650 - loss 0.01820257 - time (sec): 192.87 - samples/sec: 7582.03 - lr: 0.025000 +2023-04-06 03:36:22,116 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:36:22,116 EPOCH 93 done: loss 0.0182 - lr 0.025000 +2023-04-06 03:36:22,116 BAD EPOCHS (no improvement): 0 +2023-04-06 03:36:22,120 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:36:41,318 epoch 94 - iter 265/2650 - loss 0.01711928 - time (sec): 19.20 - samples/sec: 7532.56 - lr: 0.025000 +2023-04-06 03:37:00,262 epoch 94 - iter 530/2650 - loss 0.01787308 - time (sec): 38.14 - samples/sec: 7594.06 - lr: 0.025000 +2023-04-06 03:37:19,627 epoch 94 - iter 795/2650 - loss 0.01805023 - time (sec): 57.51 - samples/sec: 7597.37 - lr: 0.025000 +2023-04-06 03:37:38,814 epoch 94 - iter 1060/2650 - loss 0.01790143 - time (sec): 76.69 - samples/sec: 7591.23 - lr: 0.025000 +2023-04-06 03:37:58,362 epoch 94 - iter 1325/2650 - loss 0.01803606 - time (sec): 96.24 - samples/sec: 7579.72 - lr: 0.025000 +2023-04-06 03:38:17,969 epoch 94 - iter 1590/2650 - loss 0.01791083 - time (sec): 115.85 - samples/sec: 7557.05 - lr: 0.025000 +2023-04-06 03:38:37,230 epoch 94 - iter 1855/2650 - loss 0.01786170 - time (sec): 135.11 - samples/sec: 7561.42 - lr: 0.025000 +2023-04-06 03:38:56,894 epoch 94 - iter 2120/2650 - loss 0.01793272 - time (sec): 154.77 - samples/sec: 7549.65 - lr: 0.025000 +2023-04-06 03:39:16,332 epoch 94 - iter 2385/2650 - loss 0.01802128 - time (sec): 174.21 - samples/sec: 7551.15 - lr: 0.025000 +2023-04-06 03:39:35,760 epoch 94 - iter 2650/2650 - loss 0.01797402 - time (sec): 193.64 - samples/sec: 7551.98 - lr: 0.025000 +2023-04-06 03:39:35,761 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:39:35,761 EPOCH 94 done: loss 0.0180 - lr 0.025000 +2023-04-06 03:39:35,761 BAD EPOCHS (no improvement): 0 +2023-04-06 03:39:35,765 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:39:55,059 epoch 95 - iter 265/2650 - loss 0.01790416 - time (sec): 19.29 - samples/sec: 7557.57 - lr: 0.025000 +2023-04-06 03:40:14,274 epoch 95 - iter 530/2650 - loss 0.01731565 - time (sec): 38.51 - samples/sec: 7560.72 - lr: 0.025000 +2023-04-06 03:40:33,909 epoch 95 - iter 795/2650 - loss 0.01791248 - time (sec): 58.14 - samples/sec: 7508.33 - lr: 0.025000 +2023-04-06 03:40:53,791 epoch 95 - iter 1060/2650 - loss 0.01808322 - time (sec): 78.03 - samples/sec: 7483.79 - lr: 0.025000 +2023-04-06 03:41:12,789 epoch 95 - iter 1325/2650 - loss 0.01797099 - time (sec): 97.02 - samples/sec: 7517.48 - lr: 0.025000 +2023-04-06 03:41:31,863 epoch 95 - iter 1590/2650 - loss 0.01792932 - time (sec): 116.10 - samples/sec: 7548.10 - lr: 0.025000 +2023-04-06 03:41:51,382 epoch 95 - iter 1855/2650 - loss 0.01800752 - time (sec): 135.62 - samples/sec: 7546.39 - lr: 0.025000 +2023-04-06 03:42:10,965 epoch 95 - iter 2120/2650 - loss 0.01803854 - time (sec): 155.20 - samples/sec: 7533.71 - lr: 0.025000 +2023-04-06 03:42:30,075 epoch 95 - iter 2385/2650 - loss 0.01798750 - time (sec): 174.31 - samples/sec: 7549.28 - lr: 0.025000 +2023-04-06 03:42:49,093 epoch 95 - iter 2650/2650 - loss 0.01811374 - time (sec): 193.33 - samples/sec: 7564.15 - lr: 0.025000 +2023-04-06 03:42:49,094 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:42:49,094 EPOCH 95 done: loss 0.0181 - lr 0.025000 +2023-04-06 03:42:49,094 BAD EPOCHS (no improvement): 1 +2023-04-06 03:42:49,098 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:43:08,404 epoch 96 - iter 265/2650 - loss 0.01810625 - time (sec): 19.31 - samples/sec: 7551.71 - lr: 0.025000 +2023-04-06 03:43:27,540 epoch 96 - iter 530/2650 - loss 0.01815441 - time (sec): 38.44 - samples/sec: 7588.52 - lr: 0.025000 +2023-04-06 03:43:47,347 epoch 96 - iter 795/2650 - loss 0.01773251 - time (sec): 58.25 - samples/sec: 7530.07 - lr: 0.025000 +2023-04-06 03:44:06,042 epoch 96 - iter 1060/2650 - loss 0.01791772 - time (sec): 76.94 - samples/sec: 7587.15 - lr: 0.025000 +2023-04-06 03:44:25,513 epoch 96 - iter 1325/2650 - loss 0.01809560 - time (sec): 96.41 - samples/sec: 7588.94 - lr: 0.025000 +2023-04-06 03:44:44,972 epoch 96 - iter 1590/2650 - loss 0.01810324 - time (sec): 115.87 - samples/sec: 7574.38 - lr: 0.025000 +2023-04-06 03:45:04,707 epoch 96 - iter 1855/2650 - loss 0.01827558 - time (sec): 135.61 - samples/sec: 7558.64 - lr: 0.025000 +2023-04-06 03:45:24,257 epoch 96 - iter 2120/2650 - loss 0.01821144 - time (sec): 155.16 - samples/sec: 7547.39 - lr: 0.025000 +2023-04-06 03:45:43,890 epoch 96 - iter 2385/2650 - loss 0.01803239 - time (sec): 174.79 - samples/sec: 7534.69 - lr: 0.025000 +2023-04-06 03:46:02,768 epoch 96 - iter 2650/2650 - loss 0.01790687 - time (sec): 193.67 - samples/sec: 7550.79 - lr: 0.025000 +2023-04-06 03:46:02,769 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:46:02,769 EPOCH 96 done: loss 0.0179 - lr 0.025000 +2023-04-06 03:46:02,769 BAD EPOCHS (no improvement): 0 +2023-04-06 03:46:02,772 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:46:21,808 epoch 97 - iter 265/2650 - loss 0.01842335 - time (sec): 19.04 - samples/sec: 7651.18 - lr: 0.025000 +2023-04-06 03:46:40,904 epoch 97 - iter 530/2650 - loss 0.01836702 - time (sec): 38.13 - samples/sec: 7624.98 - lr: 0.025000 +2023-04-06 03:46:59,787 epoch 97 - iter 795/2650 - loss 0.01766383 - time (sec): 57.01 - samples/sec: 7684.09 - lr: 0.025000 +2023-04-06 03:47:19,214 epoch 97 - iter 1060/2650 - loss 0.01778333 - time (sec): 76.44 - samples/sec: 7635.82 - lr: 0.025000 +2023-04-06 03:47:38,205 epoch 97 - iter 1325/2650 - loss 0.01764984 - time (sec): 95.43 - samples/sec: 7646.86 - lr: 0.025000 +2023-04-06 03:47:57,910 epoch 97 - iter 1590/2650 - loss 0.01779518 - time (sec): 115.14 - samples/sec: 7607.87 - lr: 0.025000 +2023-04-06 03:48:17,644 epoch 97 - iter 1855/2650 - loss 0.01777098 - time (sec): 134.87 - samples/sec: 7580.50 - lr: 0.025000 +2023-04-06 03:48:36,952 epoch 97 - iter 2120/2650 - loss 0.01778203 - time (sec): 154.18 - samples/sec: 7575.63 - lr: 0.025000 +2023-04-06 03:48:56,316 epoch 97 - iter 2385/2650 - loss 0.01781730 - time (sec): 173.54 - samples/sec: 7577.50 - lr: 0.025000 +2023-04-06 03:49:16,281 epoch 97 - iter 2650/2650 - loss 0.01778663 - time (sec): 193.51 - samples/sec: 7557.11 - lr: 0.025000 +2023-04-06 03:49:16,281 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:49:16,281 EPOCH 97 done: loss 0.0178 - lr 0.025000 +2023-04-06 03:49:16,281 BAD EPOCHS (no improvement): 0 +2023-04-06 03:49:16,285 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:49:35,582 epoch 98 - iter 265/2650 - loss 0.01873937 - time (sec): 19.30 - samples/sec: 7534.37 - lr: 0.025000 +2023-04-06 03:49:54,804 epoch 98 - iter 530/2650 - loss 0.01764710 - time (sec): 38.52 - samples/sec: 7580.86 - lr: 0.025000 +2023-04-06 03:50:14,042 epoch 98 - iter 795/2650 - loss 0.01768454 - time (sec): 57.76 - samples/sec: 7588.24 - lr: 0.025000 +2023-04-06 03:50:33,263 epoch 98 - iter 1060/2650 - loss 0.01774067 - time (sec): 76.98 - samples/sec: 7603.12 - lr: 0.025000 +2023-04-06 03:50:52,872 epoch 98 - iter 1325/2650 - loss 0.01775046 - time (sec): 96.59 - samples/sec: 7571.95 - lr: 0.025000 +2023-04-06 03:51:12,010 epoch 98 - iter 1590/2650 - loss 0.01765197 - time (sec): 115.72 - samples/sec: 7574.35 - lr: 0.025000 +2023-04-06 03:51:31,442 epoch 98 - iter 1855/2650 - loss 0.01765816 - time (sec): 135.16 - samples/sec: 7570.01 - lr: 0.025000 +2023-04-06 03:51:50,361 epoch 98 - iter 2120/2650 - loss 0.01758818 - time (sec): 154.08 - samples/sec: 7585.09 - lr: 0.025000 +2023-04-06 03:52:09,653 epoch 98 - iter 2385/2650 - loss 0.01754489 - time (sec): 173.37 - samples/sec: 7587.51 - lr: 0.025000 +2023-04-06 03:52:29,103 epoch 98 - iter 2650/2650 - loss 0.01757753 - time (sec): 192.82 - samples/sec: 7584.16 - lr: 0.025000 +2023-04-06 03:52:29,103 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:52:29,103 EPOCH 98 done: loss 0.0176 - lr 0.025000 +2023-04-06 03:52:29,103 BAD EPOCHS (no improvement): 0 +2023-04-06 03:52:29,107 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:52:48,533 epoch 99 - iter 265/2650 - loss 0.01717458 - time (sec): 19.43 - samples/sec: 7514.37 - lr: 0.025000 +2023-04-06 03:53:08,232 epoch 99 - iter 530/2650 - loss 0.01716876 - time (sec): 39.12 - samples/sec: 7477.50 - lr: 0.025000 +2023-04-06 03:53:27,878 epoch 99 - iter 795/2650 - loss 0.01756395 - time (sec): 58.77 - samples/sec: 7486.66 - lr: 0.025000 +2023-04-06 03:53:47,273 epoch 99 - iter 1060/2650 - loss 0.01735170 - time (sec): 78.17 - samples/sec: 7502.60 - lr: 0.025000 +2023-04-06 03:54:06,939 epoch 99 - iter 1325/2650 - loss 0.01725931 - time (sec): 97.83 - samples/sec: 7476.96 - lr: 0.025000 +2023-04-06 03:54:26,141 epoch 99 - iter 1590/2650 - loss 0.01742408 - time (sec): 117.03 - samples/sec: 7498.20 - lr: 0.025000 +2023-04-06 03:54:45,480 epoch 99 - iter 1855/2650 - loss 0.01750477 - time (sec): 136.37 - samples/sec: 7509.30 - lr: 0.025000 +2023-04-06 03:55:04,472 epoch 99 - iter 2120/2650 - loss 0.01758883 - time (sec): 155.37 - samples/sec: 7527.48 - lr: 0.025000 +2023-04-06 03:55:23,893 epoch 99 - iter 2385/2650 - loss 0.01747955 - time (sec): 174.79 - samples/sec: 7534.47 - lr: 0.025000 +2023-04-06 03:55:42,700 epoch 99 - iter 2650/2650 - loss 0.01750235 - time (sec): 193.59 - samples/sec: 7553.81 - lr: 0.025000 +2023-04-06 03:55:42,700 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:55:42,700 EPOCH 99 done: loss 0.0175 - lr 0.025000 +2023-04-06 03:55:42,700 BAD EPOCHS (no improvement): 0 +2023-04-06 03:55:42,703 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:56:01,924 epoch 100 - iter 265/2650 - loss 0.01653783 - time (sec): 19.22 - samples/sec: 7591.19 - lr: 0.025000 +2023-04-06 03:56:20,775 epoch 100 - iter 530/2650 - loss 0.01675143 - time (sec): 38.07 - samples/sec: 7645.45 - lr: 0.025000 +2023-04-06 03:56:40,019 epoch 100 - iter 795/2650 - loss 0.01721218 - time (sec): 57.32 - samples/sec: 7636.22 - lr: 0.025000 +2023-04-06 03:56:59,734 epoch 100 - iter 1060/2650 - loss 0.01744620 - time (sec): 77.03 - samples/sec: 7574.79 - lr: 0.025000 +2023-04-06 03:57:20,084 epoch 100 - iter 1325/2650 - loss 0.01772068 - time (sec): 97.38 - samples/sec: 7512.66 - lr: 0.025000 +2023-04-06 03:57:39,413 epoch 100 - iter 1590/2650 - loss 0.01755216 - time (sec): 116.71 - samples/sec: 7520.37 - lr: 0.025000 +2023-04-06 03:57:58,445 epoch 100 - iter 1855/2650 - loss 0.01745576 - time (sec): 135.74 - samples/sec: 7545.76 - lr: 0.025000 +2023-04-06 03:58:17,193 epoch 100 - iter 2120/2650 - loss 0.01750841 - time (sec): 154.49 - samples/sec: 7568.44 - lr: 0.025000 +2023-04-06 03:58:36,863 epoch 100 - iter 2385/2650 - loss 0.01759284 - time (sec): 174.16 - samples/sec: 7551.47 - lr: 0.025000 +2023-04-06 03:58:56,527 epoch 100 - iter 2650/2650 - loss 0.01757857 - time (sec): 193.82 - samples/sec: 7544.83 - lr: 0.025000 +2023-04-06 03:58:56,527 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:58:56,527 EPOCH 100 done: loss 0.0176 - lr 0.025000 +2023-04-06 03:58:56,527 BAD EPOCHS (no improvement): 1 +2023-04-06 03:58:56,530 ---------------------------------------------------------------------------------------------------- +2023-04-06 03:59:16,593 epoch 101 - iter 265/2650 - loss 0.01708355 - time (sec): 20.06 - samples/sec: 7356.97 - lr: 0.025000 +2023-04-06 03:59:36,126 epoch 101 - iter 530/2650 - loss 0.01676864 - time (sec): 39.60 - samples/sec: 7424.09 - lr: 0.025000 +2023-04-06 03:59:55,855 epoch 101 - iter 795/2650 - loss 0.01737744 - time (sec): 59.33 - samples/sec: 7443.52 - lr: 0.025000 +2023-04-06 04:00:14,915 epoch 101 - iter 1060/2650 - loss 0.01718627 - time (sec): 78.39 - samples/sec: 7492.13 - lr: 0.025000 +2023-04-06 04:00:34,324 epoch 101 - iter 1325/2650 - loss 0.01738846 - time (sec): 97.79 - samples/sec: 7485.67 - lr: 0.025000 +2023-04-06 04:00:53,518 epoch 101 - iter 1590/2650 - loss 0.01738547 - time (sec): 116.99 - samples/sec: 7505.97 - lr: 0.025000 +2023-04-06 04:01:12,622 epoch 101 - iter 1855/2650 - loss 0.01723389 - time (sec): 136.09 - samples/sec: 7507.76 - lr: 0.025000 +2023-04-06 04:01:31,829 epoch 101 - iter 2120/2650 - loss 0.01720360 - time (sec): 155.30 - samples/sec: 7521.89 - lr: 0.025000 +2023-04-06 04:01:52,037 epoch 101 - iter 2385/2650 - loss 0.01715515 - time (sec): 175.51 - samples/sec: 7496.87 - lr: 0.025000 +2023-04-06 04:02:11,900 epoch 101 - iter 2650/2650 - loss 0.01716259 - time (sec): 195.37 - samples/sec: 7485.07 - lr: 0.025000 +2023-04-06 04:02:11,901 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:02:11,901 EPOCH 101 done: loss 0.0172 - lr 0.025000 +2023-04-06 04:02:11,901 BAD EPOCHS (no improvement): 0 +2023-04-06 04:02:11,905 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:02:31,292 epoch 102 - iter 265/2650 - loss 0.01771113 - time (sec): 19.39 - samples/sec: 7562.66 - lr: 0.025000 +2023-04-06 04:02:50,751 epoch 102 - iter 530/2650 - loss 0.01683032 - time (sec): 38.85 - samples/sec: 7549.14 - lr: 0.025000 +2023-04-06 04:03:10,579 epoch 102 - iter 795/2650 - loss 0.01718120 - time (sec): 58.67 - samples/sec: 7475.45 - lr: 0.025000 +2023-04-06 04:03:29,851 epoch 102 - iter 1060/2650 - loss 0.01712816 - time (sec): 77.95 - samples/sec: 7502.14 - lr: 0.025000 +2023-04-06 04:03:49,513 epoch 102 - iter 1325/2650 - loss 0.01701223 - time (sec): 97.61 - samples/sec: 7493.42 - lr: 0.025000 +2023-04-06 04:04:08,672 epoch 102 - iter 1590/2650 - loss 0.01708399 - time (sec): 116.77 - samples/sec: 7505.23 - lr: 0.025000 +2023-04-06 04:04:28,038 epoch 102 - iter 1855/2650 - loss 0.01709347 - time (sec): 136.13 - samples/sec: 7521.19 - lr: 0.025000 +2023-04-06 04:04:47,120 epoch 102 - iter 2120/2650 - loss 0.01708681 - time (sec): 155.21 - samples/sec: 7543.42 - lr: 0.025000 +2023-04-06 04:05:06,751 epoch 102 - iter 2385/2650 - loss 0.01710372 - time (sec): 174.85 - samples/sec: 7529.01 - lr: 0.025000 +2023-04-06 04:05:26,431 epoch 102 - iter 2650/2650 - loss 0.01713520 - time (sec): 194.53 - samples/sec: 7517.55 - lr: 0.025000 +2023-04-06 04:05:26,432 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:05:26,432 EPOCH 102 done: loss 0.0171 - lr 0.025000 +2023-04-06 04:05:26,432 BAD EPOCHS (no improvement): 0 +2023-04-06 04:05:26,436 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:05:46,838 epoch 103 - iter 265/2650 - loss 0.01693677 - time (sec): 20.40 - samples/sec: 7235.82 - lr: 0.025000 +2023-04-06 04:06:05,956 epoch 103 - iter 530/2650 - loss 0.01693291 - time (sec): 39.52 - samples/sec: 7412.55 - lr: 0.025000 +2023-04-06 04:06:25,030 epoch 103 - iter 795/2650 - loss 0.01713680 - time (sec): 58.59 - samples/sec: 7476.81 - lr: 0.025000 +2023-04-06 04:06:44,335 epoch 103 - iter 1060/2650 - loss 0.01710151 - time (sec): 77.90 - samples/sec: 7478.01 - lr: 0.025000 +2023-04-06 04:07:04,468 epoch 103 - iter 1325/2650 - loss 0.01730369 - time (sec): 98.03 - samples/sec: 7437.24 - lr: 0.025000 +2023-04-06 04:07:23,745 epoch 103 - iter 1590/2650 - loss 0.01727228 - time (sec): 117.31 - samples/sec: 7464.26 - lr: 0.025000 +2023-04-06 04:07:43,283 epoch 103 - iter 1855/2650 - loss 0.01722724 - time (sec): 136.85 - samples/sec: 7477.51 - lr: 0.025000 +2023-04-06 04:08:02,896 epoch 103 - iter 2120/2650 - loss 0.01716343 - time (sec): 156.46 - samples/sec: 7476.75 - lr: 0.025000 +2023-04-06 04:08:22,176 epoch 103 - iter 2385/2650 - loss 0.01711566 - time (sec): 175.74 - samples/sec: 7495.27 - lr: 0.025000 +2023-04-06 04:08:41,029 epoch 103 - iter 2650/2650 - loss 0.01716014 - time (sec): 194.59 - samples/sec: 7514.97 - lr: 0.025000 +2023-04-06 04:08:41,029 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:08:41,029 EPOCH 103 done: loss 0.0172 - lr 0.025000 +2023-04-06 04:08:41,029 BAD EPOCHS (no improvement): 1 +2023-04-06 04:08:41,033 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:09:01,535 epoch 104 - iter 265/2650 - loss 0.01693417 - time (sec): 20.50 - samples/sec: 7155.75 - lr: 0.025000 +2023-04-06 04:09:20,609 epoch 104 - iter 530/2650 - loss 0.01685370 - time (sec): 39.58 - samples/sec: 7400.11 - lr: 0.025000 +2023-04-06 04:09:39,567 epoch 104 - iter 795/2650 - loss 0.01692015 - time (sec): 58.53 - samples/sec: 7498.01 - lr: 0.025000 +2023-04-06 04:09:59,074 epoch 104 - iter 1060/2650 - loss 0.01705000 - time (sec): 78.04 - samples/sec: 7488.39 - lr: 0.025000 +2023-04-06 04:10:18,738 epoch 104 - iter 1325/2650 - loss 0.01719044 - time (sec): 97.71 - samples/sec: 7499.43 - lr: 0.025000 +2023-04-06 04:10:38,381 epoch 104 - iter 1590/2650 - loss 0.01725429 - time (sec): 117.35 - samples/sec: 7503.62 - lr: 0.025000 +2023-04-06 04:10:57,497 epoch 104 - iter 1855/2650 - loss 0.01709761 - time (sec): 136.46 - samples/sec: 7514.84 - lr: 0.025000 +2023-04-06 04:11:17,167 epoch 104 - iter 2120/2650 - loss 0.01711381 - time (sec): 156.13 - samples/sec: 7506.61 - lr: 0.025000 +2023-04-06 04:11:36,525 epoch 104 - iter 2385/2650 - loss 0.01709983 - time (sec): 175.49 - samples/sec: 7509.00 - lr: 0.025000 +2023-04-06 04:11:55,654 epoch 104 - iter 2650/2650 - loss 0.01710809 - time (sec): 194.62 - samples/sec: 7513.89 - lr: 0.025000 +2023-04-06 04:11:55,655 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:11:55,655 EPOCH 104 done: loss 0.0171 - lr 0.025000 +2023-04-06 04:11:55,655 BAD EPOCHS (no improvement): 0 +2023-04-06 04:11:55,658 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:12:15,128 epoch 105 - iter 265/2650 - loss 0.01631357 - time (sec): 19.47 - samples/sec: 7510.77 - lr: 0.025000 +2023-04-06 04:12:34,317 epoch 105 - iter 530/2650 - loss 0.01673442 - time (sec): 38.66 - samples/sec: 7510.69 - lr: 0.025000 +2023-04-06 04:12:53,939 epoch 105 - iter 795/2650 - loss 0.01688012 - time (sec): 58.28 - samples/sec: 7466.04 - lr: 0.025000 +2023-04-06 04:13:12,920 epoch 105 - iter 1060/2650 - loss 0.01650347 - time (sec): 77.26 - samples/sec: 7503.40 - lr: 0.025000 +2023-04-06 04:13:32,641 epoch 105 - iter 1325/2650 - loss 0.01656678 - time (sec): 96.98 - samples/sec: 7488.10 - lr: 0.025000 +2023-04-06 04:13:52,608 epoch 105 - iter 1590/2650 - loss 0.01675649 - time (sec): 116.95 - samples/sec: 7480.16 - lr: 0.025000 +2023-04-06 04:14:11,887 epoch 105 - iter 1855/2650 - loss 0.01683192 - time (sec): 136.23 - samples/sec: 7501.78 - lr: 0.025000 +2023-04-06 04:14:40,662 epoch 105 - iter 2120/2650 - loss 0.01692088 - time (sec): 165.00 - samples/sec: 7079.35 - lr: 0.025000 +2023-04-06 04:15:00,227 epoch 105 - iter 2385/2650 - loss 0.01687815 - time (sec): 184.57 - samples/sec: 7126.79 - lr: 0.025000 +2023-04-06 04:15:19,973 epoch 105 - iter 2650/2650 - loss 0.01692683 - time (sec): 204.32 - samples/sec: 7157.39 - lr: 0.025000 +2023-04-06 04:15:19,974 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:15:19,974 EPOCH 105 done: loss 0.0169 - lr 0.025000 +2023-04-06 04:15:19,974 BAD EPOCHS (no improvement): 0 +2023-04-06 04:15:19,977 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:15:39,817 epoch 106 - iter 265/2650 - loss 0.01673648 - time (sec): 19.84 - samples/sec: 7458.28 - lr: 0.025000 +2023-04-06 04:15:59,784 epoch 106 - iter 530/2650 - loss 0.01715912 - time (sec): 39.81 - samples/sec: 7442.78 - lr: 0.025000 +2023-04-06 04:16:20,040 epoch 106 - iter 795/2650 - loss 0.01675035 - time (sec): 60.06 - samples/sec: 7396.12 - lr: 0.025000 +2023-04-06 04:16:38,975 epoch 106 - iter 1060/2650 - loss 0.01695581 - time (sec): 79.00 - samples/sec: 7453.50 - lr: 0.025000 +2023-04-06 04:16:58,872 epoch 106 - iter 1325/2650 - loss 0.01665794 - time (sec): 98.89 - samples/sec: 7430.63 - lr: 0.025000 +2023-04-06 04:17:18,918 epoch 106 - iter 1590/2650 - loss 0.01669753 - time (sec): 118.94 - samples/sec: 7414.86 - lr: 0.025000 +2023-04-06 04:17:38,280 epoch 106 - iter 1855/2650 - loss 0.01666533 - time (sec): 138.30 - samples/sec: 7436.68 - lr: 0.025000 +2023-04-06 04:17:56,821 epoch 106 - iter 2120/2650 - loss 0.01664147 - time (sec): 156.84 - samples/sec: 7471.10 - lr: 0.025000 +2023-04-06 04:18:16,098 epoch 106 - iter 2385/2650 - loss 0.01665772 - time (sec): 176.12 - samples/sec: 7479.77 - lr: 0.025000 +2023-04-06 04:18:35,545 epoch 106 - iter 2650/2650 - loss 0.01672930 - time (sec): 195.57 - samples/sec: 7477.51 - lr: 0.025000 +2023-04-06 04:18:35,546 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:18:35,546 EPOCH 106 done: loss 0.0167 - lr 0.025000 +2023-04-06 04:18:35,546 BAD EPOCHS (no improvement): 0 +2023-04-06 04:18:35,549 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:18:55,116 epoch 107 - iter 265/2650 - loss 0.01700508 - time (sec): 19.57 - samples/sec: 7511.28 - lr: 0.025000 +2023-04-06 04:19:14,129 epoch 107 - iter 530/2650 - loss 0.01666121 - time (sec): 38.58 - samples/sec: 7604.94 - lr: 0.025000 +2023-04-06 04:19:33,583 epoch 107 - iter 795/2650 - loss 0.01687065 - time (sec): 58.03 - samples/sec: 7542.21 - lr: 0.025000 +2023-04-06 04:19:53,108 epoch 107 - iter 1060/2650 - loss 0.01674413 - time (sec): 77.56 - samples/sec: 7525.50 - lr: 0.025000 +2023-04-06 04:20:13,013 epoch 107 - iter 1325/2650 - loss 0.01678768 - time (sec): 97.46 - samples/sec: 7495.03 - lr: 0.025000 +2023-04-06 04:20:32,140 epoch 107 - iter 1590/2650 - loss 0.01692871 - time (sec): 116.59 - samples/sec: 7534.34 - lr: 0.025000 +2023-04-06 04:20:51,488 epoch 107 - iter 1855/2650 - loss 0.01694868 - time (sec): 135.94 - samples/sec: 7528.95 - lr: 0.025000 +2023-04-06 04:21:11,046 epoch 107 - iter 2120/2650 - loss 0.01675980 - time (sec): 155.50 - samples/sec: 7527.58 - lr: 0.025000 +2023-04-06 04:21:30,648 epoch 107 - iter 2385/2650 - loss 0.01670803 - time (sec): 175.10 - samples/sec: 7515.14 - lr: 0.025000 +2023-04-06 04:21:50,596 epoch 107 - iter 2650/2650 - loss 0.01666834 - time (sec): 195.05 - samples/sec: 7497.46 - lr: 0.025000 +2023-04-06 04:21:50,597 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:21:50,597 EPOCH 107 done: loss 0.0167 - lr 0.025000 +2023-04-06 04:21:50,597 BAD EPOCHS (no improvement): 0 +2023-04-06 04:21:50,600 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:22:09,566 epoch 108 - iter 265/2650 - loss 0.01716220 - time (sec): 18.97 - samples/sec: 7621.41 - lr: 0.025000 +2023-04-06 04:22:28,648 epoch 108 - iter 530/2650 - loss 0.01683258 - time (sec): 38.05 - samples/sec: 7587.19 - lr: 0.025000 +2023-04-06 04:22:48,430 epoch 108 - iter 795/2650 - loss 0.01684678 - time (sec): 57.83 - samples/sec: 7504.31 - lr: 0.025000 +2023-04-06 04:23:08,549 epoch 108 - iter 1060/2650 - loss 0.01679694 - time (sec): 77.95 - samples/sec: 7459.97 - lr: 0.025000 +2023-04-06 04:23:27,790 epoch 108 - iter 1325/2650 - loss 0.01653009 - time (sec): 97.19 - samples/sec: 7483.36 - lr: 0.025000 +2023-04-06 04:23:47,274 epoch 108 - iter 1590/2650 - loss 0.01634798 - time (sec): 116.67 - samples/sec: 7494.83 - lr: 0.025000 +2023-04-06 04:24:07,013 epoch 108 - iter 1855/2650 - loss 0.01655042 - time (sec): 136.41 - samples/sec: 7487.22 - lr: 0.025000 +2023-04-06 04:24:26,489 epoch 108 - iter 2120/2650 - loss 0.01659093 - time (sec): 155.89 - samples/sec: 7487.43 - lr: 0.025000 +2023-04-06 04:24:46,638 epoch 108 - iter 2385/2650 - loss 0.01656739 - time (sec): 176.04 - samples/sec: 7473.98 - lr: 0.025000 +2023-04-06 04:25:05,799 epoch 108 - iter 2650/2650 - loss 0.01656419 - time (sec): 195.20 - samples/sec: 7491.64 - lr: 0.025000 +2023-04-06 04:25:05,799 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:25:05,799 EPOCH 108 done: loss 0.0166 - lr 0.025000 +2023-04-06 04:25:05,799 BAD EPOCHS (no improvement): 0 +2023-04-06 04:25:05,802 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:25:25,059 epoch 109 - iter 265/2650 - loss 0.01699372 - time (sec): 19.26 - samples/sec: 7505.63 - lr: 0.025000 +2023-04-06 04:25:44,922 epoch 109 - iter 530/2650 - loss 0.01680227 - time (sec): 39.12 - samples/sec: 7469.97 - lr: 0.025000 +2023-04-06 04:26:04,672 epoch 109 - iter 795/2650 - loss 0.01718436 - time (sec): 58.87 - samples/sec: 7477.72 - lr: 0.025000 +2023-04-06 04:26:23,887 epoch 109 - iter 1060/2650 - loss 0.01706081 - time (sec): 78.08 - samples/sec: 7502.46 - lr: 0.025000 +2023-04-06 04:26:43,007 epoch 109 - iter 1325/2650 - loss 0.01710698 - time (sec): 97.21 - samples/sec: 7517.76 - lr: 0.025000 +2023-04-06 04:27:02,407 epoch 109 - iter 1590/2650 - loss 0.01703925 - time (sec): 116.60 - samples/sec: 7518.70 - lr: 0.025000 +2023-04-06 04:27:21,907 epoch 109 - iter 1855/2650 - loss 0.01701318 - time (sec): 136.10 - samples/sec: 7510.53 - lr: 0.025000 +2023-04-06 04:27:41,434 epoch 109 - iter 2120/2650 - loss 0.01684682 - time (sec): 155.63 - samples/sec: 7514.95 - lr: 0.025000 +2023-04-06 04:28:01,438 epoch 109 - iter 2385/2650 - loss 0.01683687 - time (sec): 175.64 - samples/sec: 7495.55 - lr: 0.025000 +2023-04-06 04:28:21,167 epoch 109 - iter 2650/2650 - loss 0.01681963 - time (sec): 195.36 - samples/sec: 7485.30 - lr: 0.025000 +2023-04-06 04:28:21,167 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:28:21,167 EPOCH 109 done: loss 0.0168 - lr 0.025000 +2023-04-06 04:28:21,167 BAD EPOCHS (no improvement): 1 +2023-04-06 04:28:21,170 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:28:40,916 epoch 110 - iter 265/2650 - loss 0.01628376 - time (sec): 19.75 - samples/sec: 7409.00 - lr: 0.025000 +2023-04-06 04:29:00,112 epoch 110 - iter 530/2650 - loss 0.01609302 - time (sec): 38.94 - samples/sec: 7485.10 - lr: 0.025000 +2023-04-06 04:29:19,558 epoch 110 - iter 795/2650 - loss 0.01640575 - time (sec): 58.39 - samples/sec: 7501.30 - lr: 0.025000 +2023-04-06 04:29:38,710 epoch 110 - iter 1060/2650 - loss 0.01642829 - time (sec): 77.54 - samples/sec: 7517.67 - lr: 0.025000 +2023-04-06 04:29:58,303 epoch 110 - iter 1325/2650 - loss 0.01654595 - time (sec): 97.13 - samples/sec: 7496.37 - lr: 0.025000 +2023-04-06 04:30:17,415 epoch 110 - iter 1590/2650 - loss 0.01668240 - time (sec): 116.24 - samples/sec: 7522.48 - lr: 0.025000 +2023-04-06 04:30:36,820 epoch 110 - iter 1855/2650 - loss 0.01666119 - time (sec): 135.65 - samples/sec: 7524.03 - lr: 0.025000 +2023-04-06 04:30:57,228 epoch 110 - iter 2120/2650 - loss 0.01670959 - time (sec): 156.06 - samples/sec: 7491.56 - lr: 0.025000 +2023-04-06 04:31:16,814 epoch 110 - iter 2385/2650 - loss 0.01654634 - time (sec): 175.64 - samples/sec: 7496.33 - lr: 0.025000 +2023-04-06 04:31:36,498 epoch 110 - iter 2650/2650 - loss 0.01649117 - time (sec): 195.33 - samples/sec: 7486.71 - lr: 0.025000 +2023-04-06 04:31:36,498 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:31:36,498 EPOCH 110 done: loss 0.0165 - lr 0.025000 +2023-04-06 04:31:36,498 BAD EPOCHS (no improvement): 0 +2023-04-06 04:31:36,502 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:31:55,822 epoch 111 - iter 265/2650 - loss 0.01547960 - time (sec): 19.32 - samples/sec: 7653.66 - lr: 0.025000 +2023-04-06 04:32:15,205 epoch 111 - iter 530/2650 - loss 0.01568430 - time (sec): 38.70 - samples/sec: 7565.61 - lr: 0.025000 +2023-04-06 04:32:34,897 epoch 111 - iter 795/2650 - loss 0.01607482 - time (sec): 58.39 - samples/sec: 7503.04 - lr: 0.025000 +2023-04-06 04:32:54,654 epoch 111 - iter 1060/2650 - loss 0.01612207 - time (sec): 78.15 - samples/sec: 7464.00 - lr: 0.025000 +2023-04-06 04:33:13,848 epoch 111 - iter 1325/2650 - loss 0.01611149 - time (sec): 97.35 - samples/sec: 7491.33 - lr: 0.025000 +2023-04-06 04:33:33,709 epoch 111 - iter 1590/2650 - loss 0.01641411 - time (sec): 117.21 - samples/sec: 7475.68 - lr: 0.025000 +2023-04-06 04:33:53,695 epoch 111 - iter 1855/2650 - loss 0.01632107 - time (sec): 137.19 - samples/sec: 7469.89 - lr: 0.025000 +2023-04-06 04:34:13,108 epoch 111 - iter 2120/2650 - loss 0.01642444 - time (sec): 156.61 - samples/sec: 7478.19 - lr: 0.025000 +2023-04-06 04:34:32,231 epoch 111 - iter 2385/2650 - loss 0.01634078 - time (sec): 175.73 - samples/sec: 7482.79 - lr: 0.025000 +2023-04-06 04:34:52,337 epoch 111 - iter 2650/2650 - loss 0.01639498 - time (sec): 195.84 - samples/sec: 7467.30 - lr: 0.025000 +2023-04-06 04:34:52,338 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:34:52,338 EPOCH 111 done: loss 0.0164 - lr 0.025000 +2023-04-06 04:34:52,338 BAD EPOCHS (no improvement): 0 +2023-04-06 04:34:52,340 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:35:11,809 epoch 112 - iter 265/2650 - loss 0.01689996 - time (sec): 19.47 - samples/sec: 7473.54 - lr: 0.025000 +2023-04-06 04:35:31,695 epoch 112 - iter 530/2650 - loss 0.01663563 - time (sec): 39.35 - samples/sec: 7414.24 - lr: 0.025000 +2023-04-06 04:35:51,241 epoch 112 - iter 795/2650 - loss 0.01646828 - time (sec): 58.90 - samples/sec: 7444.65 - lr: 0.025000 +2023-04-06 04:36:10,563 epoch 112 - iter 1060/2650 - loss 0.01630354 - time (sec): 78.22 - samples/sec: 7486.80 - lr: 0.025000 +2023-04-06 04:36:30,165 epoch 112 - iter 1325/2650 - loss 0.01636160 - time (sec): 97.82 - samples/sec: 7493.21 - lr: 0.025000 +2023-04-06 04:36:49,512 epoch 112 - iter 1590/2650 - loss 0.01635887 - time (sec): 117.17 - samples/sec: 7500.02 - lr: 0.025000 +2023-04-06 04:37:08,296 epoch 112 - iter 1855/2650 - loss 0.01639079 - time (sec): 135.96 - samples/sec: 7526.10 - lr: 0.025000 +2023-04-06 04:37:28,064 epoch 112 - iter 2120/2650 - loss 0.01649152 - time (sec): 155.72 - samples/sec: 7511.91 - lr: 0.025000 +2023-04-06 04:37:47,686 epoch 112 - iter 2385/2650 - loss 0.01636407 - time (sec): 175.35 - samples/sec: 7514.33 - lr: 0.025000 +2023-04-06 04:38:07,327 epoch 112 - iter 2650/2650 - loss 0.01643489 - time (sec): 194.99 - samples/sec: 7499.80 - lr: 0.025000 +2023-04-06 04:38:07,328 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:38:07,328 EPOCH 112 done: loss 0.0164 - lr 0.025000 +2023-04-06 04:38:07,328 BAD EPOCHS (no improvement): 1 +2023-04-06 04:38:07,331 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:38:26,839 epoch 113 - iter 265/2650 - loss 0.01588915 - time (sec): 19.51 - samples/sec: 7449.40 - lr: 0.025000 +2023-04-06 04:38:46,314 epoch 113 - iter 530/2650 - loss 0.01567703 - time (sec): 38.98 - samples/sec: 7494.46 - lr: 0.025000 +2023-04-06 04:39:05,624 epoch 113 - iter 795/2650 - loss 0.01571463 - time (sec): 58.29 - samples/sec: 7532.94 - lr: 0.025000 +2023-04-06 04:39:24,892 epoch 113 - iter 1060/2650 - loss 0.01554186 - time (sec): 77.56 - samples/sec: 7554.24 - lr: 0.025000 +2023-04-06 04:39:44,216 epoch 113 - iter 1325/2650 - loss 0.01570454 - time (sec): 96.88 - samples/sec: 7549.37 - lr: 0.025000 +2023-04-06 04:40:04,074 epoch 113 - iter 1590/2650 - loss 0.01562611 - time (sec): 116.74 - samples/sec: 7519.75 - lr: 0.025000 +2023-04-06 04:40:24,155 epoch 113 - iter 1855/2650 - loss 0.01569171 - time (sec): 136.82 - samples/sec: 7481.73 - lr: 0.025000 +2023-04-06 04:40:43,424 epoch 113 - iter 2120/2650 - loss 0.01575266 - time (sec): 156.09 - samples/sec: 7496.72 - lr: 0.025000 +2023-04-06 04:41:02,890 epoch 113 - iter 2385/2650 - loss 0.01588818 - time (sec): 175.56 - samples/sec: 7495.26 - lr: 0.025000 +2023-04-06 04:41:22,410 epoch 113 - iter 2650/2650 - loss 0.01589302 - time (sec): 195.08 - samples/sec: 7496.28 - lr: 0.025000 +2023-04-06 04:41:22,410 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:41:22,410 EPOCH 113 done: loss 0.0159 - lr 0.025000 +2023-04-06 04:41:22,410 BAD EPOCHS (no improvement): 0 +2023-04-06 04:41:22,414 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:41:41,875 epoch 114 - iter 265/2650 - loss 0.01641695 - time (sec): 19.46 - samples/sec: 7484.16 - lr: 0.025000 +2023-04-06 04:42:01,777 epoch 114 - iter 530/2650 - loss 0.01602753 - time (sec): 39.36 - samples/sec: 7417.53 - lr: 0.025000 +2023-04-06 04:42:20,785 epoch 114 - iter 795/2650 - loss 0.01602222 - time (sec): 58.37 - samples/sec: 7500.14 - lr: 0.025000 +2023-04-06 04:42:39,912 epoch 114 - iter 1060/2650 - loss 0.01601872 - time (sec): 77.50 - samples/sec: 7536.27 - lr: 0.025000 +2023-04-06 04:42:59,322 epoch 114 - iter 1325/2650 - loss 0.01606059 - time (sec): 96.91 - samples/sec: 7536.92 - lr: 0.025000 +2023-04-06 04:43:18,274 epoch 114 - iter 1590/2650 - loss 0.01620848 - time (sec): 115.86 - samples/sec: 7556.75 - lr: 0.025000 +2023-04-06 04:43:38,052 epoch 114 - iter 1855/2650 - loss 0.01604542 - time (sec): 135.64 - samples/sec: 7536.29 - lr: 0.025000 +2023-04-06 04:43:58,144 epoch 114 - iter 2120/2650 - loss 0.01623785 - time (sec): 155.73 - samples/sec: 7513.91 - lr: 0.025000 +2023-04-06 04:44:18,005 epoch 114 - iter 2385/2650 - loss 0.01632508 - time (sec): 175.59 - samples/sec: 7502.14 - lr: 0.025000 +2023-04-06 04:44:37,152 epoch 114 - iter 2650/2650 - loss 0.01639981 - time (sec): 194.74 - samples/sec: 7509.39 - lr: 0.025000 +2023-04-06 04:44:37,152 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:44:37,152 EPOCH 114 done: loss 0.0164 - lr 0.025000 +2023-04-06 04:44:37,152 BAD EPOCHS (no improvement): 1 +2023-04-06 04:44:37,156 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:44:57,155 epoch 115 - iter 265/2650 - loss 0.01589350 - time (sec): 20.00 - samples/sec: 7412.51 - lr: 0.025000 +2023-04-06 04:45:16,335 epoch 115 - iter 530/2650 - loss 0.01542737 - time (sec): 39.18 - samples/sec: 7501.90 - lr: 0.025000 +2023-04-06 04:45:36,109 epoch 115 - iter 795/2650 - loss 0.01603309 - time (sec): 58.95 - samples/sec: 7444.78 - lr: 0.025000 +2023-04-06 04:45:56,056 epoch 115 - iter 1060/2650 - loss 0.01606387 - time (sec): 78.90 - samples/sec: 7427.18 - lr: 0.025000 +2023-04-06 04:46:15,235 epoch 115 - iter 1325/2650 - loss 0.01614928 - time (sec): 98.08 - samples/sec: 7459.92 - lr: 0.025000 +2023-04-06 04:46:34,601 epoch 115 - iter 1590/2650 - loss 0.01621075 - time (sec): 117.45 - samples/sec: 7473.39 - lr: 0.025000 +2023-04-06 04:46:54,036 epoch 115 - iter 1855/2650 - loss 0.01621625 - time (sec): 136.88 - samples/sec: 7483.58 - lr: 0.025000 +2023-04-06 04:47:13,430 epoch 115 - iter 2120/2650 - loss 0.01625940 - time (sec): 156.27 - samples/sec: 7487.70 - lr: 0.025000 +2023-04-06 04:47:33,464 epoch 115 - iter 2385/2650 - loss 0.01622751 - time (sec): 176.31 - samples/sec: 7470.01 - lr: 0.025000 +2023-04-06 04:47:52,640 epoch 115 - iter 2650/2650 - loss 0.01630412 - time (sec): 195.48 - samples/sec: 7480.74 - lr: 0.025000 +2023-04-06 04:47:52,640 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:47:52,640 EPOCH 115 done: loss 0.0163 - lr 0.025000 +2023-04-06 04:47:52,640 BAD EPOCHS (no improvement): 2 +2023-04-06 04:47:52,643 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:48:11,932 epoch 116 - iter 265/2650 - loss 0.01536506 - time (sec): 19.29 - samples/sec: 7535.20 - lr: 0.025000 +2023-04-06 04:48:31,269 epoch 116 - iter 530/2650 - loss 0.01609121 - time (sec): 38.63 - samples/sec: 7530.97 - lr: 0.025000 +2023-04-06 04:48:50,319 epoch 116 - iter 795/2650 - loss 0.01622454 - time (sec): 57.68 - samples/sec: 7575.80 - lr: 0.025000 +2023-04-06 04:49:10,411 epoch 116 - iter 1060/2650 - loss 0.01612029 - time (sec): 77.77 - samples/sec: 7536.24 - lr: 0.025000 +2023-04-06 04:49:30,066 epoch 116 - iter 1325/2650 - loss 0.01615203 - time (sec): 97.42 - samples/sec: 7528.20 - lr: 0.025000 +2023-04-06 04:49:49,394 epoch 116 - iter 1590/2650 - loss 0.01613982 - time (sec): 116.75 - samples/sec: 7524.63 - lr: 0.025000 +2023-04-06 04:50:09,161 epoch 116 - iter 1855/2650 - loss 0.01635254 - time (sec): 136.52 - samples/sec: 7502.44 - lr: 0.025000 +2023-04-06 04:50:29,033 epoch 116 - iter 2120/2650 - loss 0.01640006 - time (sec): 156.39 - samples/sec: 7491.37 - lr: 0.025000 +2023-04-06 04:50:48,337 epoch 116 - iter 2385/2650 - loss 0.01637971 - time (sec): 175.69 - samples/sec: 7502.04 - lr: 0.025000 +2023-04-06 04:51:07,827 epoch 116 - iter 2650/2650 - loss 0.01640377 - time (sec): 195.18 - samples/sec: 7492.25 - lr: 0.025000 +2023-04-06 04:51:07,827 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:51:07,827 EPOCH 116 done: loss 0.0164 - lr 0.025000 +2023-04-06 04:51:07,827 BAD EPOCHS (no improvement): 3 +2023-04-06 04:51:07,830 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:51:27,010 epoch 117 - iter 265/2650 - loss 0.01633434 - time (sec): 19.18 - samples/sec: 7570.02 - lr: 0.025000 +2023-04-06 04:51:46,495 epoch 117 - iter 530/2650 - loss 0.01653491 - time (sec): 38.67 - samples/sec: 7545.14 - lr: 0.025000 +2023-04-06 04:52:06,320 epoch 117 - iter 795/2650 - loss 0.01642501 - time (sec): 58.49 - samples/sec: 7496.55 - lr: 0.025000 +2023-04-06 04:52:26,413 epoch 117 - iter 1060/2650 - loss 0.01635945 - time (sec): 78.58 - samples/sec: 7469.19 - lr: 0.025000 +2023-04-06 04:52:45,899 epoch 117 - iter 1325/2650 - loss 0.01626213 - time (sec): 98.07 - samples/sec: 7470.09 - lr: 0.025000 +2023-04-06 04:53:05,123 epoch 117 - iter 1590/2650 - loss 0.01606817 - time (sec): 117.29 - samples/sec: 7488.13 - lr: 0.025000 +2023-04-06 04:53:24,306 epoch 117 - iter 1855/2650 - loss 0.01599580 - time (sec): 136.48 - samples/sec: 7512.75 - lr: 0.025000 +2023-04-06 04:53:43,664 epoch 117 - iter 2120/2650 - loss 0.01603104 - time (sec): 155.83 - samples/sec: 7505.18 - lr: 0.025000 +2023-04-06 04:54:03,572 epoch 117 - iter 2385/2650 - loss 0.01609921 - time (sec): 175.74 - samples/sec: 7489.18 - lr: 0.025000 +2023-04-06 04:54:23,263 epoch 117 - iter 2650/2650 - loss 0.01608671 - time (sec): 195.43 - samples/sec: 7482.66 - lr: 0.025000 +2023-04-06 04:54:23,264 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:54:23,264 EPOCH 117 done: loss 0.0161 - lr 0.025000 +2023-04-06 04:54:23,264 Epoch 117: reducing learning rate of group 0 to 1.2500e-02. +2023-04-06 04:54:23,264 BAD EPOCHS (no improvement): 4 +2023-04-06 04:54:23,267 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:54:43,207 epoch 118 - iter 265/2650 - loss 0.01572736 - time (sec): 19.94 - samples/sec: 7397.38 - lr: 0.012500 +2023-04-06 04:55:03,167 epoch 118 - iter 530/2650 - loss 0.01576683 - time (sec): 39.90 - samples/sec: 7359.14 - lr: 0.012500 +2023-04-06 04:55:22,565 epoch 118 - iter 795/2650 - loss 0.01577112 - time (sec): 59.30 - samples/sec: 7418.71 - lr: 0.012500 +2023-04-06 04:55:42,039 epoch 118 - iter 1060/2650 - loss 0.01594208 - time (sec): 78.77 - samples/sec: 7441.57 - lr: 0.012500 +2023-04-06 04:56:01,557 epoch 118 - iter 1325/2650 - loss 0.01577340 - time (sec): 98.29 - samples/sec: 7448.52 - lr: 0.012500 +2023-04-06 04:56:21,217 epoch 118 - iter 1590/2650 - loss 0.01589593 - time (sec): 117.95 - samples/sec: 7454.72 - lr: 0.012500 +2023-04-06 04:56:40,511 epoch 118 - iter 1855/2650 - loss 0.01566565 - time (sec): 137.24 - samples/sec: 7461.78 - lr: 0.012500 +2023-04-06 04:56:59,741 epoch 118 - iter 2120/2650 - loss 0.01577624 - time (sec): 156.47 - samples/sec: 7477.95 - lr: 0.012500 +2023-04-06 04:57:19,407 epoch 118 - iter 2385/2650 - loss 0.01564434 - time (sec): 176.14 - samples/sec: 7478.04 - lr: 0.012500 +2023-04-06 04:57:38,335 epoch 118 - iter 2650/2650 - loss 0.01564190 - time (sec): 195.07 - samples/sec: 7496.68 - lr: 0.012500 +2023-04-06 04:57:38,335 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:57:38,335 EPOCH 118 done: loss 0.0156 - lr 0.012500 +2023-04-06 04:57:38,335 BAD EPOCHS (no improvement): 0 +2023-04-06 04:57:38,338 ---------------------------------------------------------------------------------------------------- +2023-04-06 04:57:57,840 epoch 119 - iter 265/2650 - loss 0.01544832 - time (sec): 19.50 - samples/sec: 7484.69 - lr: 0.012500 +2023-04-06 04:58:17,000 epoch 119 - iter 530/2650 - loss 0.01587479 - time (sec): 38.66 - samples/sec: 7518.91 - lr: 0.012500 +2023-04-06 04:58:36,746 epoch 119 - iter 795/2650 - loss 0.01555283 - time (sec): 58.41 - samples/sec: 7491.82 - lr: 0.012500 +2023-04-06 04:58:56,828 epoch 119 - iter 1060/2650 - loss 0.01553353 - time (sec): 78.49 - samples/sec: 7462.88 - lr: 0.012500 +2023-04-06 04:59:16,461 epoch 119 - iter 1325/2650 - loss 0.01547635 - time (sec): 98.12 - samples/sec: 7461.17 - lr: 0.012500 +2023-04-06 04:59:36,238 epoch 119 - iter 1590/2650 - loss 0.01561315 - time (sec): 117.90 - samples/sec: 7446.70 - lr: 0.012500 +2023-04-06 04:59:55,961 epoch 119 - iter 1855/2650 - loss 0.01553643 - time (sec): 137.62 - samples/sec: 7448.51 - lr: 0.012500 +2023-04-06 05:00:15,689 epoch 119 - iter 2120/2650 - loss 0.01549607 - time (sec): 157.35 - samples/sec: 7441.51 - lr: 0.012500 +2023-04-06 05:00:35,122 epoch 119 - iter 2385/2650 - loss 0.01548650 - time (sec): 176.78 - samples/sec: 7449.04 - lr: 0.012500 +2023-04-06 05:00:54,424 epoch 119 - iter 2650/2650 - loss 0.01550406 - time (sec): 196.09 - samples/sec: 7457.77 - lr: 0.012500 +2023-04-06 05:00:54,424 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:00:54,424 EPOCH 119 done: loss 0.0155 - lr 0.012500 +2023-04-06 05:00:54,425 BAD EPOCHS (no improvement): 0 +2023-04-06 05:00:54,427 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:01:13,848 epoch 120 - iter 265/2650 - loss 0.01597121 - time (sec): 19.42 - samples/sec: 7571.36 - lr: 0.012500 +2023-04-06 05:01:32,913 epoch 120 - iter 530/2650 - loss 0.01562538 - time (sec): 38.49 - samples/sec: 7560.34 - lr: 0.012500 +2023-04-06 05:01:52,116 epoch 120 - iter 795/2650 - loss 0.01504738 - time (sec): 57.69 - samples/sec: 7577.00 - lr: 0.012500 +2023-04-06 05:02:11,577 epoch 120 - iter 1060/2650 - loss 0.01522187 - time (sec): 77.15 - samples/sec: 7560.62 - lr: 0.012500 +2023-04-06 05:02:31,395 epoch 120 - iter 1325/2650 - loss 0.01543737 - time (sec): 96.97 - samples/sec: 7536.76 - lr: 0.012500 +2023-04-06 05:02:50,522 epoch 120 - iter 1590/2650 - loss 0.01524426 - time (sec): 116.10 - samples/sec: 7558.10 - lr: 0.012500 +2023-04-06 05:03:09,981 epoch 120 - iter 1855/2650 - loss 0.01537529 - time (sec): 135.55 - samples/sec: 7544.10 - lr: 0.012500 +2023-04-06 05:03:29,407 epoch 120 - iter 2120/2650 - loss 0.01547088 - time (sec): 154.98 - samples/sec: 7546.16 - lr: 0.012500 +2023-04-06 05:03:49,386 epoch 120 - iter 2385/2650 - loss 0.01553172 - time (sec): 174.96 - samples/sec: 7521.27 - lr: 0.012500 +2023-04-06 05:04:09,003 epoch 120 - iter 2650/2650 - loss 0.01543942 - time (sec): 194.58 - samples/sec: 7515.65 - lr: 0.012500 +2023-04-06 05:04:09,003 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:04:09,003 EPOCH 120 done: loss 0.0154 - lr 0.012500 +2023-04-06 05:04:09,004 BAD EPOCHS (no improvement): 0 +2023-04-06 05:04:09,009 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:04:28,765 epoch 121 - iter 265/2650 - loss 0.01497412 - time (sec): 19.76 - samples/sec: 7400.69 - lr: 0.012500 +2023-04-06 05:04:48,575 epoch 121 - iter 530/2650 - loss 0.01491218 - time (sec): 39.57 - samples/sec: 7371.06 - lr: 0.012500 +2023-04-06 05:05:07,424 epoch 121 - iter 795/2650 - loss 0.01539899 - time (sec): 58.42 - samples/sec: 7452.82 - lr: 0.012500 +2023-04-06 05:05:36,724 epoch 121 - iter 1060/2650 - loss 0.01533294 - time (sec): 87.72 - samples/sec: 6641.88 - lr: 0.012500 +2023-04-06 05:05:56,474 epoch 121 - iter 1325/2650 - loss 0.01573708 - time (sec): 107.47 - samples/sec: 6797.94 - lr: 0.012500 +2023-04-06 05:06:16,239 epoch 121 - iter 1590/2650 - loss 0.01573506 - time (sec): 127.23 - samples/sec: 6893.72 - lr: 0.012500 +2023-04-06 05:06:36,098 epoch 121 - iter 1855/2650 - loss 0.01554577 - time (sec): 147.09 - samples/sec: 6973.30 - lr: 0.012500 +2023-04-06 05:06:55,557 epoch 121 - iter 2120/2650 - loss 0.01547218 - time (sec): 166.55 - samples/sec: 7036.89 - lr: 0.012500 +2023-04-06 05:07:14,558 epoch 121 - iter 2385/2650 - loss 0.01542829 - time (sec): 185.55 - samples/sec: 7105.84 - lr: 0.012500 +2023-04-06 05:07:33,788 epoch 121 - iter 2650/2650 - loss 0.01539740 - time (sec): 204.78 - samples/sec: 7141.16 - lr: 0.012500 +2023-04-06 05:07:33,789 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:07:33,789 EPOCH 121 done: loss 0.0154 - lr 0.012500 +2023-04-06 05:07:33,789 BAD EPOCHS (no improvement): 0 +2023-04-06 05:07:33,792 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:07:52,848 epoch 122 - iter 265/2650 - loss 0.01522095 - time (sec): 19.06 - samples/sec: 7632.38 - lr: 0.012500 +2023-04-06 05:08:11,998 epoch 122 - iter 530/2650 - loss 0.01540688 - time (sec): 38.21 - samples/sec: 7635.93 - lr: 0.012500 +2023-04-06 05:08:32,034 epoch 122 - iter 795/2650 - loss 0.01539960 - time (sec): 58.24 - samples/sec: 7539.04 - lr: 0.012500 +2023-04-06 05:08:51,610 epoch 122 - iter 1060/2650 - loss 0.01555039 - time (sec): 77.82 - samples/sec: 7521.02 - lr: 0.012500 +2023-04-06 05:09:11,443 epoch 122 - iter 1325/2650 - loss 0.01545018 - time (sec): 97.65 - samples/sec: 7494.06 - lr: 0.012500 +2023-04-06 05:09:31,793 epoch 122 - iter 1590/2650 - loss 0.01533201 - time (sec): 118.00 - samples/sec: 7446.09 - lr: 0.012500 +2023-04-06 05:09:51,521 epoch 122 - iter 1855/2650 - loss 0.01518317 - time (sec): 137.73 - samples/sec: 7441.34 - lr: 0.012500 +2023-04-06 05:10:11,666 epoch 122 - iter 2120/2650 - loss 0.01505003 - time (sec): 157.87 - samples/sec: 7425.26 - lr: 0.012500 +2023-04-06 05:10:30,686 epoch 122 - iter 2385/2650 - loss 0.01508182 - time (sec): 176.89 - samples/sec: 7443.41 - lr: 0.012500 +2023-04-06 05:10:50,143 epoch 122 - iter 2650/2650 - loss 0.01498612 - time (sec): 196.35 - samples/sec: 7447.69 - lr: 0.012500 +2023-04-06 05:10:50,144 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:10:50,144 EPOCH 122 done: loss 0.0150 - lr 0.012500 +2023-04-06 05:10:50,144 BAD EPOCHS (no improvement): 0 +2023-04-06 05:10:50,146 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:11:10,063 epoch 123 - iter 265/2650 - loss 0.01470506 - time (sec): 19.92 - samples/sec: 7423.66 - lr: 0.012500 +2023-04-06 05:11:29,486 epoch 123 - iter 530/2650 - loss 0.01487188 - time (sec): 39.34 - samples/sec: 7451.92 - lr: 0.012500 +2023-04-06 05:11:49,222 epoch 123 - iter 795/2650 - loss 0.01489015 - time (sec): 59.08 - samples/sec: 7435.45 - lr: 0.012500 +2023-04-06 05:12:08,947 epoch 123 - iter 1060/2650 - loss 0.01474841 - time (sec): 78.80 - samples/sec: 7418.42 - lr: 0.012500 +2023-04-06 05:12:28,255 epoch 123 - iter 1325/2650 - loss 0.01467092 - time (sec): 98.11 - samples/sec: 7435.07 - lr: 0.012500 +2023-04-06 05:12:48,166 epoch 123 - iter 1590/2650 - loss 0.01481652 - time (sec): 118.02 - samples/sec: 7422.88 - lr: 0.012500 +2023-04-06 05:13:07,432 epoch 123 - iter 1855/2650 - loss 0.01484548 - time (sec): 137.29 - samples/sec: 7438.84 - lr: 0.012500 +2023-04-06 05:13:27,212 epoch 123 - iter 2120/2650 - loss 0.01496353 - time (sec): 157.07 - samples/sec: 7429.72 - lr: 0.012500 +2023-04-06 05:13:47,247 epoch 123 - iter 2385/2650 - loss 0.01503001 - time (sec): 177.10 - samples/sec: 7424.86 - lr: 0.012500 +2023-04-06 05:14:06,852 epoch 123 - iter 2650/2650 - loss 0.01504476 - time (sec): 196.71 - samples/sec: 7434.29 - lr: 0.012500 +2023-04-06 05:14:06,852 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:14:06,852 EPOCH 123 done: loss 0.0150 - lr 0.012500 +2023-04-06 05:14:06,852 BAD EPOCHS (no improvement): 1 +2023-04-06 05:14:06,855 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:14:25,863 epoch 124 - iter 265/2650 - loss 0.01539088 - time (sec): 19.01 - samples/sec: 7579.83 - lr: 0.012500 +2023-04-06 05:14:45,041 epoch 124 - iter 530/2650 - loss 0.01506490 - time (sec): 38.19 - samples/sec: 7640.23 - lr: 0.012500 +2023-04-06 05:15:04,858 epoch 124 - iter 795/2650 - loss 0.01504928 - time (sec): 58.00 - samples/sec: 7542.27 - lr: 0.012500 +2023-04-06 05:15:24,342 epoch 124 - iter 1060/2650 - loss 0.01497258 - time (sec): 77.49 - samples/sec: 7516.65 - lr: 0.012500 +2023-04-06 05:15:44,537 epoch 124 - iter 1325/2650 - loss 0.01504758 - time (sec): 97.68 - samples/sec: 7466.76 - lr: 0.012500 +2023-04-06 05:16:04,348 epoch 124 - iter 1590/2650 - loss 0.01524514 - time (sec): 117.49 - samples/sec: 7464.53 - lr: 0.012500 +2023-04-06 05:16:23,723 epoch 124 - iter 1855/2650 - loss 0.01527755 - time (sec): 136.87 - samples/sec: 7475.24 - lr: 0.012500 +2023-04-06 05:16:43,793 epoch 124 - iter 2120/2650 - loss 0.01520258 - time (sec): 156.94 - samples/sec: 7460.86 - lr: 0.012500 +2023-04-06 05:17:03,585 epoch 124 - iter 2385/2650 - loss 0.01519706 - time (sec): 176.73 - samples/sec: 7454.04 - lr: 0.012500 +2023-04-06 05:17:22,742 epoch 124 - iter 2650/2650 - loss 0.01513811 - time (sec): 195.89 - samples/sec: 7465.32 - lr: 0.012500 +2023-04-06 05:17:22,743 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:17:22,743 EPOCH 124 done: loss 0.0151 - lr 0.012500 +2023-04-06 05:17:22,743 BAD EPOCHS (no improvement): 2 +2023-04-06 05:17:22,747 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:17:42,155 epoch 125 - iter 265/2650 - loss 0.01519875 - time (sec): 19.41 - samples/sec: 7424.43 - lr: 0.012500 +2023-04-06 05:18:02,164 epoch 125 - iter 530/2650 - loss 0.01453886 - time (sec): 39.42 - samples/sec: 7404.47 - lr: 0.012500 +2023-04-06 05:18:22,162 epoch 125 - iter 795/2650 - loss 0.01475092 - time (sec): 59.42 - samples/sec: 7344.99 - lr: 0.012500 +2023-04-06 05:18:41,660 epoch 125 - iter 1060/2650 - loss 0.01459919 - time (sec): 78.91 - samples/sec: 7392.98 - lr: 0.012500 +2023-04-06 05:19:00,702 epoch 125 - iter 1325/2650 - loss 0.01459180 - time (sec): 97.95 - samples/sec: 7442.23 - lr: 0.012500 +2023-04-06 05:19:20,153 epoch 125 - iter 1590/2650 - loss 0.01453606 - time (sec): 117.41 - samples/sec: 7447.28 - lr: 0.012500 +2023-04-06 05:19:39,636 epoch 125 - iter 1855/2650 - loss 0.01454958 - time (sec): 136.89 - samples/sec: 7455.66 - lr: 0.012500 +2023-04-06 05:19:59,960 epoch 125 - iter 2120/2650 - loss 0.01468428 - time (sec): 157.21 - samples/sec: 7438.56 - lr: 0.012500 +2023-04-06 05:20:19,720 epoch 125 - iter 2385/2650 - loss 0.01479486 - time (sec): 176.97 - samples/sec: 7437.00 - lr: 0.012500 +2023-04-06 05:20:39,274 epoch 125 - iter 2650/2650 - loss 0.01489035 - time (sec): 196.53 - samples/sec: 7441.03 - lr: 0.012500 +2023-04-06 05:20:39,274 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:20:39,274 EPOCH 125 done: loss 0.0149 - lr 0.012500 +2023-04-06 05:20:39,274 BAD EPOCHS (no improvement): 0 +2023-04-06 05:20:39,277 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:20:58,860 epoch 126 - iter 265/2650 - loss 0.01443809 - time (sec): 19.58 - samples/sec: 7481.96 - lr: 0.012500 +2023-04-06 05:21:18,302 epoch 126 - iter 530/2650 - loss 0.01480784 - time (sec): 39.02 - samples/sec: 7457.83 - lr: 0.012500 +2023-04-06 05:21:37,497 epoch 126 - iter 795/2650 - loss 0.01472748 - time (sec): 58.22 - samples/sec: 7511.14 - lr: 0.012500 +2023-04-06 05:21:57,661 epoch 126 - iter 1060/2650 - loss 0.01466737 - time (sec): 78.38 - samples/sec: 7465.04 - lr: 0.012500 +2023-04-06 05:22:16,688 epoch 126 - iter 1325/2650 - loss 0.01479125 - time (sec): 97.41 - samples/sec: 7510.36 - lr: 0.012500 +2023-04-06 05:22:36,933 epoch 126 - iter 1590/2650 - loss 0.01488758 - time (sec): 117.66 - samples/sec: 7452.42 - lr: 0.012500 +2023-04-06 05:22:56,564 epoch 126 - iter 1855/2650 - loss 0.01478776 - time (sec): 137.29 - samples/sec: 7464.98 - lr: 0.012500 +2023-04-06 05:23:16,327 epoch 126 - iter 2120/2650 - loss 0.01487469 - time (sec): 157.05 - samples/sec: 7458.96 - lr: 0.012500 +2023-04-06 05:23:35,553 epoch 126 - iter 2385/2650 - loss 0.01481078 - time (sec): 176.27 - samples/sec: 7477.71 - lr: 0.012500 +2023-04-06 05:23:54,331 epoch 126 - iter 2650/2650 - loss 0.01490695 - time (sec): 195.05 - samples/sec: 7497.26 - lr: 0.012500 +2023-04-06 05:23:54,331 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:23:54,331 EPOCH 126 done: loss 0.0149 - lr 0.012500 +2023-04-06 05:23:54,331 BAD EPOCHS (no improvement): 1 +2023-04-06 05:23:54,335 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:24:13,560 epoch 127 - iter 265/2650 - loss 0.01494358 - time (sec): 19.22 - samples/sec: 7692.66 - lr: 0.012500 +2023-04-06 05:24:31,934 epoch 127 - iter 530/2650 - loss 0.01438251 - time (sec): 37.60 - samples/sec: 7768.28 - lr: 0.012500 +2023-04-06 05:24:50,828 epoch 127 - iter 795/2650 - loss 0.01453142 - time (sec): 56.49 - samples/sec: 7727.62 - lr: 0.012500 +2023-04-06 05:25:10,570 epoch 127 - iter 1060/2650 - loss 0.01448338 - time (sec): 76.24 - samples/sec: 7646.57 - lr: 0.012500 +2023-04-06 05:25:30,351 epoch 127 - iter 1325/2650 - loss 0.01470342 - time (sec): 96.02 - samples/sec: 7586.13 - lr: 0.012500 +2023-04-06 05:25:49,210 epoch 127 - iter 1590/2650 - loss 0.01467779 - time (sec): 114.88 - samples/sec: 7618.79 - lr: 0.012500 +2023-04-06 05:26:08,853 epoch 127 - iter 1855/2650 - loss 0.01483106 - time (sec): 134.52 - samples/sec: 7600.50 - lr: 0.012500 +2023-04-06 05:26:28,519 epoch 127 - iter 2120/2650 - loss 0.01483370 - time (sec): 154.18 - samples/sec: 7586.21 - lr: 0.012500 +2023-04-06 05:26:47,915 epoch 127 - iter 2385/2650 - loss 0.01489453 - time (sec): 173.58 - samples/sec: 7583.08 - lr: 0.012500 +2023-04-06 05:27:07,077 epoch 127 - iter 2650/2650 - loss 0.01483909 - time (sec): 192.74 - samples/sec: 7587.17 - lr: 0.012500 +2023-04-06 05:27:07,077 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:27:07,077 EPOCH 127 done: loss 0.0148 - lr 0.012500 +2023-04-06 05:27:07,077 BAD EPOCHS (no improvement): 0 +2023-04-06 05:27:07,080 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:27:26,185 epoch 128 - iter 265/2650 - loss 0.01330828 - time (sec): 19.10 - samples/sec: 7637.54 - lr: 0.012500 +2023-04-06 05:27:45,170 epoch 128 - iter 530/2650 - loss 0.01389517 - time (sec): 38.09 - samples/sec: 7672.04 - lr: 0.012500 +2023-04-06 05:28:04,920 epoch 128 - iter 795/2650 - loss 0.01439307 - time (sec): 57.84 - samples/sec: 7602.19 - lr: 0.012500 +2023-04-06 05:28:23,969 epoch 128 - iter 1060/2650 - loss 0.01442468 - time (sec): 76.89 - samples/sec: 7623.01 - lr: 0.012500 +2023-04-06 05:28:43,401 epoch 128 - iter 1325/2650 - loss 0.01435687 - time (sec): 96.32 - samples/sec: 7605.01 - lr: 0.012500 +2023-04-06 05:29:02,493 epoch 128 - iter 1590/2650 - loss 0.01448037 - time (sec): 115.41 - samples/sec: 7606.04 - lr: 0.012500 +2023-04-06 05:29:22,351 epoch 128 - iter 1855/2650 - loss 0.01457775 - time (sec): 135.27 - samples/sec: 7574.22 - lr: 0.012500 +2023-04-06 05:29:41,201 epoch 128 - iter 2120/2650 - loss 0.01458015 - time (sec): 154.12 - samples/sec: 7596.71 - lr: 0.012500 +2023-04-06 05:30:00,668 epoch 128 - iter 2385/2650 - loss 0.01455667 - time (sec): 173.59 - samples/sec: 7582.95 - lr: 0.012500 +2023-04-06 05:30:20,331 epoch 128 - iter 2650/2650 - loss 0.01469323 - time (sec): 193.25 - samples/sec: 7567.17 - lr: 0.012500 +2023-04-06 05:30:20,332 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:30:20,332 EPOCH 128 done: loss 0.0147 - lr 0.012500 +2023-04-06 05:30:20,332 BAD EPOCHS (no improvement): 0 +2023-04-06 05:30:20,334 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:30:39,071 epoch 129 - iter 265/2650 - loss 0.01529547 - time (sec): 18.74 - samples/sec: 7756.95 - lr: 0.012500 +2023-04-06 05:30:58,404 epoch 129 - iter 530/2650 - loss 0.01535124 - time (sec): 38.07 - samples/sec: 7606.11 - lr: 0.012500 +2023-04-06 05:31:18,098 epoch 129 - iter 795/2650 - loss 0.01554276 - time (sec): 57.76 - samples/sec: 7565.15 - lr: 0.012500 +2023-04-06 05:31:37,527 epoch 129 - iter 1060/2650 - loss 0.01559818 - time (sec): 77.19 - samples/sec: 7566.23 - lr: 0.012500 +2023-04-06 05:31:56,752 epoch 129 - iter 1325/2650 - loss 0.01520606 - time (sec): 96.42 - samples/sec: 7571.29 - lr: 0.012500 +2023-04-06 05:32:15,710 epoch 129 - iter 1590/2650 - loss 0.01510911 - time (sec): 115.38 - samples/sec: 7591.14 - lr: 0.012500 +2023-04-06 05:32:35,439 epoch 129 - iter 1855/2650 - loss 0.01509652 - time (sec): 135.10 - samples/sec: 7573.27 - lr: 0.012500 +2023-04-06 05:32:54,959 epoch 129 - iter 2120/2650 - loss 0.01495564 - time (sec): 154.62 - samples/sec: 7563.53 - lr: 0.012500 +2023-04-06 05:33:14,305 epoch 129 - iter 2385/2650 - loss 0.01505397 - time (sec): 173.97 - samples/sec: 7566.63 - lr: 0.012500 +2023-04-06 05:33:33,699 epoch 129 - iter 2650/2650 - loss 0.01503245 - time (sec): 193.36 - samples/sec: 7562.72 - lr: 0.012500 +2023-04-06 05:33:33,699 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:33:33,700 EPOCH 129 done: loss 0.0150 - lr 0.012500 +2023-04-06 05:33:33,700 BAD EPOCHS (no improvement): 1 +2023-04-06 05:33:33,704 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:33:52,916 epoch 130 - iter 265/2650 - loss 0.01440739 - time (sec): 19.21 - samples/sec: 7625.30 - lr: 0.012500 +2023-04-06 05:34:12,542 epoch 130 - iter 530/2650 - loss 0.01467286 - time (sec): 38.84 - samples/sec: 7583.85 - lr: 0.012500 +2023-04-06 05:34:31,842 epoch 130 - iter 795/2650 - loss 0.01481253 - time (sec): 58.14 - samples/sec: 7606.58 - lr: 0.012500 +2023-04-06 05:34:50,991 epoch 130 - iter 1060/2650 - loss 0.01486888 - time (sec): 77.29 - samples/sec: 7587.94 - lr: 0.012500 +2023-04-06 05:35:09,945 epoch 130 - iter 1325/2650 - loss 0.01495354 - time (sec): 96.24 - samples/sec: 7615.37 - lr: 0.012500 +2023-04-06 05:35:29,735 epoch 130 - iter 1590/2650 - loss 0.01486580 - time (sec): 116.03 - samples/sec: 7571.54 - lr: 0.012500 +2023-04-06 05:35:48,574 epoch 130 - iter 1855/2650 - loss 0.01489353 - time (sec): 134.87 - samples/sec: 7592.53 - lr: 0.012500 +2023-04-06 05:36:07,525 epoch 130 - iter 2120/2650 - loss 0.01496772 - time (sec): 153.82 - samples/sec: 7606.63 - lr: 0.012500 +2023-04-06 05:36:26,664 epoch 130 - iter 2385/2650 - loss 0.01511212 - time (sec): 172.96 - samples/sec: 7605.53 - lr: 0.012500 +2023-04-06 05:36:46,245 epoch 130 - iter 2650/2650 - loss 0.01508575 - time (sec): 192.54 - samples/sec: 7595.07 - lr: 0.012500 +2023-04-06 05:36:46,245 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:36:46,245 EPOCH 130 done: loss 0.0151 - lr 0.012500 +2023-04-06 05:36:46,245 BAD EPOCHS (no improvement): 2 +2023-04-06 05:36:46,248 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:37:05,511 epoch 131 - iter 265/2650 - loss 0.01446491 - time (sec): 19.26 - samples/sec: 7560.79 - lr: 0.012500 +2023-04-06 05:37:25,319 epoch 131 - iter 530/2650 - loss 0.01506208 - time (sec): 39.07 - samples/sec: 7537.75 - lr: 0.012500 +2023-04-06 05:37:44,215 epoch 131 - iter 795/2650 - loss 0.01514512 - time (sec): 57.97 - samples/sec: 7591.27 - lr: 0.012500 +2023-04-06 05:38:03,157 epoch 131 - iter 1060/2650 - loss 0.01489944 - time (sec): 76.91 - samples/sec: 7599.56 - lr: 0.012500 +2023-04-06 05:38:22,366 epoch 131 - iter 1325/2650 - loss 0.01488990 - time (sec): 96.12 - samples/sec: 7593.80 - lr: 0.012500 +2023-04-06 05:38:41,400 epoch 131 - iter 1590/2650 - loss 0.01471249 - time (sec): 115.15 - samples/sec: 7597.70 - lr: 0.012500 +2023-04-06 05:39:00,492 epoch 131 - iter 1855/2650 - loss 0.01469313 - time (sec): 134.24 - samples/sec: 7609.12 - lr: 0.012500 +2023-04-06 05:39:20,145 epoch 131 - iter 2120/2650 - loss 0.01469184 - time (sec): 153.90 - samples/sec: 7588.20 - lr: 0.012500 +2023-04-06 05:39:39,345 epoch 131 - iter 2385/2650 - loss 0.01467354 - time (sec): 173.10 - samples/sec: 7594.57 - lr: 0.012500 +2023-04-06 05:39:58,977 epoch 131 - iter 2650/2650 - loss 0.01470156 - time (sec): 192.73 - samples/sec: 7587.70 - lr: 0.012500 +2023-04-06 05:39:58,977 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:39:58,977 EPOCH 131 done: loss 0.0147 - lr 0.012500 +2023-04-06 05:39:58,977 BAD EPOCHS (no improvement): 3 +2023-04-06 05:39:58,981 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:40:18,410 epoch 132 - iter 265/2650 - loss 0.01402472 - time (sec): 19.43 - samples/sec: 7546.64 - lr: 0.012500 +2023-04-06 05:40:37,951 epoch 132 - iter 530/2650 - loss 0.01387620 - time (sec): 38.97 - samples/sec: 7546.59 - lr: 0.012500 +2023-04-06 05:40:57,265 epoch 132 - iter 795/2650 - loss 0.01447668 - time (sec): 58.28 - samples/sec: 7539.39 - lr: 0.012500 +2023-04-06 05:41:16,845 epoch 132 - iter 1060/2650 - loss 0.01441731 - time (sec): 77.86 - samples/sec: 7524.46 - lr: 0.012500 +2023-04-06 05:41:36,534 epoch 132 - iter 1325/2650 - loss 0.01455027 - time (sec): 97.55 - samples/sec: 7518.21 - lr: 0.012500 +2023-04-06 05:41:56,027 epoch 132 - iter 1590/2650 - loss 0.01477634 - time (sec): 117.05 - samples/sec: 7503.18 - lr: 0.012500 +2023-04-06 05:42:15,953 epoch 132 - iter 1855/2650 - loss 0.01460992 - time (sec): 136.97 - samples/sec: 7488.91 - lr: 0.012500 +2023-04-06 05:42:34,943 epoch 132 - iter 2120/2650 - loss 0.01463616 - time (sec): 155.96 - samples/sec: 7520.09 - lr: 0.012500 +2023-04-06 05:42:53,826 epoch 132 - iter 2385/2650 - loss 0.01453154 - time (sec): 174.85 - samples/sec: 7539.21 - lr: 0.012500 +2023-04-06 05:43:12,514 epoch 132 - iter 2650/2650 - loss 0.01462108 - time (sec): 193.53 - samples/sec: 7556.13 - lr: 0.012500 +2023-04-06 05:43:12,514 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:43:12,514 EPOCH 132 done: loss 0.0146 - lr 0.012500 +2023-04-06 05:43:12,514 BAD EPOCHS (no improvement): 0 +2023-04-06 05:43:12,518 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:43:31,289 epoch 133 - iter 265/2650 - loss 0.01458705 - time (sec): 18.77 - samples/sec: 7711.86 - lr: 0.012500 +2023-04-06 05:43:50,662 epoch 133 - iter 530/2650 - loss 0.01442090 - time (sec): 38.14 - samples/sec: 7656.27 - lr: 0.012500 +2023-04-06 05:44:09,901 epoch 133 - iter 795/2650 - loss 0.01468548 - time (sec): 57.38 - samples/sec: 7641.48 - lr: 0.012500 +2023-04-06 05:44:29,827 epoch 133 - iter 1060/2650 - loss 0.01478404 - time (sec): 77.31 - samples/sec: 7580.43 - lr: 0.012500 +2023-04-06 05:44:49,384 epoch 133 - iter 1325/2650 - loss 0.01488169 - time (sec): 96.87 - samples/sec: 7578.17 - lr: 0.012500 +2023-04-06 05:45:09,169 epoch 133 - iter 1590/2650 - loss 0.01482854 - time (sec): 116.65 - samples/sec: 7555.91 - lr: 0.012500 +2023-04-06 05:45:28,197 epoch 133 - iter 1855/2650 - loss 0.01475581 - time (sec): 135.68 - samples/sec: 7571.01 - lr: 0.012500 +2023-04-06 05:45:47,271 epoch 133 - iter 2120/2650 - loss 0.01470370 - time (sec): 154.75 - samples/sec: 7573.67 - lr: 0.012500 +2023-04-06 05:46:06,677 epoch 133 - iter 2385/2650 - loss 0.01462834 - time (sec): 174.16 - samples/sec: 7566.31 - lr: 0.012500 +2023-04-06 05:46:25,642 epoch 133 - iter 2650/2650 - loss 0.01453582 - time (sec): 193.12 - samples/sec: 7572.14 - lr: 0.012500 +2023-04-06 05:46:25,643 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:46:25,643 EPOCH 133 done: loss 0.0145 - lr 0.012500 +2023-04-06 05:46:25,643 BAD EPOCHS (no improvement): 0 +2023-04-06 05:46:25,646 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:46:44,673 epoch 134 - iter 265/2650 - loss 0.01378162 - time (sec): 19.03 - samples/sec: 7633.28 - lr: 0.012500 +2023-04-06 05:47:03,953 epoch 134 - iter 530/2650 - loss 0.01430512 - time (sec): 38.31 - samples/sec: 7609.09 - lr: 0.012500 +2023-04-06 05:47:22,821 epoch 134 - iter 795/2650 - loss 0.01462161 - time (sec): 57.17 - samples/sec: 7646.50 - lr: 0.012500 +2023-04-06 05:47:42,398 epoch 134 - iter 1060/2650 - loss 0.01462484 - time (sec): 76.75 - samples/sec: 7612.45 - lr: 0.012500 +2023-04-06 05:48:01,903 epoch 134 - iter 1325/2650 - loss 0.01463830 - time (sec): 96.26 - samples/sec: 7583.10 - lr: 0.012500 +2023-04-06 05:48:21,970 epoch 134 - iter 1590/2650 - loss 0.01461591 - time (sec): 116.32 - samples/sec: 7553.78 - lr: 0.012500 +2023-04-06 05:48:40,954 epoch 134 - iter 1855/2650 - loss 0.01471125 - time (sec): 135.31 - samples/sec: 7562.39 - lr: 0.012500 +2023-04-06 05:49:00,216 epoch 134 - iter 2120/2650 - loss 0.01470502 - time (sec): 154.57 - samples/sec: 7562.36 - lr: 0.012500 +2023-04-06 05:49:19,917 epoch 134 - iter 2385/2650 - loss 0.01477117 - time (sec): 174.27 - samples/sec: 7549.15 - lr: 0.012500 +2023-04-06 05:49:39,209 epoch 134 - iter 2650/2650 - loss 0.01479876 - time (sec): 193.56 - samples/sec: 7555.00 - lr: 0.012500 +2023-04-06 05:49:39,209 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:49:39,209 EPOCH 134 done: loss 0.0148 - lr 0.012500 +2023-04-06 05:49:39,209 BAD EPOCHS (no improvement): 1 +2023-04-06 05:49:39,213 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:49:58,684 epoch 135 - iter 265/2650 - loss 0.01536626 - time (sec): 19.47 - samples/sec: 7510.91 - lr: 0.012500 +2023-04-06 05:50:17,766 epoch 135 - iter 530/2650 - loss 0.01467966 - time (sec): 38.55 - samples/sec: 7599.05 - lr: 0.012500 +2023-04-06 05:50:36,752 epoch 135 - iter 795/2650 - loss 0.01483821 - time (sec): 57.54 - samples/sec: 7636.84 - lr: 0.012500 +2023-04-06 05:50:56,102 epoch 135 - iter 1060/2650 - loss 0.01454432 - time (sec): 76.89 - samples/sec: 7629.91 - lr: 0.012500 +2023-04-06 05:51:14,508 epoch 135 - iter 1325/2650 - loss 0.01465525 - time (sec): 95.29 - samples/sec: 7662.09 - lr: 0.012500 +2023-04-06 05:51:34,360 epoch 135 - iter 1590/2650 - loss 0.01470205 - time (sec): 115.15 - samples/sec: 7613.35 - lr: 0.012500 +2023-04-06 05:51:54,301 epoch 135 - iter 1855/2650 - loss 0.01484550 - time (sec): 135.09 - samples/sec: 7579.60 - lr: 0.012500 +2023-04-06 05:52:13,391 epoch 135 - iter 2120/2650 - loss 0.01474346 - time (sec): 154.18 - samples/sec: 7587.99 - lr: 0.012500 +2023-04-06 05:52:33,126 epoch 135 - iter 2385/2650 - loss 0.01471970 - time (sec): 173.91 - samples/sec: 7572.28 - lr: 0.012500 +2023-04-06 05:52:52,946 epoch 135 - iter 2650/2650 - loss 0.01456113 - time (sec): 193.73 - samples/sec: 7548.36 - lr: 0.012500 +2023-04-06 05:52:52,947 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:52:52,947 EPOCH 135 done: loss 0.0146 - lr 0.012500 +2023-04-06 05:52:52,947 BAD EPOCHS (no improvement): 2 +2023-04-06 05:52:52,950 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:53:12,206 epoch 136 - iter 265/2650 - loss 0.01441718 - time (sec): 19.26 - samples/sec: 7606.99 - lr: 0.012500 +2023-04-06 05:53:31,136 epoch 136 - iter 530/2650 - loss 0.01404814 - time (sec): 38.19 - samples/sec: 7637.20 - lr: 0.012500 +2023-04-06 05:53:50,751 epoch 136 - iter 795/2650 - loss 0.01430622 - time (sec): 57.80 - samples/sec: 7567.07 - lr: 0.012500 +2023-04-06 05:54:09,669 epoch 136 - iter 1060/2650 - loss 0.01443636 - time (sec): 76.72 - samples/sec: 7617.86 - lr: 0.012500 +2023-04-06 05:54:29,302 epoch 136 - iter 1325/2650 - loss 0.01435117 - time (sec): 96.35 - samples/sec: 7596.06 - lr: 0.012500 +2023-04-06 05:54:48,401 epoch 136 - iter 1590/2650 - loss 0.01442731 - time (sec): 115.45 - samples/sec: 7603.86 - lr: 0.012500 +2023-04-06 05:55:08,104 epoch 136 - iter 1855/2650 - loss 0.01440801 - time (sec): 135.15 - samples/sec: 7585.67 - lr: 0.012500 +2023-04-06 05:55:27,737 epoch 136 - iter 2120/2650 - loss 0.01439947 - time (sec): 154.79 - samples/sec: 7568.15 - lr: 0.012500 +2023-04-06 05:55:56,689 epoch 136 - iter 2385/2650 - loss 0.01448215 - time (sec): 183.74 - samples/sec: 7162.90 - lr: 0.012500 +2023-04-06 05:56:16,139 epoch 136 - iter 2650/2650 - loss 0.01442108 - time (sec): 203.19 - samples/sec: 7197.04 - lr: 0.012500 +2023-04-06 05:56:16,140 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:56:16,140 EPOCH 136 done: loss 0.0144 - lr 0.012500 +2023-04-06 05:56:16,140 BAD EPOCHS (no improvement): 0 +2023-04-06 05:56:16,143 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:56:35,544 epoch 137 - iter 265/2650 - loss 0.01418556 - time (sec): 19.40 - samples/sec: 7487.81 - lr: 0.012500 +2023-04-06 05:56:54,880 epoch 137 - iter 530/2650 - loss 0.01440564 - time (sec): 38.74 - samples/sec: 7553.99 - lr: 0.012500 +2023-04-06 05:57:14,854 epoch 137 - iter 795/2650 - loss 0.01466204 - time (sec): 58.71 - samples/sec: 7470.50 - lr: 0.012500 +2023-04-06 05:57:34,415 epoch 137 - iter 1060/2650 - loss 0.01454787 - time (sec): 78.27 - samples/sec: 7494.09 - lr: 0.012500 +2023-04-06 05:57:53,576 epoch 137 - iter 1325/2650 - loss 0.01459829 - time (sec): 97.43 - samples/sec: 7517.48 - lr: 0.012500 +2023-04-06 05:58:12,892 epoch 137 - iter 1590/2650 - loss 0.01479954 - time (sec): 116.75 - samples/sec: 7532.83 - lr: 0.012500 +2023-04-06 05:58:31,880 epoch 137 - iter 1855/2650 - loss 0.01476799 - time (sec): 135.74 - samples/sec: 7555.51 - lr: 0.012500 +2023-04-06 05:58:51,109 epoch 137 - iter 2120/2650 - loss 0.01470614 - time (sec): 154.97 - samples/sec: 7550.95 - lr: 0.012500 +2023-04-06 05:59:10,367 epoch 137 - iter 2385/2650 - loss 0.01464214 - time (sec): 174.22 - samples/sec: 7554.78 - lr: 0.012500 +2023-04-06 05:59:29,923 epoch 137 - iter 2650/2650 - loss 0.01458605 - time (sec): 193.78 - samples/sec: 7546.53 - lr: 0.012500 +2023-04-06 05:59:29,923 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:59:29,923 EPOCH 137 done: loss 0.0146 - lr 0.012500 +2023-04-06 05:59:29,923 BAD EPOCHS (no improvement): 1 +2023-04-06 05:59:29,925 ---------------------------------------------------------------------------------------------------- +2023-04-06 05:59:49,431 epoch 138 - iter 265/2650 - loss 0.01387904 - time (sec): 19.51 - samples/sec: 7516.98 - lr: 0.012500 +2023-04-06 06:00:08,708 epoch 138 - iter 530/2650 - loss 0.01413778 - time (sec): 38.78 - samples/sec: 7514.24 - lr: 0.012500 +2023-04-06 06:00:28,031 epoch 138 - iter 795/2650 - loss 0.01417219 - time (sec): 58.11 - samples/sec: 7556.13 - lr: 0.012500 +2023-04-06 06:00:47,304 epoch 138 - iter 1060/2650 - loss 0.01402947 - time (sec): 77.38 - samples/sec: 7557.51 - lr: 0.012500 +2023-04-06 06:01:06,419 epoch 138 - iter 1325/2650 - loss 0.01410139 - time (sec): 96.49 - samples/sec: 7562.92 - lr: 0.012500 +2023-04-06 06:01:25,520 epoch 138 - iter 1590/2650 - loss 0.01423930 - time (sec): 115.59 - samples/sec: 7585.03 - lr: 0.012500 +2023-04-06 06:01:45,120 epoch 138 - iter 1855/2650 - loss 0.01419281 - time (sec): 135.19 - samples/sec: 7565.23 - lr: 0.012500 +2023-04-06 06:02:04,645 epoch 138 - iter 2120/2650 - loss 0.01413906 - time (sec): 154.72 - samples/sec: 7560.99 - lr: 0.012500 +2023-04-06 06:02:24,388 epoch 138 - iter 2385/2650 - loss 0.01407052 - time (sec): 174.46 - samples/sec: 7545.44 - lr: 0.012500 +2023-04-06 06:02:44,140 epoch 138 - iter 2650/2650 - loss 0.01409925 - time (sec): 194.21 - samples/sec: 7529.62 - lr: 0.012500 +2023-04-06 06:02:44,141 ---------------------------------------------------------------------------------------------------- +2023-04-06 06:02:44,141 EPOCH 138 done: loss 0.0141 - lr 0.012500 +2023-04-06 06:02:44,141 BAD EPOCHS (no improvement): 0 +2023-04-06 06:02:44,145 ---------------------------------------------------------------------------------------------------- +2023-04-06 06:03:03,505 epoch 139 - iter 265/2650 - loss 0.01371773 - time (sec): 19.36 - samples/sec: 7502.62 - lr: 0.012500 +2023-04-06 06:03:22,884 epoch 139 - iter 530/2650 - loss 0.01398037 - time (sec): 38.74 - samples/sec: 7521.65 - lr: 0.012500 +2023-04-06 06:03:42,336 epoch 139 - iter 795/2650 - loss 0.01426211 - time (sec): 58.19 - samples/sec: 7530.80 - lr: 0.012500 +2023-04-06 06:04:01,748 epoch 139 - iter 1060/2650 - loss 0.01412886 - time (sec): 77.60 - samples/sec: 7530.13 - lr: 0.012500 +2023-04-06 06:04:21,062 epoch 139 - iter 1325/2650 - loss 0.01436571 - time (sec): 96.92 - samples/sec: 7532.59 - lr: 0.012500 +2023-04-06 06:04:40,471 epoch 139 - iter 1590/2650 - loss 0.01435607 - time (sec): 116.33 - samples/sec: 7544.25 - lr: 0.012500 +2023-04-06 06:05:00,303 epoch 139 - iter 1855/2650 - loss 0.01431783 - time (sec): 136.16 - samples/sec: 7532.75 - lr: 0.012500 +2023-04-06 06:05:19,735 epoch 139 - iter 2120/2650 - loss 0.01428623 - time (sec): 155.59 - samples/sec: 7538.18 - lr: 0.012500 +2023-04-06 06:05:38,948 epoch 139 - iter 2385/2650 - loss 0.01427922 - time (sec): 174.80 - samples/sec: 7544.83 - lr: 0.012500 +2023-04-06 06:05:58,023 epoch 139 - iter 2650/2650 - loss 0.01434115 - time (sec): 193.88 - samples/sec: 7542.70 - lr: 0.012500 +2023-04-06 06:05:58,023 ---------------------------------------------------------------------------------------------------- +2023-04-06 06:05:58,023 EPOCH 139 done: loss 0.0143 - lr 0.012500 +2023-04-06 06:05:58,023 BAD EPOCHS (no improvement): 1 +2023-04-06 06:05:58,026 ---------------------------------------------------------------------------------------------------- +2023-04-06 06:06:17,155 epoch 140 - iter 265/2650 - loss 0.01388865 - time (sec): 19.13 - samples/sec: 7612.04 - lr: 0.012500 +2023-04-06 06:06:36,950 epoch 140 - iter 530/2650 - loss 0.01412673 - time (sec): 38.92 - samples/sec: 7524.84 - lr: 0.012500 +2023-04-06 06:06:56,634 epoch 140 - iter 795/2650 - loss 0.01444320 - time (sec): 58.61 - samples/sec: 7483.20 - lr: 0.012500 +2023-04-06 06:07:15,709 epoch 140 - iter 1060/2650 - loss 0.01426230 - time (sec): 77.68 - samples/sec: 7497.09 - lr: 0.012500 +2023-04-06 06:07:34,901 epoch 140 - iter 1325/2650 - loss 0.01404629 - time (sec): 96.87 - samples/sec: 7516.03 - lr: 0.012500 +2023-04-06 06:07:54,177 epoch 140 - iter 1590/2650 - loss 0.01417075 - time (sec): 116.15 - samples/sec: 7537.23 - lr: 0.012500 +2023-04-06 06:08:13,602 epoch 140 - iter 1855/2650 - loss 0.01410698 - time (sec): 135.58 - samples/sec: 7545.13 - lr: 0.012500 +2023-04-06 06:08:32,973 epoch 140 - iter 2120/2650 - loss 0.01420417 - time (sec): 154.95 - samples/sec: 7543.83 - lr: 0.012500 +2023-04-06 06:08:52,114 epoch 140 - iter 2385/2650 - loss 0.01431294 - time (sec): 174.09 - samples/sec: 7552.37 - lr: 0.012500 +2023-04-06 06:09:11,976 epoch 140 - iter 2650/2650 - loss 0.01426967 - time (sec): 193.95 - samples/sec: 7539.93 - lr: 0.012500 +2023-04-06 06:09:11,976 ---------------------------------------------------------------------------------------------------- +2023-04-06 06:09:11,976 EPOCH 140 done: loss 0.0143 - lr 0.012500 +2023-04-06 06:09:11,976 BAD EPOCHS (no improvement): 2 +2023-04-06 06:09:11,979 ---------------------------------------------------------------------------------------------------- +2023-04-06 06:09:31,085 epoch 141 - iter 265/2650 - loss 0.01483339 - time (sec): 19.11 - samples/sec: 7691.85 - lr: 0.012500 +2023-04-06 06:09:50,692 epoch 141 - iter 530/2650 - loss 0.01421327 - time (sec): 38.71 - samples/sec: 7550.01 - lr: 0.012500 +2023-04-06 06:10:09,939 epoch 141 - iter 795/2650 - loss 0.01421356 - time (sec): 57.96 - samples/sec: 7545.94 - lr: 0.012500 +2023-04-06 06:10:28,557 epoch 141 - iter 1060/2650 - loss 0.01401051 - time (sec): 76.58 - samples/sec: 7598.22 - lr: 0.012500 +2023-04-06 06:10:47,708 epoch 141 - iter 1325/2650 - loss 0.01386224 - time (sec): 95.73 - samples/sec: 7603.73 - lr: 0.012500 +2023-04-06 06:11:07,253 epoch 141 - iter 1590/2650 - loss 0.01376792 - time (sec): 115.27 - samples/sec: 7589.31 - lr: 0.012500 +2023-04-06 06:11:26,720 epoch 141 - iter 1855/2650 - loss 0.01388443 - time (sec): 134.74 - samples/sec: 7584.78 - lr: 0.012500 +2023-04-06 06:11:45,849 epoch 141 - iter 2120/2650 - loss 0.01397421 - time (sec): 153.87 - samples/sec: 7586.05 - lr: 0.012500 +2023-04-06 06:12:05,071 epoch 141 - iter 2385/2650 - loss 0.01401607 - time (sec): 173.09 - samples/sec: 7588.91 - lr: 0.012500 +2023-04-06 06:12:25,643 epoch 141 - iter 2650/2650 - loss 0.01398971 - time (sec): 193.66 - samples/sec: 7551.04 - lr: 0.012500 +2023-04-06 06:12:25,643 ---------------------------------------------------------------------------------------------------- +2023-04-06 06:12:25,644 EPOCH 141 done: loss 0.0140 - lr 0.012500 +2023-04-06 06:12:25,644 BAD EPOCHS (no improvement): 0 +2023-04-06 06:12:25,647 ---------------------------------------------------------------------------------------------------- +2023-04-06 06:12:45,272 epoch 142 - iter 265/2650 - loss 0.01492568 - time (sec): 19.63 - samples/sec: 7471.85 - lr: 0.012500 +2023-04-06 06:13:04,403 epoch 142 - iter 530/2650 - loss 0.01491387 - time (sec): 38.76 - samples/sec: 7525.58 - lr: 0.012500 +2023-04-06 06:13:23,827 epoch 142 - iter 795/2650 - loss 0.01493666 - time (sec): 58.18 - samples/sec: 7534.23 - lr: 0.012500 +2023-04-06 06:13:43,009 epoch 142 - iter 1060/2650 - loss 0.01469487 - time (sec): 77.36 - samples/sec: 7552.93 - lr: 0.012500 +2023-04-06 06:14:02,295 epoch 142 - iter 1325/2650 - loss 0.01457024 - time (sec): 96.65 - samples/sec: 7567.52 - lr: 0.012500 +2023-04-06 06:14:21,615 epoch 142 - iter 1590/2650 - loss 0.01462338 - time (sec): 115.97 - samples/sec: 7580.24 - lr: 0.012500 +2023-04-06 06:14:40,841 epoch 142 - iter 1855/2650 - loss 0.01455104 - time (sec): 135.19 - samples/sec: 7560.59 - lr: 0.012500 +2023-04-06 06:15:00,266 epoch 142 - iter 2120/2650 - loss 0.01464407 - time (sec): 154.62 - samples/sec: 7567.31 - lr: 0.012500 +2023-04-06 06:15:19,623 epoch 142 - iter 2385/2650 - loss 0.01442747 - time (sec): 173.98 - samples/sec: 7565.96 - lr: 0.012500 +2023-04-06 06:15:39,477 epoch 142 - iter 2650/2650 - loss 0.01442749 - time (sec): 193.83 - samples/sec: 7544.58 - lr: 0.012500 +2023-04-06 06:15:39,477 ---------------------------------------------------------------------------------------------------- +2023-04-06 06:15:39,477 EPOCH 142 done: loss 0.0144 - lr 0.012500 +2023-04-06 06:15:39,477 BAD EPOCHS (no improvement): 1 +2023-04-06 06:15:39,480 ---------------------------------------------------------------------------------------------------- +2023-04-06 06:15:58,813 epoch 143 - iter 265/2650 - loss 0.01342462 - time (sec): 19.33 - samples/sec: 7586.76 - lr: 0.012500 +2023-04-06 06:16:17,904 epoch 143 - iter 530/2650 - loss 0.01399027 - time (sec): 38.42 - samples/sec: 7613.30 - lr: 0.012500 +2023-04-06 06:16:37,406 epoch 143 - iter 795/2650 - loss 0.01393818 - time (sec): 57.93 - samples/sec: 7577.84 - lr: 0.012500 +2023-04-06 06:16:57,208 epoch 143 - iter 1060/2650 - loss 0.01379454 - time (sec): 77.73 - samples/sec: 7524.77 - lr: 0.012500 +2023-04-06 06:17:16,711 epoch 143 - iter 1325/2650 - loss 0.01415027 - time (sec): 97.23 - samples/sec: 7527.34 - lr: 0.012500 +2023-04-06 06:17:35,816 epoch 143 - iter 1590/2650 - loss 0.01426226 - time (sec): 116.34 - samples/sec: 7564.19 - lr: 0.012500 +2023-04-06 06:17:55,396 epoch 143 - iter 1855/2650 - loss 0.01416672 - time (sec): 135.92 - samples/sec: 7546.90 - lr: 0.012500 +2023-04-06 06:18:14,599 epoch 143 - iter 2120/2650 - loss 0.01414412 - time (sec): 155.12 - samples/sec: 7560.38 - lr: 0.012500 +2023-04-06 06:18:33,549 epoch 143 - iter 2385/2650 - loss 0.01417352 - time (sec): 174.07 - samples/sec: 7567.48 - lr: 0.012500 +2023-04-06 06:18:52,945 epoch 143 - iter 2650/2650 - loss 0.01415801 - time (sec): 193.47 - samples/sec: 7558.80 - lr: 0.012500 +2023-04-06 06:18:52,946 ---------------------------------------------------------------------------------------------------- +2023-04-06 06:18:52,946 EPOCH 143 done: loss 0.0142 - lr 0.012500 +2023-04-06 06:18:52,946 BAD EPOCHS (no improvement): 2 +2023-04-06 06:18:52,950 ---------------------------------------------------------------------------------------------------- +2023-04-06 06:19:13,230 epoch 144 - iter 265/2650 - loss 0.01439706 - time (sec): 20.28 - samples/sec: 7281.39 - lr: 0.012500 +2023-04-06 06:19:32,097 epoch 144 - iter 530/2650 - loss 0.01460570 - time (sec): 39.15 - samples/sec: 7498.94 - lr: 0.012500 +2023-04-06 06:19:51,181 epoch 144 - iter 795/2650 - loss 0.01447005 - time (sec): 58.23 - samples/sec: 7526.91 - lr: 0.012500 +2023-04-06 06:20:10,808 epoch 144 - iter 1060/2650 - loss 0.01429584 - time (sec): 77.86 - samples/sec: 7518.26 - lr: 0.012500 +2023-04-06 06:20:30,101 epoch 144 - iter 1325/2650 - loss 0.01433315 - time (sec): 97.15 - samples/sec: 7544.39 - lr: 0.012500 +2023-04-06 06:20:49,528 epoch 144 - iter 1590/2650 - loss 0.01429718 - time (sec): 116.58 - samples/sec: 7542.67 - lr: 0.012500 +2023-04-06 06:21:09,281 epoch 144 - iter 1855/2650 - loss 0.01432114 - time (sec): 136.33 - samples/sec: 7519.67 - lr: 0.012500 +2023-04-06 06:21:28,496 epoch 144 - iter 2120/2650 - loss 0.01426102 - time (sec): 155.55 - samples/sec: 7528.75 - lr: 0.012500 +2023-04-06 06:21:47,225 epoch 144 - iter 2385/2650 - loss 0.01412843 - time (sec): 174.28 - samples/sec: 7557.57 - lr: 0.012500 +2023-04-06 06:22:06,502 epoch 144 - iter 2650/2650 - loss 0.01404888 - time (sec): 193.55 - samples/sec: 7555.41 - lr: 0.012500 +2023-04-06 06:22:06,502 ---------------------------------------------------------------------------------------------------- +2023-04-06 06:22:06,502 EPOCH 144 done: loss 0.0140 - lr 0.012500 +2023-04-06 06:22:06,502 BAD EPOCHS (no improvement): 3 +2023-04-06 06:22:06,506 ---------------------------------------------------------------------------------------------------- +2023-04-06 06:22:25,653 epoch 145 - iter 265/2650 - loss 0.01311236 - time (sec): 19.15 - samples/sec: 7619.58 - lr: 0.012500 +2023-04-06 06:22:44,408 epoch 145 - iter 530/2650 - loss 0.01345983 - time (sec): 37.90 - samples/sec: 7643.92 - lr: 0.012500 +2023-04-06 06:23:03,812 epoch 145 - iter 795/2650 - loss 0.01331181 - time (sec): 57.31 - samples/sec: 7601.85 - lr: 0.012500 +2023-04-06 06:23:24,110 epoch 145 - iter 1060/2650 - loss 0.01325242 - time (sec): 77.60 - samples/sec: 7538.83 - lr: 0.012500 +2023-04-06 06:23:43,830 epoch 145 - iter 1325/2650 - loss 0.01335888 - time (sec): 97.32 - samples/sec: 7530.14 - lr: 0.012500 +2023-04-06 06:24:02,494 epoch 145 - iter 1590/2650 - loss 0.01347614 - time (sec): 115.99 - samples/sec: 7558.09 - lr: 0.012500 +2023-04-06 06:24:22,216 epoch 145 - iter 1855/2650 - loss 0.01356882 - time (sec): 135.71 - samples/sec: 7544.91 - lr: 0.012500 +2023-04-06 06:24:41,584 epoch 145 - iter 2120/2650 - loss 0.01375189 - time (sec): 155.08 - samples/sec: 7547.38 - lr: 0.012500 +2023-04-06 06:25:01,376 epoch 145 - iter 2385/2650 - loss 0.01385438 - time (sec): 174.87 - samples/sec: 7525.13 - lr: 0.012500 +2023-04-06 06:25:20,693 epoch 145 - iter 2650/2650 - loss 0.01388776 - time (sec): 194.19 - samples/sec: 7530.71 - lr: 0.012500 +2023-04-06 06:25:20,693 ---------------------------------------------------------------------------------------------------- +2023-04-06 06:25:20,693 EPOCH 145 done: loss 0.0139 - lr 0.012500 +2023-04-06 06:25:20,693 BAD EPOCHS (no improvement): 0 +2023-04-06 06:25:20,697 ---------------------------------------------------------------------------------------------------- +2023-04-06 06:25:40,333 epoch 146 - iter 265/2650 - loss 0.01455168 - time (sec): 19.64 - samples/sec: 7403.36 - lr: 0.012500 +2023-04-06 06:25:59,169 epoch 146 - iter 530/2650 - loss 0.01398470 - time (sec): 38.47 - samples/sec: 7565.48 - lr: 0.012500 +2023-04-06 06:26:18,869 epoch 146 - iter 795/2650 - loss 0.01401679 - time (sec): 58.17 - samples/sec: 7540.09 - lr: 0.012500 +2023-04-06 06:26:38,052 epoch 146 - iter 1060/2650 - loss 0.01379408 - time (sec): 77.35 - samples/sec: 7549.56 - lr: 0.012500 +2023-04-06 06:26:57,596 epoch 146 - iter 1325/2650 - loss 0.01412683 - time (sec): 96.90 - samples/sec: 7531.75 - lr: 0.012500 +2023-04-06 06:27:16,587 epoch 146 - iter 1590/2650 - loss 0.01408474 - time (sec): 115.89 - samples/sec: 7563.33 - lr: 0.012500 +2023-04-06 06:27:36,384 epoch 146 - iter 1855/2650 - loss 0.01411956 - time (sec): 135.69 - samples/sec: 7551.18 - lr: 0.012500 +2023-04-06 06:27:56,469 epoch 146 - iter 2120/2650 - loss 0.01406314 - time (sec): 155.77 - samples/sec: 7515.15 - lr: 0.012500 +2023-04-06 06:28:15,731 epoch 146 - iter 2385/2650 - loss 0.01403210 - time (sec): 175.03 - samples/sec: 7515.80 - lr: 0.012500 +2023-04-06 06:28:34,767 epoch 146 - iter 2650/2650 - loss 0.01407356 - time (sec): 194.07 - samples/sec: 7535.24 - lr: 0.012500 +2023-04-06 06:28:34,768 ---------------------------------------------------------------------------------------------------- +2023-04-06 06:28:34,768 EPOCH 146 done: loss 0.0141 - lr 0.012500 +2023-04-06 06:28:34,768 BAD EPOCHS (no improvement): 1 +2023-04-06 06:28:34,771 ---------------------------------------------------------------------------------------------------- +2023-04-06 06:28:54,217 epoch 147 - iter 265/2650 - loss 0.01418719 - time (sec): 19.45 - samples/sec: 7502.48 - lr: 0.012500 +2023-04-06 06:29:13,710 epoch 147 - iter 530/2650 - loss 0.01411179 - time (sec): 38.94 - samples/sec: 7463.49 - lr: 0.012500 +2023-04-06 06:29:33,020 epoch 147 - iter 795/2650 - loss 0.01412138 - time (sec): 58.25 - samples/sec: 7536.43 - lr: 0.012500 +2023-04-06 06:29:52,262 epoch 147 - iter 1060/2650 - loss 0.01396798 - time (sec): 77.49 - samples/sec: 7551.24 - lr: 0.012500 +2023-04-06 06:30:11,013 epoch 147 - iter 1325/2650 - loss 0.01399830 - time (sec): 96.24 - samples/sec: 7588.42 - lr: 0.012500 +2023-04-06 06:30:30,030 epoch 147 - iter 1590/2650 - loss 0.01387271 - time (sec): 115.26 - samples/sec: 7599.16 - lr: 0.012500 +2023-04-06 06:30:49,647 epoch 147 - iter 1855/2650 - loss 0.01384587 - time (sec): 134.88 - samples/sec: 7575.70 - lr: 0.012500 +2023-04-06 06:31:09,479 epoch 147 - iter 2120/2650 - loss 0.01375414 - time (sec): 154.71 - samples/sec: 7552.97 - lr: 0.012500 +2023-04-06 06:31:29,283 epoch 147 - iter 2385/2650 - loss 0.01386285 - time (sec): 174.51 - samples/sec: 7538.87 - lr: 0.012500 +2023-04-06 06:31:48,474 epoch 147 - iter 2650/2650 - loss 0.01388996 - time (sec): 193.70 - samples/sec: 7549.55 - lr: 0.012500 +2023-04-06 06:31:48,474 ---------------------------------------------------------------------------------------------------- +2023-04-06 06:31:48,474 EPOCH 147 done: loss 0.0139 - lr 0.012500 +2023-04-06 06:31:48,474 BAD EPOCHS (no improvement): 2 +2023-04-06 06:31:48,478 ---------------------------------------------------------------------------------------------------- +2023-04-06 06:32:07,471 epoch 148 - iter 265/2650 - loss 0.01381004 - time (sec): 18.99 - samples/sec: 7643.01 - lr: 0.012500 +2023-04-06 06:32:27,043 epoch 148 - iter 530/2650 - loss 0.01378548 - time (sec): 38.56 - samples/sec: 7561.93 - lr: 0.012500 +2023-04-06 06:32:46,643 epoch 148 - iter 795/2650 - loss 0.01400589 - time (sec): 58.16 - samples/sec: 7530.61 - lr: 0.012500 +2023-04-06 06:33:05,984 epoch 148 - iter 1060/2650 - loss 0.01382955 - time (sec): 77.50 - samples/sec: 7517.63 - lr: 0.012500 +2023-04-06 06:33:25,204 epoch 148 - iter 1325/2650 - loss 0.01385333 - time (sec): 96.73 - samples/sec: 7540.77 - lr: 0.012500 +2023-04-06 06:33:44,251 epoch 148 - iter 1590/2650 - loss 0.01364464 - time (sec): 115.77 - samples/sec: 7572.58 - lr: 0.012500 +2023-04-06 06:34:03,865 epoch 148 - iter 1855/2650 - loss 0.01356889 - time (sec): 135.39 - samples/sec: 7549.23 - lr: 0.012500 +2023-04-06 06:34:23,007 epoch 148 - iter 2120/2650 - loss 0.01379351 - time (sec): 154.53 - samples/sec: 7558.19 - lr: 0.012500 +2023-04-06 06:34:42,509 epoch 148 - iter 2385/2650 - loss 0.01379599 - time (sec): 174.03 - samples/sec: 7555.43 - lr: 0.012500 +2023-04-06 06:35:02,098 epoch 148 - iter 2650/2650 - loss 0.01377780 - time (sec): 193.62 - samples/sec: 7552.78 - lr: 0.012500 +2023-04-06 06:35:02,098 ---------------------------------------------------------------------------------------------------- +2023-04-06 06:35:02,098 EPOCH 148 done: loss 0.0138 - lr 0.012500 +2023-04-06 06:35:02,098 BAD EPOCHS (no improvement): 0 +2023-04-06 06:35:02,102 ---------------------------------------------------------------------------------------------------- +2023-04-06 06:35:21,337 epoch 149 - iter 265/2650 - loss 0.01349160 - time (sec): 19.23 - samples/sec: 7530.39 - lr: 0.012500 +2023-04-06 06:35:40,832 epoch 149 - iter 530/2650 - loss 0.01332417 - time (sec): 38.73 - samples/sec: 7581.07 - lr: 0.012500 +2023-04-06 06:35:59,732 epoch 149 - iter 795/2650 - loss 0.01344141 - time (sec): 57.63 - samples/sec: 7621.96 - lr: 0.012500 +2023-04-06 06:36:18,867 epoch 149 - iter 1060/2650 - loss 0.01359838 - time (sec): 76.76 - samples/sec: 7605.84 - lr: 0.012500 +2023-04-06 06:36:38,601 epoch 149 - iter 1325/2650 - loss 0.01373508 - time (sec): 96.50 - samples/sec: 7585.66 - lr: 0.012500 +2023-04-06 06:36:58,180 epoch 149 - iter 1590/2650 - loss 0.01366690 - time (sec): 116.08 - samples/sec: 7574.86 - lr: 0.012500 +2023-04-06 06:37:17,459 epoch 149 - iter 1855/2650 - loss 0.01368187 - time (sec): 135.36 - samples/sec: 7573.26 - lr: 0.012500 +2023-04-06 06:37:36,823 epoch 149 - iter 2120/2650 - loss 0.01367709 - time (sec): 154.72 - samples/sec: 7573.34 - lr: 0.012500 +2023-04-06 06:37:55,833 epoch 149 - iter 2385/2650 - loss 0.01376543 - time (sec): 173.73 - samples/sec: 7584.03 - lr: 0.012500 +2023-04-06 06:38:15,407 epoch 149 - iter 2650/2650 - loss 0.01381202 - time (sec): 193.30 - samples/sec: 7565.07 - lr: 0.012500 +2023-04-06 06:38:15,407 ---------------------------------------------------------------------------------------------------- +2023-04-06 06:38:15,407 EPOCH 149 done: loss 0.0138 - lr 0.012500 +2023-04-06 06:38:15,407 BAD EPOCHS (no improvement): 1 +2023-04-06 06:38:15,411 ---------------------------------------------------------------------------------------------------- +2023-04-06 06:38:34,363 epoch 150 - iter 265/2650 - loss 0.01307237 - time (sec): 18.95 - samples/sec: 7651.57 - lr: 0.012500 +2023-04-06 06:38:53,718 epoch 150 - iter 530/2650 - loss 0.01364276 - time (sec): 38.31 - samples/sec: 7563.62 - lr: 0.012500 +2023-04-06 06:39:12,803 epoch 150 - iter 795/2650 - loss 0.01353410 - time (sec): 57.39 - samples/sec: 7616.72 - lr: 0.012500 +2023-04-06 06:39:32,501 epoch 150 - iter 1060/2650 - loss 0.01331620 - time (sec): 77.09 - samples/sec: 7579.86 - lr: 0.012500 +2023-04-06 06:39:51,368 epoch 150 - iter 1325/2650 - loss 0.01338058 - time (sec): 95.96 - samples/sec: 7602.26 - lr: 0.012500 +2023-04-06 06:40:11,198 epoch 150 - iter 1590/2650 - loss 0.01352856 - time (sec): 115.79 - samples/sec: 7567.79 - lr: 0.012500 +2023-04-06 06:40:30,094 epoch 150 - iter 1855/2650 - loss 0.01353281 - time (sec): 134.68 - samples/sec: 7588.53 - lr: 0.012500 +2023-04-06 06:40:49,339 epoch 150 - iter 2120/2650 - loss 0.01353930 - time (sec): 153.93 - samples/sec: 7591.61 - lr: 0.012500 +2023-04-06 06:41:08,425 epoch 150 - iter 2385/2650 - loss 0.01353857 - time (sec): 173.01 - samples/sec: 7595.69 - lr: 0.012500 +2023-04-06 06:41:28,425 epoch 150 - iter 2650/2650 - loss 0.01360721 - time (sec): 193.01 - samples/sec: 7576.47 - lr: 0.012500 +2023-04-06 06:41:28,426 ---------------------------------------------------------------------------------------------------- +2023-04-06 06:41:28,426 EPOCH 150 done: loss 0.0136 - lr 0.012500 +2023-04-06 06:41:28,426 BAD EPOCHS (no improvement): 0 +2023-04-06 06:41:36,515 ---------------------------------------------------------------------------------------------------- +2023-04-06 06:41:36,515 Testing using last state of model ... +2023-04-06 06:42:14,804 Evaluating as a multi-label problem: False +2023-04-06 06:42:14,874 0.8966 0.8885 0.8926 0.8242 +2023-04-06 06:42:14,874 +Results: +- F-score (micro) 0.8926 +- F-score (macro) 0.8017 +- Accuracy 0.8242 + +By class: + precision recall f1-score support + + GPE 0.9649 0.9576 0.9612 2240 + PERSON 0.9410 0.9311 0.9360 1988 + ORG 0.8985 0.8925 0.8955 1795 + DATE 0.8679 0.8695 0.8687 1602 + CARDINAL 0.8594 0.8299 0.8444 935 + NORP 0.9010 0.9203 0.9106 841 + PERCENT 0.9107 0.9054 0.9080 349 + MONEY 0.9085 0.9172 0.9128 314 + TIME 0.6605 0.6698 0.6651 212 + ORDINAL 0.8020 0.8308 0.8161 195 + LOC 0.7771 0.7598 0.7684 179 + WORK_OF_ART 0.7007 0.6205 0.6581 166 + FAC 0.7674 0.7333 0.7500 135 + QUANTITY 0.7890 0.8190 0.8037 105 + PRODUCT 0.7606 0.7105 0.7347 76 + EVENT 0.6833 0.6508 0.6667 63 + LAW 0.7241 0.5250 0.6087 40 + LANGUAGE 0.9286 0.5909 0.7222 22 + + micro avg 0.8966 0.8885 0.8926 11257 + macro avg 0.8247 0.7852 0.8017 11257 +weighted avg 0.8962 0.8885 0.8921 11257 + +2023-04-06 06:42:14,875 ----------------------------------------------------------------------------------------------------