|
2021-12-31 08:35:07,676 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 08:35:07,680 Model: "SequenceTagger( |
|
(embeddings): StackedEmbeddings( |
|
(list_embedding_0): FlairEmbeddings( |
|
(lm): LanguageModel( |
|
(drop): Dropout(p=0.5, inplace=False) |
|
(encoder): Embedding(275, 100) |
|
(rnn): LSTM(100, 1024) |
|
(decoder): Linear(in_features=1024, out_features=275, bias=True) |
|
) |
|
) |
|
(list_embedding_1): FlairEmbeddings( |
|
(lm): LanguageModel( |
|
(drop): Dropout(p=0.5, inplace=False) |
|
(encoder): Embedding(275, 100) |
|
(rnn): LSTM(100, 1024) |
|
(decoder): Linear(in_features=1024, out_features=275, bias=True) |
|
) |
|
) |
|
(list_embedding_2): TransformerWordEmbeddings( |
|
(model): CamembertModel( |
|
(embeddings): RobertaEmbeddings( |
|
(word_embeddings): Embedding(32005, 768, padding_idx=1) |
|
(position_embeddings): Embedding(514, 768, padding_idx=1) |
|
(token_type_embeddings): Embedding(1, 768) |
|
(LayerNorm): LayerNorm((768,), eps=1e-05, elementwise_affine=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
(encoder): RobertaEncoder( |
|
(layer): ModuleList( |
|
(0): RobertaLayer( |
|
(attention): RobertaAttention( |
|
(self): RobertaSelfAttention( |
|
(query): Linear(in_features=768, out_features=768, bias=True) |
|
(key): Linear(in_features=768, out_features=768, bias=True) |
|
(value): Linear(in_features=768, out_features=768, bias=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
(output): RobertaSelfOutput( |
|
(dense): Linear(in_features=768, out_features=768, bias=True) |
|
(LayerNorm): LayerNorm((768,), eps=1e-05, elementwise_affine=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
) |
|
(intermediate): RobertaIntermediate( |
|
(dense): Linear(in_features=768, out_features=3072, bias=True) |
|
) |
|
(output): RobertaOutput( |
|
(dense): Linear(in_features=3072, out_features=768, bias=True) |
|
(LayerNorm): LayerNorm((768,), eps=1e-05, elementwise_affine=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
) |
|
(1): RobertaLayer( |
|
(attention): RobertaAttention( |
|
(self): RobertaSelfAttention( |
|
(query): Linear(in_features=768, out_features=768, bias=True) |
|
(key): Linear(in_features=768, out_features=768, bias=True) |
|
(value): Linear(in_features=768, out_features=768, bias=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
(output): RobertaSelfOutput( |
|
(dense): Linear(in_features=768, out_features=768, bias=True) |
|
(LayerNorm): LayerNorm((768,), eps=1e-05, elementwise_affine=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
) |
|
(intermediate): RobertaIntermediate( |
|
(dense): Linear(in_features=768, out_features=3072, bias=True) |
|
) |
|
(output): RobertaOutput( |
|
(dense): Linear(in_features=3072, out_features=768, bias=True) |
|
(LayerNorm): LayerNorm((768,), eps=1e-05, elementwise_affine=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
) |
|
(2): RobertaLayer( |
|
(attention): RobertaAttention( |
|
(self): RobertaSelfAttention( |
|
(query): Linear(in_features=768, out_features=768, bias=True) |
|
(key): Linear(in_features=768, out_features=768, bias=True) |
|
(value): Linear(in_features=768, out_features=768, bias=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
(output): RobertaSelfOutput( |
|
(dense): Linear(in_features=768, out_features=768, bias=True) |
|
(LayerNorm): LayerNorm((768,), eps=1e-05, elementwise_affine=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
) |
|
(intermediate): RobertaIntermediate( |
|
(dense): Linear(in_features=768, out_features=3072, bias=True) |
|
) |
|
(output): RobertaOutput( |
|
(dense): Linear(in_features=3072, out_features=768, bias=True) |
|
(LayerNorm): LayerNorm((768,), eps=1e-05, elementwise_affine=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
) |
|
(3): RobertaLayer( |
|
(attention): RobertaAttention( |
|
(self): RobertaSelfAttention( |
|
(query): Linear(in_features=768, out_features=768, bias=True) |
|
(key): Linear(in_features=768, out_features=768, bias=True) |
|
(value): Linear(in_features=768, out_features=768, bias=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
(output): RobertaSelfOutput( |
|
(dense): Linear(in_features=768, out_features=768, bias=True) |
|
(LayerNorm): LayerNorm((768,), eps=1e-05, elementwise_affine=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
) |
|
(intermediate): RobertaIntermediate( |
|
(dense): Linear(in_features=768, out_features=3072, bias=True) |
|
) |
|
(output): RobertaOutput( |
|
(dense): Linear(in_features=3072, out_features=768, bias=True) |
|
(LayerNorm): LayerNorm((768,), eps=1e-05, elementwise_affine=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
) |
|
(4): RobertaLayer( |
|
(attention): RobertaAttention( |
|
(self): RobertaSelfAttention( |
|
(query): Linear(in_features=768, out_features=768, bias=True) |
|
(key): Linear(in_features=768, out_features=768, bias=True) |
|
(value): Linear(in_features=768, out_features=768, bias=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
(output): RobertaSelfOutput( |
|
(dense): Linear(in_features=768, out_features=768, bias=True) |
|
(LayerNorm): LayerNorm((768,), eps=1e-05, elementwise_affine=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
) |
|
(intermediate): RobertaIntermediate( |
|
(dense): Linear(in_features=768, out_features=3072, bias=True) |
|
) |
|
(output): RobertaOutput( |
|
(dense): Linear(in_features=3072, out_features=768, bias=True) |
|
(LayerNorm): LayerNorm((768,), eps=1e-05, elementwise_affine=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
) |
|
(5): RobertaLayer( |
|
(attention): RobertaAttention( |
|
(self): RobertaSelfAttention( |
|
(query): Linear(in_features=768, out_features=768, bias=True) |
|
(key): Linear(in_features=768, out_features=768, bias=True) |
|
(value): Linear(in_features=768, out_features=768, bias=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
(output): RobertaSelfOutput( |
|
(dense): Linear(in_features=768, out_features=768, bias=True) |
|
(LayerNorm): LayerNorm((768,), eps=1e-05, elementwise_affine=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
) |
|
(intermediate): RobertaIntermediate( |
|
(dense): Linear(in_features=768, out_features=3072, bias=True) |
|
) |
|
(output): RobertaOutput( |
|
(dense): Linear(in_features=3072, out_features=768, bias=True) |
|
(LayerNorm): LayerNorm((768,), eps=1e-05, elementwise_affine=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
) |
|
(6): RobertaLayer( |
|
(attention): RobertaAttention( |
|
(self): RobertaSelfAttention( |
|
(query): Linear(in_features=768, out_features=768, bias=True) |
|
(key): Linear(in_features=768, out_features=768, bias=True) |
|
(value): Linear(in_features=768, out_features=768, bias=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
(output): RobertaSelfOutput( |
|
(dense): Linear(in_features=768, out_features=768, bias=True) |
|
(LayerNorm): LayerNorm((768,), eps=1e-05, elementwise_affine=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
) |
|
(intermediate): RobertaIntermediate( |
|
(dense): Linear(in_features=768, out_features=3072, bias=True) |
|
) |
|
(output): RobertaOutput( |
|
(dense): Linear(in_features=3072, out_features=768, bias=True) |
|
(LayerNorm): LayerNorm((768,), eps=1e-05, elementwise_affine=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
) |
|
(7): RobertaLayer( |
|
(attention): RobertaAttention( |
|
(self): RobertaSelfAttention( |
|
(query): Linear(in_features=768, out_features=768, bias=True) |
|
(key): Linear(in_features=768, out_features=768, bias=True) |
|
(value): Linear(in_features=768, out_features=768, bias=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
(output): RobertaSelfOutput( |
|
(dense): Linear(in_features=768, out_features=768, bias=True) |
|
(LayerNorm): LayerNorm((768,), eps=1e-05, elementwise_affine=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
) |
|
(intermediate): RobertaIntermediate( |
|
(dense): Linear(in_features=768, out_features=3072, bias=True) |
|
) |
|
(output): RobertaOutput( |
|
(dense): Linear(in_features=3072, out_features=768, bias=True) |
|
(LayerNorm): LayerNorm((768,), eps=1e-05, elementwise_affine=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
) |
|
(8): RobertaLayer( |
|
(attention): RobertaAttention( |
|
(self): RobertaSelfAttention( |
|
(query): Linear(in_features=768, out_features=768, bias=True) |
|
(key): Linear(in_features=768, out_features=768, bias=True) |
|
(value): Linear(in_features=768, out_features=768, bias=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
(output): RobertaSelfOutput( |
|
(dense): Linear(in_features=768, out_features=768, bias=True) |
|
(LayerNorm): LayerNorm((768,), eps=1e-05, elementwise_affine=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
) |
|
(intermediate): RobertaIntermediate( |
|
(dense): Linear(in_features=768, out_features=3072, bias=True) |
|
) |
|
(output): RobertaOutput( |
|
(dense): Linear(in_features=3072, out_features=768, bias=True) |
|
(LayerNorm): LayerNorm((768,), eps=1e-05, elementwise_affine=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
) |
|
(9): RobertaLayer( |
|
(attention): RobertaAttention( |
|
(self): RobertaSelfAttention( |
|
(query): Linear(in_features=768, out_features=768, bias=True) |
|
(key): Linear(in_features=768, out_features=768, bias=True) |
|
(value): Linear(in_features=768, out_features=768, bias=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
(output): RobertaSelfOutput( |
|
(dense): Linear(in_features=768, out_features=768, bias=True) |
|
(LayerNorm): LayerNorm((768,), eps=1e-05, elementwise_affine=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
) |
|
(intermediate): RobertaIntermediate( |
|
(dense): Linear(in_features=768, out_features=3072, bias=True) |
|
) |
|
(output): RobertaOutput( |
|
(dense): Linear(in_features=3072, out_features=768, bias=True) |
|
(LayerNorm): LayerNorm((768,), eps=1e-05, elementwise_affine=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
) |
|
(10): RobertaLayer( |
|
(attention): RobertaAttention( |
|
(self): RobertaSelfAttention( |
|
(query): Linear(in_features=768, out_features=768, bias=True) |
|
(key): Linear(in_features=768, out_features=768, bias=True) |
|
(value): Linear(in_features=768, out_features=768, bias=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
(output): RobertaSelfOutput( |
|
(dense): Linear(in_features=768, out_features=768, bias=True) |
|
(LayerNorm): LayerNorm((768,), eps=1e-05, elementwise_affine=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
) |
|
(intermediate): RobertaIntermediate( |
|
(dense): Linear(in_features=768, out_features=3072, bias=True) |
|
) |
|
(output): RobertaOutput( |
|
(dense): Linear(in_features=3072, out_features=768, bias=True) |
|
(LayerNorm): LayerNorm((768,), eps=1e-05, elementwise_affine=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
) |
|
(11): RobertaLayer( |
|
(attention): RobertaAttention( |
|
(self): RobertaSelfAttention( |
|
(query): Linear(in_features=768, out_features=768, bias=True) |
|
(key): Linear(in_features=768, out_features=768, bias=True) |
|
(value): Linear(in_features=768, out_features=768, bias=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
(output): RobertaSelfOutput( |
|
(dense): Linear(in_features=768, out_features=768, bias=True) |
|
(LayerNorm): LayerNorm((768,), eps=1e-05, elementwise_affine=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
) |
|
(intermediate): RobertaIntermediate( |
|
(dense): Linear(in_features=768, out_features=3072, bias=True) |
|
) |
|
(output): RobertaOutput( |
|
(dense): Linear(in_features=3072, out_features=768, bias=True) |
|
(LayerNorm): LayerNorm((768,), eps=1e-05, elementwise_affine=True) |
|
(dropout): Dropout(p=0.1, inplace=False) |
|
) |
|
) |
|
) |
|
) |
|
(pooler): RobertaPooler( |
|
(dense): Linear(in_features=768, out_features=768, bias=True) |
|
(activation): Tanh() |
|
) |
|
) |
|
) |
|
) |
|
(word_dropout): WordDropout(p=0.05) |
|
(locked_dropout): LockedDropout(p=0.5) |
|
(embedding2nn): Linear(in_features=2816, out_features=2816, bias=True) |
|
(rnn): LSTM(2816, 256, batch_first=True, bidirectional=True) |
|
(linear): Linear(in_features=512, out_features=68, bias=True) |
|
(beta): 1.0 |
|
(weights): None |
|
(weight_tensor) None |
|
)" |
|
2021-12-31 08:35:07,680 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 08:35:07,681 Corpus: "Corpus: 14449 train + 1476 dev + 416 test sentences" |
|
2021-12-31 08:35:07,681 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 08:35:07,681 Parameters: |
|
2021-12-31 08:35:07,681 - learning_rate: "0.1" |
|
2021-12-31 08:35:07,681 - mini_batch_size: "8" |
|
2021-12-31 08:35:07,681 - patience: "3" |
|
2021-12-31 08:35:07,681 - anneal_factor: "0.5" |
|
2021-12-31 08:35:07,681 - max_epochs: "50" |
|
2021-12-31 08:35:07,681 - shuffle: "True" |
|
2021-12-31 08:35:07,681 - train_with_dev: "False" |
|
2021-12-31 08:35:07,681 - batch_growth_annealing: "False" |
|
2021-12-31 08:35:07,681 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 08:35:07,681 Model training base path: "models/UPOS_UD_FRENCH_GSD_PLUS_Flair-Embeddings_50_2021-12-31-08:34:44" |
|
2021-12-31 08:35:07,681 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 08:35:07,682 Device: cuda:0 |
|
2021-12-31 08:35:07,682 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 08:35:07,682 Embeddings storage mode: cpu |
|
2021-12-31 08:35:07,686 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 08:35:35,600 epoch 1 - iter 180/1807 - loss 1.43338722 - samples/sec: 51.63 - lr: 0.100000 |
|
2021-12-31 08:36:03,642 epoch 1 - iter 360/1807 - loss 0.97278560 - samples/sec: 51.39 - lr: 0.100000 |
|
2021-12-31 08:36:31,448 epoch 1 - iter 540/1807 - loss 0.77628898 - samples/sec: 51.83 - lr: 0.100000 |
|
2021-12-31 08:37:00,007 epoch 1 - iter 720/1807 - loss 0.66122431 - samples/sec: 50.46 - lr: 0.100000 |
|
2021-12-31 08:37:29,449 epoch 1 - iter 900/1807 - loss 0.58637716 - samples/sec: 48.94 - lr: 0.100000 |
|
2021-12-31 08:37:57,842 epoch 1 - iter 1080/1807 - loss 0.53261867 - samples/sec: 50.75 - lr: 0.100000 |
|
2021-12-31 08:38:27,836 epoch 1 - iter 1260/1807 - loss 0.49236809 - samples/sec: 48.04 - lr: 0.100000 |
|
2021-12-31 08:38:56,177 epoch 1 - iter 1440/1807 - loss 0.46224064 - samples/sec: 50.84 - lr: 0.100000 |
|
2021-12-31 08:39:25,301 epoch 1 - iter 1620/1807 - loss 0.43700232 - samples/sec: 49.48 - lr: 0.100000 |
|
2021-12-31 08:39:53,843 epoch 1 - iter 1800/1807 - loss 0.41459922 - samples/sec: 50.49 - lr: 0.100000 |
|
2021-12-31 08:39:54,850 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 08:39:54,851 EPOCH 1 done: loss 0.4139 - lr 0.1000000 |
|
2021-12-31 08:40:38,186 DEV : loss 0.09867297857999802 - f1-score (micro avg) 0.9723 |
|
2021-12-31 08:40:38,373 BAD EPOCHS (no improvement): 0 |
|
2021-12-31 08:40:38,375 saving best model |
|
2021-12-31 08:40:43,945 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 08:40:59,809 epoch 2 - iter 180/1807 - loss 0.20282785 - samples/sec: 90.92 - lr: 0.100000 |
|
2021-12-31 08:41:15,798 epoch 2 - iter 360/1807 - loss 0.20600484 - samples/sec: 90.20 - lr: 0.100000 |
|
2021-12-31 08:41:31,824 epoch 2 - iter 540/1807 - loss 0.20352355 - samples/sec: 89.99 - lr: 0.100000 |
|
2021-12-31 08:41:47,291 epoch 2 - iter 720/1807 - loss 0.19945298 - samples/sec: 93.24 - lr: 0.100000 |
|
2021-12-31 08:42:03,389 epoch 2 - iter 900/1807 - loss 0.19672769 - samples/sec: 89.58 - lr: 0.100000 |
|
2021-12-31 08:42:19,546 epoch 2 - iter 1080/1807 - loss 0.19404584 - samples/sec: 89.25 - lr: 0.100000 |
|
2021-12-31 08:42:35,186 epoch 2 - iter 1260/1807 - loss 0.19211776 - samples/sec: 92.22 - lr: 0.100000 |
|
2021-12-31 08:42:51,014 epoch 2 - iter 1440/1807 - loss 0.19040930 - samples/sec: 91.11 - lr: 0.100000 |
|
2021-12-31 08:43:07,108 epoch 2 - iter 1620/1807 - loss 0.18835936 - samples/sec: 89.60 - lr: 0.100000 |
|
2021-12-31 08:43:22,664 epoch 2 - iter 1800/1807 - loss 0.18684498 - samples/sec: 92.71 - lr: 0.100000 |
|
2021-12-31 08:43:23,166 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 08:43:23,166 EPOCH 2 done: loss 0.1868 - lr 0.1000000 |
|
2021-12-31 08:43:59,411 DEV : loss 0.08219591528177261 - f1-score (micro avg) 0.9761 |
|
2021-12-31 08:43:59,601 BAD EPOCHS (no improvement): 0 |
|
2021-12-31 08:43:59,602 saving best model |
|
2021-12-31 08:44:04,994 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 08:44:21,188 epoch 3 - iter 180/1807 - loss 0.16248988 - samples/sec: 89.06 - lr: 0.100000 |
|
2021-12-31 08:44:37,143 epoch 3 - iter 360/1807 - loss 0.16012805 - samples/sec: 90.38 - lr: 0.100000 |
|
2021-12-31 08:44:53,240 epoch 3 - iter 540/1807 - loss 0.15771573 - samples/sec: 89.59 - lr: 0.100000 |
|
2021-12-31 08:45:08,820 epoch 3 - iter 720/1807 - loss 0.15678918 - samples/sec: 92.57 - lr: 0.100000 |
|
2021-12-31 08:45:24,447 epoch 3 - iter 900/1807 - loss 0.15583330 - samples/sec: 92.28 - lr: 0.100000 |
|
2021-12-31 08:45:40,453 epoch 3 - iter 1080/1807 - loss 0.15551694 - samples/sec: 90.10 - lr: 0.100000 |
|
2021-12-31 08:45:56,421 epoch 3 - iter 1260/1807 - loss 0.15503272 - samples/sec: 90.32 - lr: 0.100000 |
|
2021-12-31 08:46:12,207 epoch 3 - iter 1440/1807 - loss 0.15478837 - samples/sec: 91.35 - lr: 0.100000 |
|
2021-12-31 08:46:28,067 epoch 3 - iter 1620/1807 - loss 0.15437671 - samples/sec: 90.93 - lr: 0.100000 |
|
2021-12-31 08:46:44,096 epoch 3 - iter 1800/1807 - loss 0.15334210 - samples/sec: 89.96 - lr: 0.100000 |
|
2021-12-31 08:46:44,638 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 08:46:44,638 EPOCH 3 done: loss 0.1533 - lr 0.1000000 |
|
2021-12-31 08:47:19,364 DEV : loss 0.07821641117334366 - f1-score (micro avg) 0.9771 |
|
2021-12-31 08:47:19,574 BAD EPOCHS (no improvement): 0 |
|
2021-12-31 08:47:19,576 saving best model |
|
2021-12-31 08:47:25,807 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 08:47:42,295 epoch 4 - iter 180/1807 - loss 0.14078583 - samples/sec: 87.48 - lr: 0.100000 |
|
2021-12-31 08:47:58,394 epoch 4 - iter 360/1807 - loss 0.14084079 - samples/sec: 89.58 - lr: 0.100000 |
|
2021-12-31 08:48:14,377 epoch 4 - iter 540/1807 - loss 0.13969043 - samples/sec: 90.22 - lr: 0.100000 |
|
2021-12-31 08:48:30,411 epoch 4 - iter 720/1807 - loss 0.13901425 - samples/sec: 89.95 - lr: 0.100000 |
|
2021-12-31 08:48:45,985 epoch 4 - iter 900/1807 - loss 0.13965987 - samples/sec: 92.60 - lr: 0.100000 |
|
2021-12-31 08:49:01,706 epoch 4 - iter 1080/1807 - loss 0.13942263 - samples/sec: 91.73 - lr: 0.100000 |
|
2021-12-31 08:49:17,833 epoch 4 - iter 1260/1807 - loss 0.13931213 - samples/sec: 89.42 - lr: 0.100000 |
|
2021-12-31 08:49:33,693 epoch 4 - iter 1440/1807 - loss 0.13835426 - samples/sec: 90.94 - lr: 0.100000 |
|
2021-12-31 08:49:49,444 epoch 4 - iter 1620/1807 - loss 0.13722078 - samples/sec: 91.56 - lr: 0.100000 |
|
2021-12-31 08:50:05,233 epoch 4 - iter 1800/1807 - loss 0.13680325 - samples/sec: 91.33 - lr: 0.100000 |
|
2021-12-31 08:50:05,825 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 08:50:05,826 EPOCH 4 done: loss 0.1368 - lr 0.1000000 |
|
2021-12-31 08:50:40,951 DEV : loss 0.07048774510622025 - f1-score (micro avg) 0.9784 |
|
2021-12-31 08:50:41,121 BAD EPOCHS (no improvement): 0 |
|
2021-12-31 08:50:41,123 saving best model |
|
2021-12-31 08:50:46,985 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 08:51:03,480 epoch 5 - iter 180/1807 - loss 0.12576483 - samples/sec: 87.44 - lr: 0.100000 |
|
2021-12-31 08:51:19,312 epoch 5 - iter 360/1807 - loss 0.12838224 - samples/sec: 91.10 - lr: 0.100000 |
|
2021-12-31 08:51:35,140 epoch 5 - iter 540/1807 - loss 0.13027925 - samples/sec: 91.11 - lr: 0.100000 |
|
2021-12-31 08:51:51,382 epoch 5 - iter 720/1807 - loss 0.13001079 - samples/sec: 88.78 - lr: 0.100000 |
|
2021-12-31 08:52:07,009 epoch 5 - iter 900/1807 - loss 0.12990639 - samples/sec: 92.28 - lr: 0.100000 |
|
2021-12-31 08:52:22,749 epoch 5 - iter 1080/1807 - loss 0.12927608 - samples/sec: 91.63 - lr: 0.100000 |
|
2021-12-31 08:52:38,459 epoch 5 - iter 1260/1807 - loss 0.12839810 - samples/sec: 91.79 - lr: 0.100000 |
|
2021-12-31 08:52:54,183 epoch 5 - iter 1440/1807 - loss 0.12750076 - samples/sec: 91.71 - lr: 0.100000 |
|
2021-12-31 08:53:09,782 epoch 5 - iter 1620/1807 - loss 0.12744081 - samples/sec: 92.45 - lr: 0.100000 |
|
2021-12-31 08:53:26,181 epoch 5 - iter 1800/1807 - loss 0.12697954 - samples/sec: 87.94 - lr: 0.100000 |
|
2021-12-31 08:53:26,718 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 08:53:26,718 EPOCH 5 done: loss 0.1270 - lr 0.1000000 |
|
2021-12-31 08:54:05,303 DEV : loss 0.06857253611087799 - f1-score (micro avg) 0.9795 |
|
2021-12-31 08:54:05,490 BAD EPOCHS (no improvement): 0 |
|
2021-12-31 08:54:05,491 saving best model |
|
2021-12-31 08:54:11,317 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 08:54:27,729 epoch 6 - iter 180/1807 - loss 0.12012197 - samples/sec: 87.88 - lr: 0.100000 |
|
2021-12-31 08:54:43,570 epoch 6 - iter 360/1807 - loss 0.12134345 - samples/sec: 91.04 - lr: 0.100000 |
|
2021-12-31 08:54:59,298 epoch 6 - iter 540/1807 - loss 0.12010472 - samples/sec: 91.70 - lr: 0.100000 |
|
2021-12-31 08:55:14,710 epoch 6 - iter 720/1807 - loss 0.11985671 - samples/sec: 93.58 - lr: 0.100000 |
|
2021-12-31 08:55:30,873 epoch 6 - iter 900/1807 - loss 0.12032070 - samples/sec: 89.22 - lr: 0.100000 |
|
2021-12-31 08:55:46,705 epoch 6 - iter 1080/1807 - loss 0.11976455 - samples/sec: 91.08 - lr: 0.100000 |
|
2021-12-31 08:56:02,915 epoch 6 - iter 1260/1807 - loss 0.11964832 - samples/sec: 88.97 - lr: 0.100000 |
|
2021-12-31 08:56:18,616 epoch 6 - iter 1440/1807 - loss 0.11958148 - samples/sec: 91.86 - lr: 0.100000 |
|
2021-12-31 08:56:34,478 epoch 6 - iter 1620/1807 - loss 0.12003314 - samples/sec: 90.91 - lr: 0.100000 |
|
2021-12-31 08:56:50,548 epoch 6 - iter 1800/1807 - loss 0.11950787 - samples/sec: 89.75 - lr: 0.100000 |
|
2021-12-31 08:56:51,070 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 08:56:51,070 EPOCH 6 done: loss 0.1195 - lr 0.1000000 |
|
2021-12-31 08:57:26,881 DEV : loss 0.06588418781757355 - f1-score (micro avg) 0.9805 |
|
2021-12-31 08:57:27,077 BAD EPOCHS (no improvement): 0 |
|
2021-12-31 08:57:27,079 saving best model |
|
2021-12-31 08:57:32,878 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 08:57:49,222 epoch 7 - iter 180/1807 - loss 0.11622596 - samples/sec: 88.27 - lr: 0.100000 |
|
2021-12-31 08:58:05,154 epoch 7 - iter 360/1807 - loss 0.11182908 - samples/sec: 90.52 - lr: 0.100000 |
|
2021-12-31 08:58:21,316 epoch 7 - iter 540/1807 - loss 0.11325284 - samples/sec: 89.23 - lr: 0.100000 |
|
2021-12-31 08:58:37,501 epoch 7 - iter 720/1807 - loss 0.11356510 - samples/sec: 89.11 - lr: 0.100000 |
|
2021-12-31 08:58:53,437 epoch 7 - iter 900/1807 - loss 0.11375009 - samples/sec: 90.50 - lr: 0.100000 |
|
2021-12-31 08:59:09,683 epoch 7 - iter 1080/1807 - loss 0.11424006 - samples/sec: 88.76 - lr: 0.100000 |
|
2021-12-31 08:59:25,513 epoch 7 - iter 1260/1807 - loss 0.11502991 - samples/sec: 91.10 - lr: 0.100000 |
|
2021-12-31 08:59:41,355 epoch 7 - iter 1440/1807 - loss 0.11465724 - samples/sec: 91.04 - lr: 0.100000 |
|
2021-12-31 08:59:57,048 epoch 7 - iter 1620/1807 - loss 0.11489345 - samples/sec: 91.91 - lr: 0.100000 |
|
2021-12-31 09:00:13,626 epoch 7 - iter 1800/1807 - loss 0.11495780 - samples/sec: 86.99 - lr: 0.100000 |
|
2021-12-31 09:00:14,225 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 09:00:14,225 EPOCH 7 done: loss 0.1149 - lr 0.1000000 |
|
2021-12-31 09:00:50,356 DEV : loss 0.06450950354337692 - f1-score (micro avg) 0.981 |
|
2021-12-31 09:00:50,566 BAD EPOCHS (no improvement): 0 |
|
2021-12-31 09:00:50,572 saving best model |
|
2021-12-31 09:00:56,353 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 09:01:12,703 epoch 8 - iter 180/1807 - loss 0.10372694 - samples/sec: 88.23 - lr: 0.100000 |
|
2021-12-31 09:01:28,785 epoch 8 - iter 360/1807 - loss 0.10507104 - samples/sec: 89.68 - lr: 0.100000 |
|
2021-12-31 09:01:45,134 epoch 8 - iter 540/1807 - loss 0.10666062 - samples/sec: 88.21 - lr: 0.100000 |
|
2021-12-31 09:02:01,507 epoch 8 - iter 720/1807 - loss 0.10750728 - samples/sec: 88.08 - lr: 0.100000 |
|
2021-12-31 09:02:17,626 epoch 8 - iter 900/1807 - loss 0.10760637 - samples/sec: 89.47 - lr: 0.100000 |
|
2021-12-31 09:02:33,374 epoch 8 - iter 1080/1807 - loss 0.10788257 - samples/sec: 91.58 - lr: 0.100000 |
|
2021-12-31 09:02:49,200 epoch 8 - iter 1260/1807 - loss 0.10808589 - samples/sec: 91.12 - lr: 0.100000 |
|
2021-12-31 09:03:05,738 epoch 8 - iter 1440/1807 - loss 0.10815170 - samples/sec: 87.20 - lr: 0.100000 |
|
2021-12-31 09:03:21,442 epoch 8 - iter 1620/1807 - loss 0.10840840 - samples/sec: 91.84 - lr: 0.100000 |
|
2021-12-31 09:03:37,709 epoch 8 - iter 1800/1807 - loss 0.10855634 - samples/sec: 88.66 - lr: 0.100000 |
|
2021-12-31 09:03:38,280 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 09:03:38,280 EPOCH 8 done: loss 0.1086 - lr 0.1000000 |
|
2021-12-31 09:04:17,043 DEV : loss 0.06390747427940369 - f1-score (micro avg) 0.9805 |
|
2021-12-31 09:04:17,194 BAD EPOCHS (no improvement): 1 |
|
2021-12-31 09:04:17,196 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 09:04:33,331 epoch 9 - iter 180/1807 - loss 0.10260778 - samples/sec: 89.39 - lr: 0.100000 |
|
2021-12-31 09:04:49,336 epoch 9 - iter 360/1807 - loss 0.10566575 - samples/sec: 90.11 - lr: 0.100000 |
|
2021-12-31 09:05:05,083 epoch 9 - iter 540/1807 - loss 0.10556216 - samples/sec: 91.59 - lr: 0.100000 |
|
2021-12-31 09:05:21,004 epoch 9 - iter 720/1807 - loss 0.10506801 - samples/sec: 90.58 - lr: 0.100000 |
|
2021-12-31 09:05:37,109 epoch 9 - iter 900/1807 - loss 0.10596338 - samples/sec: 89.54 - lr: 0.100000 |
|
2021-12-31 09:05:52,784 epoch 9 - iter 1080/1807 - loss 0.10577668 - samples/sec: 92.02 - lr: 0.100000 |
|
2021-12-31 09:06:08,937 epoch 9 - iter 1260/1807 - loss 0.10613509 - samples/sec: 89.28 - lr: 0.100000 |
|
2021-12-31 09:06:24,601 epoch 9 - iter 1440/1807 - loss 0.10637150 - samples/sec: 92.06 - lr: 0.100000 |
|
2021-12-31 09:06:40,409 epoch 9 - iter 1620/1807 - loss 0.10629708 - samples/sec: 91.23 - lr: 0.100000 |
|
2021-12-31 09:06:55,972 epoch 9 - iter 1800/1807 - loss 0.10610710 - samples/sec: 92.67 - lr: 0.100000 |
|
2021-12-31 09:06:56,557 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 09:06:56,557 EPOCH 9 done: loss 0.1061 - lr 0.1000000 |
|
2021-12-31 09:07:32,784 DEV : loss 0.06607701629400253 - f1-score (micro avg) 0.9814 |
|
2021-12-31 09:07:32,970 BAD EPOCHS (no improvement): 0 |
|
2021-12-31 09:07:32,972 saving best model |
|
2021-12-31 09:07:38,755 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 09:07:55,004 epoch 10 - iter 180/1807 - loss 0.10366226 - samples/sec: 88.76 - lr: 0.100000 |
|
2021-12-31 09:08:11,104 epoch 10 - iter 360/1807 - loss 0.10828055 - samples/sec: 89.58 - lr: 0.100000 |
|
2021-12-31 09:08:26,748 epoch 10 - iter 540/1807 - loss 0.10589800 - samples/sec: 92.20 - lr: 0.100000 |
|
2021-12-31 09:08:42,772 epoch 10 - iter 720/1807 - loss 0.10467961 - samples/sec: 90.00 - lr: 0.100000 |
|
2021-12-31 09:08:58,992 epoch 10 - iter 900/1807 - loss 0.10355149 - samples/sec: 88.91 - lr: 0.100000 |
|
2021-12-31 09:09:14,753 epoch 10 - iter 1080/1807 - loss 0.10313717 - samples/sec: 91.50 - lr: 0.100000 |
|
2021-12-31 09:09:30,631 epoch 10 - iter 1260/1807 - loss 0.10353533 - samples/sec: 90.84 - lr: 0.100000 |
|
2021-12-31 09:09:46,654 epoch 10 - iter 1440/1807 - loss 0.10386166 - samples/sec: 90.02 - lr: 0.100000 |
|
2021-12-31 09:10:02,791 epoch 10 - iter 1620/1807 - loss 0.10346798 - samples/sec: 89.36 - lr: 0.100000 |
|
2021-12-31 09:10:18,970 epoch 10 - iter 1800/1807 - loss 0.10358051 - samples/sec: 89.14 - lr: 0.100000 |
|
2021-12-31 09:10:19,492 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 09:10:19,492 EPOCH 10 done: loss 0.1036 - lr 0.1000000 |
|
2021-12-31 09:10:55,557 DEV : loss 0.06536506861448288 - f1-score (micro avg) 0.9811 |
|
2021-12-31 09:10:55,753 BAD EPOCHS (no improvement): 1 |
|
2021-12-31 09:10:55,756 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 09:11:12,024 epoch 11 - iter 180/1807 - loss 0.10182872 - samples/sec: 88.66 - lr: 0.100000 |
|
2021-12-31 09:11:28,246 epoch 11 - iter 360/1807 - loss 0.10175535 - samples/sec: 88.90 - lr: 0.100000 |
|
2021-12-31 09:11:43,844 epoch 11 - iter 540/1807 - loss 0.10107946 - samples/sec: 92.46 - lr: 0.100000 |
|
2021-12-31 09:11:59,559 epoch 11 - iter 720/1807 - loss 0.10053922 - samples/sec: 91.77 - lr: 0.100000 |
|
2021-12-31 09:12:15,490 epoch 11 - iter 900/1807 - loss 0.10047028 - samples/sec: 90.54 - lr: 0.100000 |
|
2021-12-31 09:12:31,195 epoch 11 - iter 1080/1807 - loss 0.09993958 - samples/sec: 91.82 - lr: 0.100000 |
|
2021-12-31 09:12:47,013 epoch 11 - iter 1260/1807 - loss 0.09996914 - samples/sec: 91.17 - lr: 0.100000 |
|
2021-12-31 09:13:03,156 epoch 11 - iter 1440/1807 - loss 0.09980985 - samples/sec: 89.35 - lr: 0.100000 |
|
2021-12-31 09:13:18,852 epoch 11 - iter 1620/1807 - loss 0.09941318 - samples/sec: 91.88 - lr: 0.100000 |
|
2021-12-31 09:13:35,014 epoch 11 - iter 1800/1807 - loss 0.09934768 - samples/sec: 89.23 - lr: 0.100000 |
|
2021-12-31 09:13:35,650 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 09:13:35,650 EPOCH 11 done: loss 0.0993 - lr 0.1000000 |
|
2021-12-31 09:14:14,419 DEV : loss 0.06659943610429764 - f1-score (micro avg) 0.9811 |
|
2021-12-31 09:14:14,622 BAD EPOCHS (no improvement): 2 |
|
2021-12-31 09:14:14,623 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 09:14:30,892 epoch 12 - iter 180/1807 - loss 0.09334718 - samples/sec: 88.66 - lr: 0.100000 |
|
2021-12-31 09:14:46,737 epoch 12 - iter 360/1807 - loss 0.09477923 - samples/sec: 91.02 - lr: 0.100000 |
|
2021-12-31 09:15:02,926 epoch 12 - iter 540/1807 - loss 0.09677398 - samples/sec: 89.09 - lr: 0.100000 |
|
2021-12-31 09:15:19,177 epoch 12 - iter 720/1807 - loss 0.09825518 - samples/sec: 88.74 - lr: 0.100000 |
|
2021-12-31 09:15:34,958 epoch 12 - iter 900/1807 - loss 0.09910665 - samples/sec: 91.38 - lr: 0.100000 |
|
2021-12-31 09:15:51,056 epoch 12 - iter 1080/1807 - loss 0.09820501 - samples/sec: 89.59 - lr: 0.100000 |
|
2021-12-31 09:16:07,231 epoch 12 - iter 1260/1807 - loss 0.09858638 - samples/sec: 89.16 - lr: 0.100000 |
|
2021-12-31 09:16:22,988 epoch 12 - iter 1440/1807 - loss 0.09845736 - samples/sec: 91.52 - lr: 0.100000 |
|
2021-12-31 09:16:38,631 epoch 12 - iter 1620/1807 - loss 0.09859390 - samples/sec: 92.21 - lr: 0.100000 |
|
2021-12-31 09:16:54,209 epoch 12 - iter 1800/1807 - loss 0.09847298 - samples/sec: 92.58 - lr: 0.100000 |
|
2021-12-31 09:16:54,729 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 09:16:54,730 EPOCH 12 done: loss 0.0984 - lr 0.1000000 |
|
2021-12-31 09:17:31,308 DEV : loss 0.06410104781389236 - f1-score (micro avg) 0.9816 |
|
2021-12-31 09:17:31,487 BAD EPOCHS (no improvement): 0 |
|
2021-12-31 09:17:31,489 saving best model |
|
2021-12-31 09:17:37,260 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 09:17:54,060 epoch 13 - iter 180/1807 - loss 0.10013605 - samples/sec: 85.86 - lr: 0.100000 |
|
2021-12-31 09:18:09,827 epoch 13 - iter 360/1807 - loss 0.09881566 - samples/sec: 91.47 - lr: 0.100000 |
|
2021-12-31 09:18:25,218 epoch 13 - iter 540/1807 - loss 0.09860664 - samples/sec: 93.71 - lr: 0.100000 |
|
2021-12-31 09:18:41,246 epoch 13 - iter 720/1807 - loss 0.09768065 - samples/sec: 89.97 - lr: 0.100000 |
|
2021-12-31 09:18:57,306 epoch 13 - iter 900/1807 - loss 0.09766501 - samples/sec: 89.79 - lr: 0.100000 |
|
2021-12-31 09:19:12,914 epoch 13 - iter 1080/1807 - loss 0.09767968 - samples/sec: 92.41 - lr: 0.100000 |
|
2021-12-31 09:19:29,144 epoch 13 - iter 1260/1807 - loss 0.09667902 - samples/sec: 88.86 - lr: 0.100000 |
|
2021-12-31 09:19:45,573 epoch 13 - iter 1440/1807 - loss 0.09670686 - samples/sec: 87.78 - lr: 0.100000 |
|
2021-12-31 09:20:01,566 epoch 13 - iter 1620/1807 - loss 0.09672936 - samples/sec: 90.18 - lr: 0.100000 |
|
2021-12-31 09:20:17,572 epoch 13 - iter 1800/1807 - loss 0.09666135 - samples/sec: 90.10 - lr: 0.100000 |
|
2021-12-31 09:20:18,200 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 09:20:18,200 EPOCH 13 done: loss 0.0967 - lr 0.1000000 |
|
2021-12-31 09:20:54,147 DEV : loss 0.06427688896656036 - f1-score (micro avg) 0.9816 |
|
2021-12-31 09:20:54,334 BAD EPOCHS (no improvement): 1 |
|
2021-12-31 09:20:54,335 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 09:21:10,174 epoch 14 - iter 180/1807 - loss 0.09391481 - samples/sec: 91.06 - lr: 0.100000 |
|
2021-12-31 09:21:26,400 epoch 14 - iter 360/1807 - loss 0.09267418 - samples/sec: 88.88 - lr: 0.100000 |
|
2021-12-31 09:21:42,313 epoch 14 - iter 540/1807 - loss 0.09273735 - samples/sec: 90.64 - lr: 0.100000 |
|
2021-12-31 09:21:58,477 epoch 14 - iter 720/1807 - loss 0.09237732 - samples/sec: 89.22 - lr: 0.100000 |
|
2021-12-31 09:22:14,088 epoch 14 - iter 900/1807 - loss 0.09290387 - samples/sec: 92.38 - lr: 0.100000 |
|
2021-12-31 09:22:29,793 epoch 14 - iter 1080/1807 - loss 0.09305725 - samples/sec: 91.82 - lr: 0.100000 |
|
2021-12-31 09:22:45,455 epoch 14 - iter 1260/1807 - loss 0.09321173 - samples/sec: 92.09 - lr: 0.100000 |
|
2021-12-31 09:23:01,412 epoch 14 - iter 1440/1807 - loss 0.09321459 - samples/sec: 90.38 - lr: 0.100000 |
|
2021-12-31 09:23:17,629 epoch 14 - iter 1620/1807 - loss 0.09332877 - samples/sec: 88.93 - lr: 0.100000 |
|
2021-12-31 09:23:33,527 epoch 14 - iter 1800/1807 - loss 0.09313892 - samples/sec: 90.71 - lr: 0.100000 |
|
2021-12-31 09:23:34,165 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 09:23:34,165 EPOCH 14 done: loss 0.0931 - lr 0.1000000 |
|
2021-12-31 09:24:12,840 DEV : loss 0.06639766693115234 - f1-score (micro avg) 0.9817 |
|
2021-12-31 09:24:13,034 BAD EPOCHS (no improvement): 0 |
|
2021-12-31 09:24:13,036 saving best model |
|
2021-12-31 09:24:18,822 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 09:24:34,568 epoch 15 - iter 180/1807 - loss 0.09134784 - samples/sec: 91.60 - lr: 0.100000 |
|
2021-12-31 09:24:50,712 epoch 15 - iter 360/1807 - loss 0.09119751 - samples/sec: 89.33 - lr: 0.100000 |
|
2021-12-31 09:25:07,155 epoch 15 - iter 540/1807 - loss 0.08993505 - samples/sec: 87.70 - lr: 0.100000 |
|
2021-12-31 09:25:23,092 epoch 15 - iter 720/1807 - loss 0.09062331 - samples/sec: 90.50 - lr: 0.100000 |
|
2021-12-31 09:25:39,643 epoch 15 - iter 900/1807 - loss 0.09054947 - samples/sec: 87.13 - lr: 0.100000 |
|
2021-12-31 09:25:56,080 epoch 15 - iter 1080/1807 - loss 0.09120586 - samples/sec: 87.73 - lr: 0.100000 |
|
2021-12-31 09:26:12,023 epoch 15 - iter 1260/1807 - loss 0.09202164 - samples/sec: 90.49 - lr: 0.100000 |
|
2021-12-31 09:26:27,452 epoch 15 - iter 1440/1807 - loss 0.09257595 - samples/sec: 93.48 - lr: 0.100000 |
|
2021-12-31 09:26:43,293 epoch 15 - iter 1620/1807 - loss 0.09296868 - samples/sec: 91.04 - lr: 0.100000 |
|
2021-12-31 09:26:59,412 epoch 15 - iter 1800/1807 - loss 0.09272942 - samples/sec: 89.47 - lr: 0.100000 |
|
2021-12-31 09:26:59,991 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 09:26:59,991 EPOCH 15 done: loss 0.0927 - lr 0.1000000 |
|
2021-12-31 09:27:36,227 DEV : loss 0.06283392012119293 - f1-score (micro avg) 0.982 |
|
2021-12-31 09:27:36,433 BAD EPOCHS (no improvement): 0 |
|
2021-12-31 09:27:36,435 saving best model |
|
2021-12-31 09:27:42,216 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 09:27:58,274 epoch 16 - iter 180/1807 - loss 0.08868552 - samples/sec: 89.83 - lr: 0.100000 |
|
2021-12-31 09:28:14,083 epoch 16 - iter 360/1807 - loss 0.08898795 - samples/sec: 91.23 - lr: 0.100000 |
|
2021-12-31 09:28:30,428 epoch 16 - iter 540/1807 - loss 0.08723848 - samples/sec: 88.23 - lr: 0.100000 |
|
2021-12-31 09:28:46,065 epoch 16 - iter 720/1807 - loss 0.08840922 - samples/sec: 92.21 - lr: 0.100000 |
|
2021-12-31 09:29:01,697 epoch 16 - iter 900/1807 - loss 0.08907246 - samples/sec: 92.26 - lr: 0.100000 |
|
2021-12-31 09:29:17,387 epoch 16 - iter 1080/1807 - loss 0.09016391 - samples/sec: 91.91 - lr: 0.100000 |
|
2021-12-31 09:29:33,637 epoch 16 - iter 1260/1807 - loss 0.09090909 - samples/sec: 88.74 - lr: 0.100000 |
|
2021-12-31 09:29:49,596 epoch 16 - iter 1440/1807 - loss 0.09079363 - samples/sec: 90.36 - lr: 0.100000 |
|
2021-12-31 09:30:05,085 epoch 16 - iter 1620/1807 - loss 0.09144623 - samples/sec: 93.12 - lr: 0.100000 |
|
2021-12-31 09:30:21,000 epoch 16 - iter 1800/1807 - loss 0.09062250 - samples/sec: 90.62 - lr: 0.100000 |
|
2021-12-31 09:30:21,608 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 09:30:21,608 EPOCH 16 done: loss 0.0906 - lr 0.1000000 |
|
2021-12-31 09:30:58,333 DEV : loss 0.06354553997516632 - f1-score (micro avg) 0.982 |
|
2021-12-31 09:30:58,512 BAD EPOCHS (no improvement): 1 |
|
2021-12-31 09:30:58,514 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 09:31:14,847 epoch 17 - iter 180/1807 - loss 0.08390522 - samples/sec: 88.30 - lr: 0.100000 |
|
2021-12-31 09:31:30,522 epoch 17 - iter 360/1807 - loss 0.08649584 - samples/sec: 92.01 - lr: 0.100000 |
|
2021-12-31 09:31:46,288 epoch 17 - iter 540/1807 - loss 0.08940335 - samples/sec: 91.48 - lr: 0.100000 |
|
2021-12-31 09:32:02,118 epoch 17 - iter 720/1807 - loss 0.09059873 - samples/sec: 91.09 - lr: 0.100000 |
|
2021-12-31 09:32:17,806 epoch 17 - iter 900/1807 - loss 0.09026440 - samples/sec: 91.93 - lr: 0.100000 |
|
2021-12-31 09:32:33,488 epoch 17 - iter 1080/1807 - loss 0.09038711 - samples/sec: 91.96 - lr: 0.100000 |
|
2021-12-31 09:32:49,442 epoch 17 - iter 1260/1807 - loss 0.08978670 - samples/sec: 90.39 - lr: 0.100000 |
|
2021-12-31 09:33:05,170 epoch 17 - iter 1440/1807 - loss 0.08929018 - samples/sec: 91.69 - lr: 0.100000 |
|
2021-12-31 09:33:21,122 epoch 17 - iter 1620/1807 - loss 0.08920206 - samples/sec: 90.40 - lr: 0.100000 |
|
2021-12-31 09:33:36,598 epoch 17 - iter 1800/1807 - loss 0.08958801 - samples/sec: 93.18 - lr: 0.100000 |
|
2021-12-31 09:33:37,149 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 09:33:37,149 EPOCH 17 done: loss 0.0895 - lr 0.1000000 |
|
2021-12-31 09:34:16,446 DEV : loss 0.06361010670661926 - f1-score (micro avg) 0.9823 |
|
2021-12-31 09:34:16,599 BAD EPOCHS (no improvement): 0 |
|
2021-12-31 09:34:16,600 saving best model |
|
2021-12-31 09:34:22,434 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 09:34:38,419 epoch 18 - iter 180/1807 - loss 0.08343062 - samples/sec: 90.22 - lr: 0.100000 |
|
2021-12-31 09:34:54,655 epoch 18 - iter 360/1807 - loss 0.08575852 - samples/sec: 88.82 - lr: 0.100000 |
|
2021-12-31 09:35:10,385 epoch 18 - iter 540/1807 - loss 0.08392644 - samples/sec: 91.68 - lr: 0.100000 |
|
2021-12-31 09:35:26,310 epoch 18 - iter 720/1807 - loss 0.08351999 - samples/sec: 90.57 - lr: 0.100000 |
|
2021-12-31 09:35:41,876 epoch 18 - iter 900/1807 - loss 0.08509375 - samples/sec: 92.64 - lr: 0.100000 |
|
2021-12-31 09:35:57,882 epoch 18 - iter 1080/1807 - loss 0.08493115 - samples/sec: 90.10 - lr: 0.100000 |
|
2021-12-31 09:36:13,926 epoch 18 - iter 1260/1807 - loss 0.08609299 - samples/sec: 89.88 - lr: 0.100000 |
|
2021-12-31 09:36:30,070 epoch 18 - iter 1440/1807 - loss 0.08644835 - samples/sec: 89.34 - lr: 0.100000 |
|
2021-12-31 09:36:45,689 epoch 18 - iter 1620/1807 - loss 0.08698449 - samples/sec: 92.33 - lr: 0.100000 |
|
2021-12-31 09:37:01,595 epoch 18 - iter 1800/1807 - loss 0.08715385 - samples/sec: 90.66 - lr: 0.100000 |
|
2021-12-31 09:37:02,116 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 09:37:02,116 EPOCH 18 done: loss 0.0872 - lr 0.1000000 |
|
2021-12-31 09:37:38,287 DEV : loss 0.06376409530639648 - f1-score (micro avg) 0.982 |
|
2021-12-31 09:37:38,491 BAD EPOCHS (no improvement): 1 |
|
2021-12-31 09:37:38,492 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 09:37:54,464 epoch 19 - iter 180/1807 - loss 0.07802257 - samples/sec: 90.31 - lr: 0.100000 |
|
2021-12-31 09:38:10,256 epoch 19 - iter 360/1807 - loss 0.07892620 - samples/sec: 91.32 - lr: 0.100000 |
|
2021-12-31 09:38:26,632 epoch 19 - iter 540/1807 - loss 0.08133170 - samples/sec: 88.06 - lr: 0.100000 |
|
2021-12-31 09:38:42,673 epoch 19 - iter 720/1807 - loss 0.08367885 - samples/sec: 89.91 - lr: 0.100000 |
|
2021-12-31 09:38:58,503 epoch 19 - iter 900/1807 - loss 0.08447871 - samples/sec: 91.11 - lr: 0.100000 |
|
2021-12-31 09:39:14,461 epoch 19 - iter 1080/1807 - loss 0.08413767 - samples/sec: 90.37 - lr: 0.100000 |
|
2021-12-31 09:39:30,176 epoch 19 - iter 1260/1807 - loss 0.08455665 - samples/sec: 91.77 - lr: 0.100000 |
|
2021-12-31 09:39:46,325 epoch 19 - iter 1440/1807 - loss 0.08578599 - samples/sec: 89.30 - lr: 0.100000 |
|
2021-12-31 09:40:02,191 epoch 19 - iter 1620/1807 - loss 0.08628902 - samples/sec: 90.90 - lr: 0.100000 |
|
2021-12-31 09:40:18,069 epoch 19 - iter 1800/1807 - loss 0.08634962 - samples/sec: 90.82 - lr: 0.100000 |
|
2021-12-31 09:40:18,635 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 09:40:18,636 EPOCH 19 done: loss 0.0863 - lr 0.1000000 |
|
2021-12-31 09:40:54,638 DEV : loss 0.06360483914613724 - f1-score (micro avg) 0.9824 |
|
2021-12-31 09:40:54,809 BAD EPOCHS (no improvement): 0 |
|
2021-12-31 09:40:54,812 saving best model |
|
2021-12-31 09:41:00,532 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 09:41:16,605 epoch 20 - iter 180/1807 - loss 0.08580796 - samples/sec: 89.75 - lr: 0.100000 |
|
2021-12-31 09:41:32,626 epoch 20 - iter 360/1807 - loss 0.08441046 - samples/sec: 90.02 - lr: 0.100000 |
|
2021-12-31 09:41:48,195 epoch 20 - iter 540/1807 - loss 0.08457436 - samples/sec: 92.63 - lr: 0.100000 |
|
2021-12-31 09:42:03,884 epoch 20 - iter 720/1807 - loss 0.08433505 - samples/sec: 91.92 - lr: 0.100000 |
|
2021-12-31 09:42:19,662 epoch 20 - iter 900/1807 - loss 0.08465375 - samples/sec: 91.40 - lr: 0.100000 |
|
2021-12-31 09:42:35,290 epoch 20 - iter 1080/1807 - loss 0.08384813 - samples/sec: 92.28 - lr: 0.100000 |
|
2021-12-31 09:42:50,667 epoch 20 - iter 1260/1807 - loss 0.08437448 - samples/sec: 93.79 - lr: 0.100000 |
|
2021-12-31 09:43:06,838 epoch 20 - iter 1440/1807 - loss 0.08483000 - samples/sec: 89.18 - lr: 0.100000 |
|
2021-12-31 09:43:23,128 epoch 20 - iter 1620/1807 - loss 0.08554680 - samples/sec: 88.52 - lr: 0.100000 |
|
2021-12-31 09:43:38,996 epoch 20 - iter 1800/1807 - loss 0.08579345 - samples/sec: 90.89 - lr: 0.100000 |
|
2021-12-31 09:43:39,520 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 09:43:39,520 EPOCH 20 done: loss 0.0858 - lr 0.1000000 |
|
2021-12-31 09:44:18,433 DEV : loss 0.06494450569152832 - f1-score (micro avg) 0.982 |
|
2021-12-31 09:44:18,588 BAD EPOCHS (no improvement): 1 |
|
2021-12-31 09:44:18,590 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 09:44:34,495 epoch 21 - iter 180/1807 - loss 0.08058450 - samples/sec: 90.65 - lr: 0.100000 |
|
2021-12-31 09:44:50,061 epoch 21 - iter 360/1807 - loss 0.08169987 - samples/sec: 92.62 - lr: 0.100000 |
|
2021-12-31 09:45:05,780 epoch 21 - iter 540/1807 - loss 0.08147401 - samples/sec: 91.76 - lr: 0.100000 |
|
2021-12-31 09:45:21,869 epoch 21 - iter 720/1807 - loss 0.08235327 - samples/sec: 89.64 - lr: 0.100000 |
|
2021-12-31 09:45:38,316 epoch 21 - iter 900/1807 - loss 0.08324710 - samples/sec: 87.67 - lr: 0.100000 |
|
2021-12-31 09:45:54,314 epoch 21 - iter 1080/1807 - loss 0.08294963 - samples/sec: 90.14 - lr: 0.100000 |
|
2021-12-31 09:46:10,369 epoch 21 - iter 1260/1807 - loss 0.08355307 - samples/sec: 89.83 - lr: 0.100000 |
|
2021-12-31 09:46:26,469 epoch 21 - iter 1440/1807 - loss 0.08343050 - samples/sec: 89.57 - lr: 0.100000 |
|
2021-12-31 09:46:42,401 epoch 21 - iter 1620/1807 - loss 0.08414815 - samples/sec: 90.52 - lr: 0.100000 |
|
2021-12-31 09:46:58,257 epoch 21 - iter 1800/1807 - loss 0.08376554 - samples/sec: 90.95 - lr: 0.100000 |
|
2021-12-31 09:46:58,880 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 09:46:58,880 EPOCH 21 done: loss 0.0839 - lr 0.1000000 |
|
2021-12-31 09:47:35,248 DEV : loss 0.06328344345092773 - f1-score (micro avg) 0.9827 |
|
2021-12-31 09:47:35,446 BAD EPOCHS (no improvement): 0 |
|
2021-12-31 09:47:35,448 saving best model |
|
2021-12-31 09:47:41,248 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 09:47:57,255 epoch 22 - iter 180/1807 - loss 0.08050373 - samples/sec: 90.12 - lr: 0.100000 |
|
2021-12-31 09:48:13,186 epoch 22 - iter 360/1807 - loss 0.08239139 - samples/sec: 90.52 - lr: 0.100000 |
|
2021-12-31 09:48:29,067 epoch 22 - iter 540/1807 - loss 0.08228212 - samples/sec: 90.81 - lr: 0.100000 |
|
2021-12-31 09:48:45,039 epoch 22 - iter 720/1807 - loss 0.08279713 - samples/sec: 90.30 - lr: 0.100000 |
|
2021-12-31 09:49:00,510 epoch 22 - iter 900/1807 - loss 0.08334789 - samples/sec: 93.22 - lr: 0.100000 |
|
2021-12-31 09:49:16,362 epoch 22 - iter 1080/1807 - loss 0.08342389 - samples/sec: 90.97 - lr: 0.100000 |
|
2021-12-31 09:49:32,567 epoch 22 - iter 1260/1807 - loss 0.08349166 - samples/sec: 88.99 - lr: 0.100000 |
|
2021-12-31 09:49:48,320 epoch 22 - iter 1440/1807 - loss 0.08427908 - samples/sec: 91.55 - lr: 0.100000 |
|
2021-12-31 09:50:04,570 epoch 22 - iter 1620/1807 - loss 0.08465300 - samples/sec: 88.75 - lr: 0.100000 |
|
2021-12-31 09:50:20,943 epoch 22 - iter 1800/1807 - loss 0.08437528 - samples/sec: 88.07 - lr: 0.100000 |
|
2021-12-31 09:50:21,480 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 09:50:21,480 EPOCH 22 done: loss 0.0844 - lr 0.1000000 |
|
2021-12-31 09:50:58,771 DEV : loss 0.06346500664949417 - f1-score (micro avg) 0.9815 |
|
2021-12-31 09:50:58,967 BAD EPOCHS (no improvement): 1 |
|
2021-12-31 09:50:58,969 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 09:51:15,272 epoch 23 - iter 180/1807 - loss 0.07857499 - samples/sec: 88.47 - lr: 0.100000 |
|
2021-12-31 09:51:31,123 epoch 23 - iter 360/1807 - loss 0.07736816 - samples/sec: 91.00 - lr: 0.100000 |
|
2021-12-31 09:51:47,441 epoch 23 - iter 540/1807 - loss 0.07865886 - samples/sec: 88.38 - lr: 0.100000 |
|
2021-12-31 09:52:03,508 epoch 23 - iter 720/1807 - loss 0.08053686 - samples/sec: 89.75 - lr: 0.100000 |
|
2021-12-31 09:52:19,618 epoch 23 - iter 900/1807 - loss 0.08084826 - samples/sec: 89.52 - lr: 0.100000 |
|
2021-12-31 09:52:35,467 epoch 23 - iter 1080/1807 - loss 0.08116025 - samples/sec: 91.00 - lr: 0.100000 |
|
2021-12-31 09:52:51,307 epoch 23 - iter 1260/1807 - loss 0.08137722 - samples/sec: 91.04 - lr: 0.100000 |
|
2021-12-31 09:53:07,605 epoch 23 - iter 1440/1807 - loss 0.08168418 - samples/sec: 88.48 - lr: 0.100000 |
|
2021-12-31 09:53:23,242 epoch 23 - iter 1620/1807 - loss 0.08161521 - samples/sec: 92.22 - lr: 0.100000 |
|
2021-12-31 09:53:38,917 epoch 23 - iter 1800/1807 - loss 0.08147531 - samples/sec: 92.01 - lr: 0.100000 |
|
2021-12-31 09:53:39,396 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 09:53:39,396 EPOCH 23 done: loss 0.0814 - lr 0.1000000 |
|
2021-12-31 09:54:15,841 DEV : loss 0.06540019810199738 - f1-score (micro avg) 0.9821 |
|
2021-12-31 09:54:16,023 BAD EPOCHS (no improvement): 2 |
|
2021-12-31 09:54:16,025 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 09:54:32,334 epoch 24 - iter 180/1807 - loss 0.07795468 - samples/sec: 88.43 - lr: 0.100000 |
|
2021-12-31 09:54:48,084 epoch 24 - iter 360/1807 - loss 0.07908717 - samples/sec: 91.57 - lr: 0.100000 |
|
2021-12-31 09:55:04,326 epoch 24 - iter 540/1807 - loss 0.08004992 - samples/sec: 88.79 - lr: 0.100000 |
|
2021-12-31 09:55:20,651 epoch 24 - iter 720/1807 - loss 0.08100541 - samples/sec: 88.34 - lr: 0.100000 |
|
2021-12-31 09:55:36,785 epoch 24 - iter 900/1807 - loss 0.08142507 - samples/sec: 89.38 - lr: 0.100000 |
|
2021-12-31 09:55:52,742 epoch 24 - iter 1080/1807 - loss 0.08232817 - samples/sec: 90.38 - lr: 0.100000 |
|
2021-12-31 09:56:08,164 epoch 24 - iter 1260/1807 - loss 0.08188184 - samples/sec: 93.53 - lr: 0.100000 |
|
2021-12-31 09:56:24,063 epoch 24 - iter 1440/1807 - loss 0.08243719 - samples/sec: 90.71 - lr: 0.100000 |
|
2021-12-31 09:56:40,384 epoch 24 - iter 1620/1807 - loss 0.08222346 - samples/sec: 88.35 - lr: 0.100000 |
|
2021-12-31 09:56:56,011 epoch 24 - iter 1800/1807 - loss 0.08229498 - samples/sec: 92.29 - lr: 0.100000 |
|
2021-12-31 09:56:56,616 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 09:56:56,616 EPOCH 24 done: loss 0.0822 - lr 0.1000000 |
|
2021-12-31 09:57:35,721 DEV : loss 0.06453310698270798 - f1-score (micro avg) 0.9819 |
|
2021-12-31 09:57:35,917 BAD EPOCHS (no improvement): 3 |
|
2021-12-31 09:57:35,919 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 09:57:52,048 epoch 25 - iter 180/1807 - loss 0.07765362 - samples/sec: 89.42 - lr: 0.100000 |
|
2021-12-31 09:58:07,956 epoch 25 - iter 360/1807 - loss 0.07932940 - samples/sec: 90.65 - lr: 0.100000 |
|
2021-12-31 09:58:23,863 epoch 25 - iter 540/1807 - loss 0.08046614 - samples/sec: 90.65 - lr: 0.100000 |
|
2021-12-31 09:58:39,725 epoch 25 - iter 720/1807 - loss 0.07941669 - samples/sec: 90.92 - lr: 0.100000 |
|
2021-12-31 09:58:55,303 epoch 25 - iter 900/1807 - loss 0.08092722 - samples/sec: 92.57 - lr: 0.100000 |
|
2021-12-31 09:59:11,794 epoch 25 - iter 1080/1807 - loss 0.08150485 - samples/sec: 87.44 - lr: 0.100000 |
|
2021-12-31 09:59:27,795 epoch 25 - iter 1260/1807 - loss 0.08118184 - samples/sec: 90.13 - lr: 0.100000 |
|
2021-12-31 09:59:43,595 epoch 25 - iter 1440/1807 - loss 0.08068256 - samples/sec: 91.28 - lr: 0.100000 |
|
2021-12-31 09:59:59,146 epoch 25 - iter 1620/1807 - loss 0.08113371 - samples/sec: 92.74 - lr: 0.100000 |
|
2021-12-31 10:00:14,684 epoch 25 - iter 1800/1807 - loss 0.08112289 - samples/sec: 92.81 - lr: 0.100000 |
|
2021-12-31 10:00:15,230 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:00:15,230 EPOCH 25 done: loss 0.0812 - lr 0.1000000 |
|
2021-12-31 10:00:51,681 DEV : loss 0.06579063087701797 - f1-score (micro avg) 0.9817 |
|
2021-12-31 10:00:51,872 BAD EPOCHS (no improvement): 4 |
|
2021-12-31 10:00:51,874 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:01:08,252 epoch 26 - iter 180/1807 - loss 0.07473820 - samples/sec: 88.06 - lr: 0.050000 |
|
2021-12-31 10:01:24,095 epoch 26 - iter 360/1807 - loss 0.07741051 - samples/sec: 91.03 - lr: 0.050000 |
|
2021-12-31 10:01:40,042 epoch 26 - iter 540/1807 - loss 0.07612793 - samples/sec: 90.43 - lr: 0.050000 |
|
2021-12-31 10:01:55,977 epoch 26 - iter 720/1807 - loss 0.07597233 - samples/sec: 90.49 - lr: 0.050000 |
|
2021-12-31 10:02:12,264 epoch 26 - iter 900/1807 - loss 0.07560347 - samples/sec: 88.55 - lr: 0.050000 |
|
2021-12-31 10:02:28,030 epoch 26 - iter 1080/1807 - loss 0.07626889 - samples/sec: 91.47 - lr: 0.050000 |
|
2021-12-31 10:02:43,691 epoch 26 - iter 1260/1807 - loss 0.07613186 - samples/sec: 92.08 - lr: 0.050000 |
|
2021-12-31 10:02:59,223 epoch 26 - iter 1440/1807 - loss 0.07558384 - samples/sec: 92.85 - lr: 0.050000 |
|
2021-12-31 10:03:15,259 epoch 26 - iter 1620/1807 - loss 0.07503334 - samples/sec: 89.93 - lr: 0.050000 |
|
2021-12-31 10:03:31,614 epoch 26 - iter 1800/1807 - loss 0.07448614 - samples/sec: 88.18 - lr: 0.050000 |
|
2021-12-31 10:03:32,151 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:03:32,151 EPOCH 26 done: loss 0.0744 - lr 0.0500000 |
|
2021-12-31 10:04:08,767 DEV : loss 0.06646668165922165 - f1-score (micro avg) 0.9822 |
|
2021-12-31 10:04:08,949 BAD EPOCHS (no improvement): 1 |
|
2021-12-31 10:04:08,950 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:04:25,529 epoch 27 - iter 180/1807 - loss 0.06581114 - samples/sec: 86.99 - lr: 0.050000 |
|
2021-12-31 10:04:41,436 epoch 27 - iter 360/1807 - loss 0.06857834 - samples/sec: 90.66 - lr: 0.050000 |
|
2021-12-31 10:04:57,191 epoch 27 - iter 540/1807 - loss 0.07081005 - samples/sec: 91.54 - lr: 0.050000 |
|
2021-12-31 10:05:13,183 epoch 27 - iter 720/1807 - loss 0.07198836 - samples/sec: 90.18 - lr: 0.050000 |
|
2021-12-31 10:05:29,131 epoch 27 - iter 900/1807 - loss 0.07153264 - samples/sec: 90.42 - lr: 0.050000 |
|
2021-12-31 10:05:44,864 epoch 27 - iter 1080/1807 - loss 0.07164274 - samples/sec: 91.66 - lr: 0.050000 |
|
2021-12-31 10:06:00,643 epoch 27 - iter 1260/1807 - loss 0.07167991 - samples/sec: 91.40 - lr: 0.050000 |
|
2021-12-31 10:06:15,929 epoch 27 - iter 1440/1807 - loss 0.07130117 - samples/sec: 94.34 - lr: 0.050000 |
|
2021-12-31 10:06:32,208 epoch 27 - iter 1620/1807 - loss 0.07137995 - samples/sec: 88.59 - lr: 0.050000 |
|
2021-12-31 10:06:48,072 epoch 27 - iter 1800/1807 - loss 0.07123898 - samples/sec: 90.90 - lr: 0.050000 |
|
2021-12-31 10:06:48,616 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:06:48,616 EPOCH 27 done: loss 0.0712 - lr 0.0500000 |
|
2021-12-31 10:07:27,769 DEV : loss 0.06514652073383331 - f1-score (micro avg) 0.9823 |
|
2021-12-31 10:07:27,967 BAD EPOCHS (no improvement): 2 |
|
2021-12-31 10:07:27,968 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:07:43,921 epoch 28 - iter 180/1807 - loss 0.06865415 - samples/sec: 90.41 - lr: 0.050000 |
|
2021-12-31 10:08:00,073 epoch 28 - iter 360/1807 - loss 0.06855531 - samples/sec: 89.28 - lr: 0.050000 |
|
2021-12-31 10:08:16,259 epoch 28 - iter 540/1807 - loss 0.06891820 - samples/sec: 89.09 - lr: 0.050000 |
|
2021-12-31 10:08:31,981 epoch 28 - iter 720/1807 - loss 0.06951336 - samples/sec: 91.73 - lr: 0.050000 |
|
2021-12-31 10:08:47,429 epoch 28 - iter 900/1807 - loss 0.07014278 - samples/sec: 93.35 - lr: 0.050000 |
|
2021-12-31 10:09:03,024 epoch 28 - iter 1080/1807 - loss 0.07071541 - samples/sec: 92.47 - lr: 0.050000 |
|
2021-12-31 10:09:18,974 epoch 28 - iter 1260/1807 - loss 0.07012373 - samples/sec: 90.41 - lr: 0.050000 |
|
2021-12-31 10:09:34,620 epoch 28 - iter 1440/1807 - loss 0.07028479 - samples/sec: 92.17 - lr: 0.050000 |
|
2021-12-31 10:09:50,427 epoch 28 - iter 1620/1807 - loss 0.07017402 - samples/sec: 91.23 - lr: 0.050000 |
|
2021-12-31 10:10:05,997 epoch 28 - iter 1800/1807 - loss 0.07002142 - samples/sec: 92.62 - lr: 0.050000 |
|
2021-12-31 10:10:06,547 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:10:06,548 EPOCH 28 done: loss 0.0701 - lr 0.0500000 |
|
2021-12-31 10:10:43,342 DEV : loss 0.06285692006349564 - f1-score (micro avg) 0.9828 |
|
2021-12-31 10:10:43,549 BAD EPOCHS (no improvement): 0 |
|
2021-12-31 10:10:43,550 saving best model |
|
2021-12-31 10:10:49,346 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:11:05,893 epoch 29 - iter 180/1807 - loss 0.06749112 - samples/sec: 87.17 - lr: 0.050000 |
|
2021-12-31 10:11:21,660 epoch 29 - iter 360/1807 - loss 0.06704871 - samples/sec: 91.46 - lr: 0.050000 |
|
2021-12-31 10:11:37,404 epoch 29 - iter 540/1807 - loss 0.06846136 - samples/sec: 91.60 - lr: 0.050000 |
|
2021-12-31 10:11:53,397 epoch 29 - iter 720/1807 - loss 0.06901632 - samples/sec: 90.17 - lr: 0.050000 |
|
2021-12-31 10:12:09,257 epoch 29 - iter 900/1807 - loss 0.06809349 - samples/sec: 90.93 - lr: 0.050000 |
|
2021-12-31 10:12:24,599 epoch 29 - iter 1080/1807 - loss 0.06824897 - samples/sec: 94.00 - lr: 0.050000 |
|
2021-12-31 10:12:40,447 epoch 29 - iter 1260/1807 - loss 0.06782382 - samples/sec: 91.00 - lr: 0.050000 |
|
2021-12-31 10:12:56,595 epoch 29 - iter 1440/1807 - loss 0.06808796 - samples/sec: 89.30 - lr: 0.050000 |
|
2021-12-31 10:13:12,755 epoch 29 - iter 1620/1807 - loss 0.06798634 - samples/sec: 89.24 - lr: 0.050000 |
|
2021-12-31 10:13:28,701 epoch 29 - iter 1800/1807 - loss 0.06777472 - samples/sec: 90.44 - lr: 0.050000 |
|
2021-12-31 10:13:29,227 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:13:29,228 EPOCH 29 done: loss 0.0678 - lr 0.0500000 |
|
2021-12-31 10:14:05,041 DEV : loss 0.06288447976112366 - f1-score (micro avg) 0.9831 |
|
2021-12-31 10:14:05,221 BAD EPOCHS (no improvement): 0 |
|
2021-12-31 10:14:05,222 saving best model |
|
2021-12-31 10:14:10,675 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:14:26,845 epoch 30 - iter 180/1807 - loss 0.06615046 - samples/sec: 89.20 - lr: 0.050000 |
|
2021-12-31 10:14:42,781 epoch 30 - iter 360/1807 - loss 0.06701908 - samples/sec: 90.50 - lr: 0.050000 |
|
2021-12-31 10:14:58,746 epoch 30 - iter 540/1807 - loss 0.06748578 - samples/sec: 90.33 - lr: 0.050000 |
|
2021-12-31 10:15:14,479 epoch 30 - iter 720/1807 - loss 0.06796474 - samples/sec: 91.66 - lr: 0.050000 |
|
2021-12-31 10:15:30,280 epoch 30 - iter 900/1807 - loss 0.06739311 - samples/sec: 91.26 - lr: 0.050000 |
|
2021-12-31 10:15:45,933 epoch 30 - iter 1080/1807 - loss 0.06699810 - samples/sec: 92.13 - lr: 0.050000 |
|
2021-12-31 10:16:01,690 epoch 30 - iter 1260/1807 - loss 0.06745951 - samples/sec: 91.53 - lr: 0.050000 |
|
2021-12-31 10:16:17,453 epoch 30 - iter 1440/1807 - loss 0.06704309 - samples/sec: 91.49 - lr: 0.050000 |
|
2021-12-31 10:16:33,233 epoch 30 - iter 1620/1807 - loss 0.06649743 - samples/sec: 91.38 - lr: 0.050000 |
|
2021-12-31 10:16:49,143 epoch 30 - iter 1800/1807 - loss 0.06655280 - samples/sec: 90.65 - lr: 0.050000 |
|
2021-12-31 10:16:49,685 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:16:49,685 EPOCH 30 done: loss 0.0666 - lr 0.0500000 |
|
2021-12-31 10:17:28,240 DEV : loss 0.06311798095703125 - f1-score (micro avg) 0.9824 |
|
2021-12-31 10:17:28,433 BAD EPOCHS (no improvement): 1 |
|
2021-12-31 10:17:28,434 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:17:44,966 epoch 31 - iter 180/1807 - loss 0.06627745 - samples/sec: 87.24 - lr: 0.050000 |
|
2021-12-31 10:18:00,662 epoch 31 - iter 360/1807 - loss 0.06286711 - samples/sec: 91.88 - lr: 0.050000 |
|
2021-12-31 10:18:16,307 epoch 31 - iter 540/1807 - loss 0.06454841 - samples/sec: 92.17 - lr: 0.050000 |
|
2021-12-31 10:18:32,243 epoch 31 - iter 720/1807 - loss 0.06465161 - samples/sec: 90.50 - lr: 0.050000 |
|
2021-12-31 10:18:47,799 epoch 31 - iter 900/1807 - loss 0.06488043 - samples/sec: 92.70 - lr: 0.050000 |
|
2021-12-31 10:19:03,602 epoch 31 - iter 1080/1807 - loss 0.06501278 - samples/sec: 91.26 - lr: 0.050000 |
|
2021-12-31 10:19:19,610 epoch 31 - iter 1260/1807 - loss 0.06524649 - samples/sec: 90.08 - lr: 0.050000 |
|
2021-12-31 10:19:35,038 epoch 31 - iter 1440/1807 - loss 0.06554492 - samples/sec: 93.48 - lr: 0.050000 |
|
2021-12-31 10:19:51,164 epoch 31 - iter 1620/1807 - loss 0.06599922 - samples/sec: 89.43 - lr: 0.050000 |
|
2021-12-31 10:20:07,078 epoch 31 - iter 1800/1807 - loss 0.06644678 - samples/sec: 90.61 - lr: 0.050000 |
|
2021-12-31 10:20:07,640 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:20:07,640 EPOCH 31 done: loss 0.0666 - lr 0.0500000 |
|
2021-12-31 10:20:43,927 DEV : loss 0.06285466253757477 - f1-score (micro avg) 0.9829 |
|
2021-12-31 10:20:44,123 BAD EPOCHS (no improvement): 2 |
|
2021-12-31 10:20:44,125 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:21:00,298 epoch 32 - iter 180/1807 - loss 0.06077116 - samples/sec: 89.18 - lr: 0.050000 |
|
2021-12-31 10:21:16,393 epoch 32 - iter 360/1807 - loss 0.06270324 - samples/sec: 89.60 - lr: 0.050000 |
|
2021-12-31 10:21:32,158 epoch 32 - iter 540/1807 - loss 0.06340224 - samples/sec: 91.47 - lr: 0.050000 |
|
2021-12-31 10:21:48,183 epoch 32 - iter 720/1807 - loss 0.06267842 - samples/sec: 89.99 - lr: 0.050000 |
|
2021-12-31 10:22:03,949 epoch 32 - iter 900/1807 - loss 0.06345792 - samples/sec: 91.50 - lr: 0.050000 |
|
2021-12-31 10:22:19,674 epoch 32 - iter 1080/1807 - loss 0.06439376 - samples/sec: 91.71 - lr: 0.050000 |
|
2021-12-31 10:22:35,414 epoch 32 - iter 1260/1807 - loss 0.06437464 - samples/sec: 91.63 - lr: 0.050000 |
|
2021-12-31 10:22:51,702 epoch 32 - iter 1440/1807 - loss 0.06435182 - samples/sec: 88.53 - lr: 0.050000 |
|
2021-12-31 10:23:07,918 epoch 32 - iter 1620/1807 - loss 0.06467809 - samples/sec: 88.93 - lr: 0.050000 |
|
2021-12-31 10:23:23,880 epoch 32 - iter 1800/1807 - loss 0.06484923 - samples/sec: 90.35 - lr: 0.050000 |
|
2021-12-31 10:23:24,513 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:23:24,513 EPOCH 32 done: loss 0.0648 - lr 0.0500000 |
|
2021-12-31 10:24:00,678 DEV : loss 0.062373436987400055 - f1-score (micro avg) 0.9827 |
|
2021-12-31 10:24:00,863 BAD EPOCHS (no improvement): 3 |
|
2021-12-31 10:24:00,865 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:24:17,368 epoch 33 - iter 180/1807 - loss 0.06511517 - samples/sec: 87.39 - lr: 0.050000 |
|
2021-12-31 10:24:33,869 epoch 33 - iter 360/1807 - loss 0.06359714 - samples/sec: 87.39 - lr: 0.050000 |
|
2021-12-31 10:24:49,974 epoch 33 - iter 540/1807 - loss 0.06324776 - samples/sec: 89.54 - lr: 0.050000 |
|
2021-12-31 10:25:05,411 epoch 33 - iter 720/1807 - loss 0.06296883 - samples/sec: 93.42 - lr: 0.050000 |
|
2021-12-31 10:25:21,477 epoch 33 - iter 900/1807 - loss 0.06304943 - samples/sec: 89.76 - lr: 0.050000 |
|
2021-12-31 10:25:37,062 epoch 33 - iter 1080/1807 - loss 0.06266940 - samples/sec: 92.52 - lr: 0.050000 |
|
2021-12-31 10:25:52,743 epoch 33 - iter 1260/1807 - loss 0.06359599 - samples/sec: 91.97 - lr: 0.050000 |
|
2021-12-31 10:26:08,521 epoch 33 - iter 1440/1807 - loss 0.06353058 - samples/sec: 91.40 - lr: 0.050000 |
|
2021-12-31 10:26:24,080 epoch 33 - iter 1620/1807 - loss 0.06366170 - samples/sec: 92.69 - lr: 0.050000 |
|
2021-12-31 10:26:39,568 epoch 33 - iter 1800/1807 - loss 0.06405823 - samples/sec: 93.11 - lr: 0.050000 |
|
2021-12-31 10:26:40,121 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:26:40,121 EPOCH 33 done: loss 0.0640 - lr 0.0500000 |
|
2021-12-31 10:27:18,678 DEV : loss 0.06352584064006805 - f1-score (micro avg) 0.983 |
|
2021-12-31 10:27:18,875 BAD EPOCHS (no improvement): 4 |
|
2021-12-31 10:27:18,877 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:27:34,632 epoch 34 - iter 180/1807 - loss 0.05738992 - samples/sec: 91.55 - lr: 0.025000 |
|
2021-12-31 10:27:50,783 epoch 34 - iter 360/1807 - loss 0.05964139 - samples/sec: 89.29 - lr: 0.025000 |
|
2021-12-31 10:28:06,956 epoch 34 - iter 540/1807 - loss 0.05950577 - samples/sec: 89.16 - lr: 0.025000 |
|
2021-12-31 10:28:23,264 epoch 34 - iter 720/1807 - loss 0.06033373 - samples/sec: 88.43 - lr: 0.025000 |
|
2021-12-31 10:28:38,762 epoch 34 - iter 900/1807 - loss 0.06053852 - samples/sec: 93.06 - lr: 0.025000 |
|
2021-12-31 10:28:54,790 epoch 34 - iter 1080/1807 - loss 0.06008683 - samples/sec: 89.97 - lr: 0.025000 |
|
2021-12-31 10:29:10,752 epoch 34 - iter 1260/1807 - loss 0.06017032 - samples/sec: 90.34 - lr: 0.025000 |
|
2021-12-31 10:29:26,533 epoch 34 - iter 1440/1807 - loss 0.06026720 - samples/sec: 91.39 - lr: 0.025000 |
|
2021-12-31 10:29:41,962 epoch 34 - iter 1620/1807 - loss 0.06023939 - samples/sec: 93.47 - lr: 0.025000 |
|
2021-12-31 10:29:57,974 epoch 34 - iter 1800/1807 - loss 0.06024915 - samples/sec: 90.06 - lr: 0.025000 |
|
2021-12-31 10:29:58,641 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:29:58,642 EPOCH 34 done: loss 0.0602 - lr 0.0250000 |
|
2021-12-31 10:30:34,901 DEV : loss 0.06348917633295059 - f1-score (micro avg) 0.9835 |
|
2021-12-31 10:30:35,087 BAD EPOCHS (no improvement): 0 |
|
2021-12-31 10:30:35,089 saving best model |
|
2021-12-31 10:30:40,883 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:30:57,202 epoch 35 - iter 180/1807 - loss 0.05878333 - samples/sec: 88.38 - lr: 0.025000 |
|
2021-12-31 10:31:12,996 epoch 35 - iter 360/1807 - loss 0.05795906 - samples/sec: 91.32 - lr: 0.025000 |
|
2021-12-31 10:31:29,079 epoch 35 - iter 540/1807 - loss 0.05935994 - samples/sec: 89.67 - lr: 0.025000 |
|
2021-12-31 10:31:45,084 epoch 35 - iter 720/1807 - loss 0.05982168 - samples/sec: 90.10 - lr: 0.025000 |
|
2021-12-31 10:32:00,692 epoch 35 - iter 900/1807 - loss 0.05928538 - samples/sec: 92.39 - lr: 0.025000 |
|
2021-12-31 10:32:16,615 epoch 35 - iter 1080/1807 - loss 0.05961166 - samples/sec: 90.58 - lr: 0.025000 |
|
2021-12-31 10:32:32,475 epoch 35 - iter 1260/1807 - loss 0.06019352 - samples/sec: 90.93 - lr: 0.025000 |
|
2021-12-31 10:32:48,494 epoch 35 - iter 1440/1807 - loss 0.06020781 - samples/sec: 90.02 - lr: 0.025000 |
|
2021-12-31 10:33:04,244 epoch 35 - iter 1620/1807 - loss 0.05999299 - samples/sec: 91.57 - lr: 0.025000 |
|
2021-12-31 10:33:20,684 epoch 35 - iter 1800/1807 - loss 0.05998842 - samples/sec: 87.72 - lr: 0.025000 |
|
2021-12-31 10:33:21,238 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:33:21,238 EPOCH 35 done: loss 0.0600 - lr 0.0250000 |
|
2021-12-31 10:33:57,434 DEV : loss 0.06338120251893997 - f1-score (micro avg) 0.9829 |
|
2021-12-31 10:33:57,624 BAD EPOCHS (no improvement): 1 |
|
2021-12-31 10:33:57,626 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:34:13,768 epoch 36 - iter 180/1807 - loss 0.06028850 - samples/sec: 89.35 - lr: 0.025000 |
|
2021-12-31 10:34:29,556 epoch 36 - iter 360/1807 - loss 0.05827195 - samples/sec: 91.34 - lr: 0.025000 |
|
2021-12-31 10:34:46,060 epoch 36 - iter 540/1807 - loss 0.05947832 - samples/sec: 87.38 - lr: 0.025000 |
|
2021-12-31 10:35:02,018 epoch 36 - iter 720/1807 - loss 0.05898679 - samples/sec: 90.38 - lr: 0.025000 |
|
2021-12-31 10:35:18,203 epoch 36 - iter 900/1807 - loss 0.05910041 - samples/sec: 89.10 - lr: 0.025000 |
|
2021-12-31 10:35:34,254 epoch 36 - iter 1080/1807 - loss 0.05973540 - samples/sec: 89.84 - lr: 0.025000 |
|
2021-12-31 10:35:50,256 epoch 36 - iter 1260/1807 - loss 0.05924335 - samples/sec: 90.13 - lr: 0.025000 |
|
2021-12-31 10:36:06,236 epoch 36 - iter 1440/1807 - loss 0.05881263 - samples/sec: 90.25 - lr: 0.025000 |
|
2021-12-31 10:36:22,117 epoch 36 - iter 1620/1807 - loss 0.05885928 - samples/sec: 90.80 - lr: 0.025000 |
|
2021-12-31 10:36:38,208 epoch 36 - iter 1800/1807 - loss 0.05867245 - samples/sec: 89.62 - lr: 0.025000 |
|
2021-12-31 10:36:38,763 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:36:38,763 EPOCH 36 done: loss 0.0587 - lr 0.0250000 |
|
2021-12-31 10:37:17,552 DEV : loss 0.06424003839492798 - f1-score (micro avg) 0.9835 |
|
2021-12-31 10:37:17,751 BAD EPOCHS (no improvement): 2 |
|
2021-12-31 10:37:17,752 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:37:33,804 epoch 37 - iter 180/1807 - loss 0.05692650 - samples/sec: 89.85 - lr: 0.025000 |
|
2021-12-31 10:37:50,368 epoch 37 - iter 360/1807 - loss 0.05616469 - samples/sec: 87.06 - lr: 0.025000 |
|
2021-12-31 10:38:06,389 epoch 37 - iter 540/1807 - loss 0.05662717 - samples/sec: 90.01 - lr: 0.025000 |
|
2021-12-31 10:38:22,399 epoch 37 - iter 720/1807 - loss 0.05716632 - samples/sec: 90.08 - lr: 0.025000 |
|
2021-12-31 10:38:37,783 epoch 37 - iter 900/1807 - loss 0.05713545 - samples/sec: 93.74 - lr: 0.025000 |
|
2021-12-31 10:38:53,871 epoch 37 - iter 1080/1807 - loss 0.05764661 - samples/sec: 89.64 - lr: 0.025000 |
|
2021-12-31 10:39:10,031 epoch 37 - iter 1260/1807 - loss 0.05713711 - samples/sec: 89.23 - lr: 0.025000 |
|
2021-12-31 10:39:25,737 epoch 37 - iter 1440/1807 - loss 0.05769197 - samples/sec: 91.83 - lr: 0.025000 |
|
2021-12-31 10:39:41,486 epoch 37 - iter 1620/1807 - loss 0.05788084 - samples/sec: 91.57 - lr: 0.025000 |
|
2021-12-31 10:39:57,218 epoch 37 - iter 1800/1807 - loss 0.05864320 - samples/sec: 91.67 - lr: 0.025000 |
|
2021-12-31 10:39:57,747 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:39:57,748 EPOCH 37 done: loss 0.0586 - lr 0.0250000 |
|
2021-12-31 10:40:34,869 DEV : loss 0.06326954811811447 - f1-score (micro avg) 0.9831 |
|
2021-12-31 10:40:35,052 BAD EPOCHS (no improvement): 3 |
|
2021-12-31 10:40:35,054 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:40:51,312 epoch 38 - iter 180/1807 - loss 0.05496563 - samples/sec: 88.71 - lr: 0.025000 |
|
2021-12-31 10:41:07,088 epoch 38 - iter 360/1807 - loss 0.05435886 - samples/sec: 91.42 - lr: 0.025000 |
|
2021-12-31 10:41:22,841 epoch 38 - iter 540/1807 - loss 0.05464384 - samples/sec: 91.55 - lr: 0.025000 |
|
2021-12-31 10:41:38,398 epoch 38 - iter 720/1807 - loss 0.05548335 - samples/sec: 92.69 - lr: 0.025000 |
|
2021-12-31 10:41:54,754 epoch 38 - iter 900/1807 - loss 0.05628518 - samples/sec: 88.18 - lr: 0.025000 |
|
2021-12-31 10:42:10,229 epoch 38 - iter 1080/1807 - loss 0.05604961 - samples/sec: 93.19 - lr: 0.025000 |
|
2021-12-31 10:42:26,417 epoch 38 - iter 1260/1807 - loss 0.05594531 - samples/sec: 89.09 - lr: 0.025000 |
|
2021-12-31 10:42:42,839 epoch 38 - iter 1440/1807 - loss 0.05651329 - samples/sec: 87.81 - lr: 0.025000 |
|
2021-12-31 10:42:58,889 epoch 38 - iter 1620/1807 - loss 0.05695998 - samples/sec: 89.85 - lr: 0.025000 |
|
2021-12-31 10:43:15,043 epoch 38 - iter 1800/1807 - loss 0.05706783 - samples/sec: 89.27 - lr: 0.025000 |
|
2021-12-31 10:43:15,590 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:43:15,590 EPOCH 38 done: loss 0.0570 - lr 0.0250000 |
|
2021-12-31 10:43:52,423 DEV : loss 0.06343492120504379 - f1-score (micro avg) 0.9831 |
|
2021-12-31 10:43:52,610 BAD EPOCHS (no improvement): 4 |
|
2021-12-31 10:43:52,612 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:44:08,739 epoch 39 - iter 180/1807 - loss 0.05834451 - samples/sec: 89.43 - lr: 0.012500 |
|
2021-12-31 10:44:24,462 epoch 39 - iter 360/1807 - loss 0.05496382 - samples/sec: 91.72 - lr: 0.012500 |
|
2021-12-31 10:44:40,570 epoch 39 - iter 540/1807 - loss 0.05537094 - samples/sec: 89.53 - lr: 0.012500 |
|
2021-12-31 10:44:56,434 epoch 39 - iter 720/1807 - loss 0.05546561 - samples/sec: 90.90 - lr: 0.012500 |
|
2021-12-31 10:45:12,338 epoch 39 - iter 900/1807 - loss 0.05527723 - samples/sec: 90.67 - lr: 0.012500 |
|
2021-12-31 10:45:27,903 epoch 39 - iter 1080/1807 - loss 0.05518412 - samples/sec: 92.65 - lr: 0.012500 |
|
2021-12-31 10:45:43,777 epoch 39 - iter 1260/1807 - loss 0.05540916 - samples/sec: 90.86 - lr: 0.012500 |
|
2021-12-31 10:45:59,259 epoch 39 - iter 1440/1807 - loss 0.05568263 - samples/sec: 93.15 - lr: 0.012500 |
|
2021-12-31 10:46:15,024 epoch 39 - iter 1620/1807 - loss 0.05532678 - samples/sec: 91.47 - lr: 0.012500 |
|
2021-12-31 10:46:30,975 epoch 39 - iter 1800/1807 - loss 0.05524694 - samples/sec: 90.40 - lr: 0.012500 |
|
2021-12-31 10:46:31,584 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:46:31,585 EPOCH 39 done: loss 0.0552 - lr 0.0125000 |
|
2021-12-31 10:47:10,908 DEV : loss 0.06419230252504349 - f1-score (micro avg) 0.9829 |
|
2021-12-31 10:47:11,105 BAD EPOCHS (no improvement): 1 |
|
2021-12-31 10:47:11,106 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:47:26,949 epoch 40 - iter 180/1807 - loss 0.05824543 - samples/sec: 91.06 - lr: 0.012500 |
|
2021-12-31 10:47:42,913 epoch 40 - iter 360/1807 - loss 0.05527233 - samples/sec: 90.33 - lr: 0.012500 |
|
2021-12-31 10:47:59,224 epoch 40 - iter 540/1807 - loss 0.05570769 - samples/sec: 88.41 - lr: 0.012500 |
|
2021-12-31 10:48:14,703 epoch 40 - iter 720/1807 - loss 0.05485811 - samples/sec: 93.17 - lr: 0.012500 |
|
2021-12-31 10:48:30,458 epoch 40 - iter 900/1807 - loss 0.05502772 - samples/sec: 91.54 - lr: 0.012500 |
|
2021-12-31 10:48:46,369 epoch 40 - iter 1080/1807 - loss 0.05487373 - samples/sec: 90.63 - lr: 0.012500 |
|
2021-12-31 10:49:01,734 epoch 40 - iter 1260/1807 - loss 0.05438047 - samples/sec: 93.85 - lr: 0.012500 |
|
2021-12-31 10:49:17,649 epoch 40 - iter 1440/1807 - loss 0.05459548 - samples/sec: 90.61 - lr: 0.012500 |
|
2021-12-31 10:49:33,390 epoch 40 - iter 1620/1807 - loss 0.05450567 - samples/sec: 91.62 - lr: 0.012500 |
|
2021-12-31 10:49:49,353 epoch 40 - iter 1800/1807 - loss 0.05462945 - samples/sec: 90.34 - lr: 0.012500 |
|
2021-12-31 10:49:49,959 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:49:49,959 EPOCH 40 done: loss 0.0546 - lr 0.0125000 |
|
2021-12-31 10:50:26,216 DEV : loss 0.06343018263578415 - f1-score (micro avg) 0.9829 |
|
2021-12-31 10:50:26,401 BAD EPOCHS (no improvement): 2 |
|
2021-12-31 10:50:26,402 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:50:42,801 epoch 41 - iter 180/1807 - loss 0.04923909 - samples/sec: 87.95 - lr: 0.012500 |
|
2021-12-31 10:50:58,898 epoch 41 - iter 360/1807 - loss 0.05125288 - samples/sec: 89.59 - lr: 0.012500 |
|
2021-12-31 10:51:14,501 epoch 41 - iter 540/1807 - loss 0.05242298 - samples/sec: 92.43 - lr: 0.012500 |
|
2021-12-31 10:51:30,244 epoch 41 - iter 720/1807 - loss 0.05272643 - samples/sec: 91.60 - lr: 0.012500 |
|
2021-12-31 10:51:46,266 epoch 41 - iter 900/1807 - loss 0.05277145 - samples/sec: 90.01 - lr: 0.012500 |
|
2021-12-31 10:52:02,535 epoch 41 - iter 1080/1807 - loss 0.05329680 - samples/sec: 88.64 - lr: 0.012500 |
|
2021-12-31 10:52:18,362 epoch 41 - iter 1260/1807 - loss 0.05349535 - samples/sec: 91.12 - lr: 0.012500 |
|
2021-12-31 10:52:34,324 epoch 41 - iter 1440/1807 - loss 0.05371268 - samples/sec: 90.35 - lr: 0.012500 |
|
2021-12-31 10:52:50,154 epoch 41 - iter 1620/1807 - loss 0.05362217 - samples/sec: 91.09 - lr: 0.012500 |
|
2021-12-31 10:53:06,114 epoch 41 - iter 1800/1807 - loss 0.05361560 - samples/sec: 90.36 - lr: 0.012500 |
|
2021-12-31 10:53:06,648 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:53:06,649 EPOCH 41 done: loss 0.0537 - lr 0.0125000 |
|
2021-12-31 10:53:42,920 DEV : loss 0.06420625746250153 - f1-score (micro avg) 0.9831 |
|
2021-12-31 10:53:43,107 BAD EPOCHS (no improvement): 3 |
|
2021-12-31 10:53:43,108 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:53:59,320 epoch 42 - iter 180/1807 - loss 0.04886676 - samples/sec: 88.96 - lr: 0.012500 |
|
2021-12-31 10:54:15,301 epoch 42 - iter 360/1807 - loss 0.05210812 - samples/sec: 90.24 - lr: 0.012500 |
|
2021-12-31 10:54:31,014 epoch 42 - iter 540/1807 - loss 0.05220145 - samples/sec: 91.78 - lr: 0.012500 |
|
2021-12-31 10:54:46,930 epoch 42 - iter 720/1807 - loss 0.05239133 - samples/sec: 90.61 - lr: 0.012500 |
|
2021-12-31 10:55:02,977 epoch 42 - iter 900/1807 - loss 0.05260141 - samples/sec: 89.87 - lr: 0.012500 |
|
2021-12-31 10:55:19,228 epoch 42 - iter 1080/1807 - loss 0.05260187 - samples/sec: 88.74 - lr: 0.012500 |
|
2021-12-31 10:55:35,215 epoch 42 - iter 1260/1807 - loss 0.05242910 - samples/sec: 90.21 - lr: 0.012500 |
|
2021-12-31 10:55:51,163 epoch 42 - iter 1440/1807 - loss 0.05265492 - samples/sec: 90.43 - lr: 0.012500 |
|
2021-12-31 10:56:07,328 epoch 42 - iter 1620/1807 - loss 0.05317972 - samples/sec: 89.21 - lr: 0.012500 |
|
2021-12-31 10:56:23,405 epoch 42 - iter 1800/1807 - loss 0.05319734 - samples/sec: 89.70 - lr: 0.012500 |
|
2021-12-31 10:56:23,951 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:56:23,951 EPOCH 42 done: loss 0.0532 - lr 0.0125000 |
|
2021-12-31 10:57:03,168 DEV : loss 0.06362675130367279 - f1-score (micro avg) 0.9831 |
|
2021-12-31 10:57:03,368 BAD EPOCHS (no improvement): 4 |
|
2021-12-31 10:57:03,370 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:57:19,009 epoch 43 - iter 180/1807 - loss 0.05496817 - samples/sec: 92.23 - lr: 0.006250 |
|
2021-12-31 10:57:34,952 epoch 43 - iter 360/1807 - loss 0.05262157 - samples/sec: 90.45 - lr: 0.006250 |
|
2021-12-31 10:57:51,104 epoch 43 - iter 540/1807 - loss 0.05252708 - samples/sec: 89.28 - lr: 0.006250 |
|
2021-12-31 10:58:06,630 epoch 43 - iter 720/1807 - loss 0.05258453 - samples/sec: 92.89 - lr: 0.006250 |
|
2021-12-31 10:58:22,297 epoch 43 - iter 900/1807 - loss 0.05170441 - samples/sec: 92.05 - lr: 0.006250 |
|
2021-12-31 10:58:38,636 epoch 43 - iter 1080/1807 - loss 0.05199907 - samples/sec: 88.26 - lr: 0.006250 |
|
2021-12-31 10:58:54,582 epoch 43 - iter 1260/1807 - loss 0.05289598 - samples/sec: 90.42 - lr: 0.006250 |
|
2021-12-31 10:59:10,756 epoch 43 - iter 1440/1807 - loss 0.05239565 - samples/sec: 89.17 - lr: 0.006250 |
|
2021-12-31 10:59:26,756 epoch 43 - iter 1620/1807 - loss 0.05245197 - samples/sec: 90.14 - lr: 0.006250 |
|
2021-12-31 10:59:43,140 epoch 43 - iter 1800/1807 - loss 0.05236153 - samples/sec: 88.01 - lr: 0.006250 |
|
2021-12-31 10:59:43,734 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 10:59:43,734 EPOCH 43 done: loss 0.0523 - lr 0.0062500 |
|
2021-12-31 11:00:19,875 DEV : loss 0.06449297815561295 - f1-score (micro avg) 0.983 |
|
2021-12-31 11:00:20,058 BAD EPOCHS (no improvement): 1 |
|
2021-12-31 11:00:20,060 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 11:00:36,054 epoch 44 - iter 180/1807 - loss 0.05668095 - samples/sec: 90.17 - lr: 0.006250 |
|
2021-12-31 11:00:51,879 epoch 44 - iter 360/1807 - loss 0.05376107 - samples/sec: 91.13 - lr: 0.006250 |
|
2021-12-31 11:01:07,774 epoch 44 - iter 540/1807 - loss 0.05410164 - samples/sec: 90.73 - lr: 0.006250 |
|
2021-12-31 11:01:23,539 epoch 44 - iter 720/1807 - loss 0.05349578 - samples/sec: 91.47 - lr: 0.006250 |
|
2021-12-31 11:01:39,511 epoch 44 - iter 900/1807 - loss 0.05316904 - samples/sec: 90.29 - lr: 0.006250 |
|
2021-12-31 11:01:55,495 epoch 44 - iter 1080/1807 - loss 0.05360298 - samples/sec: 90.23 - lr: 0.006250 |
|
2021-12-31 11:02:11,974 epoch 44 - iter 1260/1807 - loss 0.05360002 - samples/sec: 87.52 - lr: 0.006250 |
|
2021-12-31 11:02:27,697 epoch 44 - iter 1440/1807 - loss 0.05333331 - samples/sec: 91.72 - lr: 0.006250 |
|
2021-12-31 11:02:43,120 epoch 44 - iter 1620/1807 - loss 0.05286587 - samples/sec: 93.50 - lr: 0.006250 |
|
2021-12-31 11:02:58,798 epoch 44 - iter 1800/1807 - loss 0.05270956 - samples/sec: 91.99 - lr: 0.006250 |
|
2021-12-31 11:02:59,351 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 11:02:59,352 EPOCH 44 done: loss 0.0527 - lr 0.0062500 |
|
2021-12-31 11:03:35,832 DEV : loss 0.06455685943365097 - f1-score (micro avg) 0.9831 |
|
2021-12-31 11:03:36,019 BAD EPOCHS (no improvement): 2 |
|
2021-12-31 11:03:36,021 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 11:03:52,202 epoch 45 - iter 180/1807 - loss 0.05063292 - samples/sec: 89.13 - lr: 0.006250 |
|
2021-12-31 11:04:08,225 epoch 45 - iter 360/1807 - loss 0.05171673 - samples/sec: 90.00 - lr: 0.006250 |
|
2021-12-31 11:04:24,263 epoch 45 - iter 540/1807 - loss 0.05167432 - samples/sec: 89.93 - lr: 0.006250 |
|
2021-12-31 11:04:40,362 epoch 45 - iter 720/1807 - loss 0.05121190 - samples/sec: 89.58 - lr: 0.006250 |
|
2021-12-31 11:04:56,274 epoch 45 - iter 900/1807 - loss 0.05221446 - samples/sec: 90.63 - lr: 0.006250 |
|
2021-12-31 11:05:12,479 epoch 45 - iter 1080/1807 - loss 0.05188940 - samples/sec: 88.99 - lr: 0.006250 |
|
2021-12-31 11:05:28,572 epoch 45 - iter 1260/1807 - loss 0.05237022 - samples/sec: 89.62 - lr: 0.006250 |
|
2021-12-31 11:05:44,476 epoch 45 - iter 1440/1807 - loss 0.05180768 - samples/sec: 90.68 - lr: 0.006250 |
|
2021-12-31 11:06:00,356 epoch 45 - iter 1620/1807 - loss 0.05176296 - samples/sec: 90.81 - lr: 0.006250 |
|
2021-12-31 11:06:16,343 epoch 45 - iter 1800/1807 - loss 0.05236414 - samples/sec: 90.20 - lr: 0.006250 |
|
2021-12-31 11:06:16,948 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 11:06:16,949 EPOCH 45 done: loss 0.0523 - lr 0.0062500 |
|
2021-12-31 11:06:56,269 DEV : loss 0.06413871794939041 - f1-score (micro avg) 0.983 |
|
2021-12-31 11:06:56,425 BAD EPOCHS (no improvement): 3 |
|
2021-12-31 11:06:56,427 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 11:07:12,359 epoch 46 - iter 180/1807 - loss 0.04909660 - samples/sec: 90.52 - lr: 0.006250 |
|
2021-12-31 11:07:27,933 epoch 46 - iter 360/1807 - loss 0.04990439 - samples/sec: 92.58 - lr: 0.006250 |
|
2021-12-31 11:07:44,036 epoch 46 - iter 540/1807 - loss 0.05183261 - samples/sec: 89.55 - lr: 0.006250 |
|
2021-12-31 11:07:59,808 epoch 46 - iter 720/1807 - loss 0.05108367 - samples/sec: 91.44 - lr: 0.006250 |
|
2021-12-31 11:08:16,323 epoch 46 - iter 900/1807 - loss 0.05156129 - samples/sec: 87.33 - lr: 0.006250 |
|
2021-12-31 11:08:32,181 epoch 46 - iter 1080/1807 - loss 0.05164911 - samples/sec: 90.93 - lr: 0.006250 |
|
2021-12-31 11:08:48,124 epoch 46 - iter 1260/1807 - loss 0.05241189 - samples/sec: 90.45 - lr: 0.006250 |
|
2021-12-31 11:09:04,600 epoch 46 - iter 1440/1807 - loss 0.05209220 - samples/sec: 87.53 - lr: 0.006250 |
|
2021-12-31 11:09:20,227 epoch 46 - iter 1620/1807 - loss 0.05187081 - samples/sec: 92.29 - lr: 0.006250 |
|
2021-12-31 11:09:36,191 epoch 46 - iter 1800/1807 - loss 0.05205935 - samples/sec: 90.34 - lr: 0.006250 |
|
2021-12-31 11:09:36,782 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 11:09:36,782 EPOCH 46 done: loss 0.0521 - lr 0.0062500 |
|
2021-12-31 11:10:13,201 DEV : loss 0.0644669309258461 - f1-score (micro avg) 0.983 |
|
2021-12-31 11:10:13,398 BAD EPOCHS (no improvement): 4 |
|
2021-12-31 11:10:13,399 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 11:10:29,417 epoch 47 - iter 180/1807 - loss 0.05250873 - samples/sec: 90.04 - lr: 0.003125 |
|
2021-12-31 11:10:45,589 epoch 47 - iter 360/1807 - loss 0.05160928 - samples/sec: 89.18 - lr: 0.003125 |
|
2021-12-31 11:11:01,280 epoch 47 - iter 540/1807 - loss 0.05161492 - samples/sec: 91.91 - lr: 0.003125 |
|
2021-12-31 11:11:17,277 epoch 47 - iter 720/1807 - loss 0.05136337 - samples/sec: 90.15 - lr: 0.003125 |
|
2021-12-31 11:11:33,230 epoch 47 - iter 900/1807 - loss 0.05023989 - samples/sec: 90.40 - lr: 0.003125 |
|
2021-12-31 11:11:49,156 epoch 47 - iter 1080/1807 - loss 0.05064277 - samples/sec: 90.55 - lr: 0.003125 |
|
2021-12-31 11:12:04,959 epoch 47 - iter 1260/1807 - loss 0.05089925 - samples/sec: 91.25 - lr: 0.003125 |
|
2021-12-31 11:12:21,092 epoch 47 - iter 1440/1807 - loss 0.05071923 - samples/sec: 89.39 - lr: 0.003125 |
|
2021-12-31 11:12:36,949 epoch 47 - iter 1620/1807 - loss 0.05083516 - samples/sec: 90.95 - lr: 0.003125 |
|
2021-12-31 11:12:52,744 epoch 47 - iter 1800/1807 - loss 0.05106443 - samples/sec: 91.31 - lr: 0.003125 |
|
2021-12-31 11:12:53,321 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 11:12:53,321 EPOCH 47 done: loss 0.0511 - lr 0.0031250 |
|
2021-12-31 11:13:29,490 DEV : loss 0.06470787525177002 - f1-score (micro avg) 0.9829 |
|
2021-12-31 11:13:29,672 BAD EPOCHS (no improvement): 1 |
|
2021-12-31 11:13:29,674 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 11:13:45,987 epoch 48 - iter 180/1807 - loss 0.05119727 - samples/sec: 88.41 - lr: 0.003125 |
|
2021-12-31 11:14:02,271 epoch 48 - iter 360/1807 - loss 0.05026057 - samples/sec: 88.57 - lr: 0.003125 |
|
2021-12-31 11:14:18,202 epoch 48 - iter 540/1807 - loss 0.04968790 - samples/sec: 90.53 - lr: 0.003125 |
|
2021-12-31 11:14:33,834 epoch 48 - iter 720/1807 - loss 0.05040465 - samples/sec: 92.25 - lr: 0.003125 |
|
2021-12-31 11:14:49,709 epoch 48 - iter 900/1807 - loss 0.05065504 - samples/sec: 90.84 - lr: 0.003125 |
|
2021-12-31 11:15:05,727 epoch 48 - iter 1080/1807 - loss 0.05037297 - samples/sec: 90.02 - lr: 0.003125 |
|
2021-12-31 11:15:21,077 epoch 48 - iter 1260/1807 - loss 0.05063199 - samples/sec: 93.96 - lr: 0.003125 |
|
2021-12-31 11:15:36,587 epoch 48 - iter 1440/1807 - loss 0.05076731 - samples/sec: 92.98 - lr: 0.003125 |
|
2021-12-31 11:15:52,489 epoch 48 - iter 1620/1807 - loss 0.05082260 - samples/sec: 90.68 - lr: 0.003125 |
|
2021-12-31 11:16:08,520 epoch 48 - iter 1800/1807 - loss 0.05101165 - samples/sec: 89.96 - lr: 0.003125 |
|
2021-12-31 11:16:09,115 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 11:16:09,116 EPOCH 48 done: loss 0.0510 - lr 0.0031250 |
|
2021-12-31 11:16:48,035 DEV : loss 0.06484530121088028 - f1-score (micro avg) 0.983 |
|
2021-12-31 11:16:48,189 BAD EPOCHS (no improvement): 2 |
|
2021-12-31 11:16:48,191 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 11:17:03,775 epoch 49 - iter 180/1807 - loss 0.04706234 - samples/sec: 92.51 - lr: 0.003125 |
|
2021-12-31 11:17:19,604 epoch 49 - iter 360/1807 - loss 0.04796051 - samples/sec: 91.07 - lr: 0.003125 |
|
2021-12-31 11:17:35,506 epoch 49 - iter 540/1807 - loss 0.04820802 - samples/sec: 90.67 - lr: 0.003125 |
|
2021-12-31 11:17:51,301 epoch 49 - iter 720/1807 - loss 0.04872061 - samples/sec: 91.31 - lr: 0.003125 |
|
2021-12-31 11:18:06,963 epoch 49 - iter 900/1807 - loss 0.04900955 - samples/sec: 92.08 - lr: 0.003125 |
|
2021-12-31 11:18:22,961 epoch 49 - iter 1080/1807 - loss 0.04952427 - samples/sec: 90.14 - lr: 0.003125 |
|
2021-12-31 11:18:39,172 epoch 49 - iter 1260/1807 - loss 0.04981242 - samples/sec: 88.96 - lr: 0.003125 |
|
2021-12-31 11:18:55,485 epoch 49 - iter 1440/1807 - loss 0.05015633 - samples/sec: 88.41 - lr: 0.003125 |
|
2021-12-31 11:19:11,166 epoch 49 - iter 1620/1807 - loss 0.05076498 - samples/sec: 91.97 - lr: 0.003125 |
|
2021-12-31 11:19:27,065 epoch 49 - iter 1800/1807 - loss 0.05104387 - samples/sec: 90.71 - lr: 0.003125 |
|
2021-12-31 11:19:27,675 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 11:19:27,675 EPOCH 49 done: loss 0.0510 - lr 0.0031250 |
|
2021-12-31 11:20:04,021 DEV : loss 0.06486314535140991 - f1-score (micro avg) 0.983 |
|
2021-12-31 11:20:04,217 BAD EPOCHS (no improvement): 3 |
|
2021-12-31 11:20:04,218 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 11:20:20,650 epoch 50 - iter 180/1807 - loss 0.05726933 - samples/sec: 87.77 - lr: 0.003125 |
|
2021-12-31 11:20:36,455 epoch 50 - iter 360/1807 - loss 0.05538766 - samples/sec: 91.25 - lr: 0.003125 |
|
2021-12-31 11:20:52,012 epoch 50 - iter 540/1807 - loss 0.05444601 - samples/sec: 92.69 - lr: 0.003125 |
|
2021-12-31 11:21:07,973 epoch 50 - iter 720/1807 - loss 0.05313637 - samples/sec: 90.35 - lr: 0.003125 |
|
2021-12-31 11:21:23,983 epoch 50 - iter 900/1807 - loss 0.05290526 - samples/sec: 90.08 - lr: 0.003125 |
|
2021-12-31 11:21:39,924 epoch 50 - iter 1080/1807 - loss 0.05235234 - samples/sec: 90.47 - lr: 0.003125 |
|
2021-12-31 11:21:55,732 epoch 50 - iter 1260/1807 - loss 0.05207690 - samples/sec: 91.23 - lr: 0.003125 |
|
2021-12-31 11:22:11,663 epoch 50 - iter 1440/1807 - loss 0.05205514 - samples/sec: 90.52 - lr: 0.003125 |
|
2021-12-31 11:22:27,392 epoch 50 - iter 1620/1807 - loss 0.05173851 - samples/sec: 91.69 - lr: 0.003125 |
|
2021-12-31 11:22:43,193 epoch 50 - iter 1800/1807 - loss 0.05189058 - samples/sec: 91.27 - lr: 0.003125 |
|
2021-12-31 11:22:43,750 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 11:22:43,750 EPOCH 50 done: loss 0.0519 - lr 0.0031250 |
|
2021-12-31 11:23:20,432 DEV : loss 0.06452730298042297 - f1-score (micro avg) 0.9831 |
|
2021-12-31 11:23:20,619 BAD EPOCHS (no improvement): 4 |
|
2021-12-31 11:23:25,890 ---------------------------------------------------------------------------------------------------- |
|
2021-12-31 11:23:25,893 loading file models/UPOS_UD_FRENCH_GSD_PLUS_Flair-Embeddings_50_2021-12-31-08:34:44/best-model.pt |
|
2021-12-31 11:23:43,354 0.9797 0.9797 0.9797 0.9797 |
|
2021-12-31 11:23:43,354 |
|
Results: |
|
- F-score (micro) 0.9797 |
|
- F-score (macro) 0.9178 |
|
- Accuracy 0.9797 |
|
|
|
By class: |
|
precision recall f1-score support |
|
|
|
PREP 0.9966 0.9987 0.9976 1483 |
|
PUNCT 1.0000 1.0000 1.0000 833 |
|
NMS 0.9634 0.9801 0.9717 753 |
|
DET 0.9923 0.9984 0.9954 645 |
|
VERB 0.9913 0.9811 0.9862 583 |
|
NFS 0.9667 0.9839 0.9752 560 |
|
ADV 0.9940 0.9821 0.9880 504 |
|
PROPN 0.9541 0.8937 0.9229 395 |
|
DETMS 1.0000 1.0000 1.0000 362 |
|
AUX 0.9860 0.9915 0.9888 355 |
|
YPFOR 1.0000 1.0000 1.0000 353 |
|
NMP 0.9666 0.9475 0.9570 305 |
|
COCO 0.9959 1.0000 0.9980 245 |
|
ADJMS 0.9463 0.9385 0.9424 244 |
|
DETFS 1.0000 1.0000 1.0000 240 |
|
CHIF 0.9648 0.9865 0.9755 222 |
|
NFP 0.9515 0.9849 0.9679 199 |
|
ADJFS 0.9657 0.9286 0.9468 182 |
|
VPPMS 0.9387 0.9745 0.9563 157 |
|
COSUB 1.0000 0.9844 0.9921 128 |
|
DINTMS 0.9918 0.9918 0.9918 122 |
|
XFAMIL 0.9298 0.9217 0.9258 115 |
|
PPER3MS 1.0000 1.0000 1.0000 87 |
|
ADJMP 0.9294 0.9634 0.9461 82 |
|
PDEMMS 1.0000 1.0000 1.0000 75 |
|
ADJFP 0.9861 0.9342 0.9595 76 |
|
PREL 0.9859 1.0000 0.9929 70 |
|
DINTFS 0.9839 1.0000 0.9919 61 |
|
PREF 1.0000 1.0000 1.0000 52 |
|
PPOBJMS 0.9565 0.9362 0.9462 47 |
|
PREFP 0.9778 1.0000 0.9888 44 |
|
PINDMS 1.0000 0.9773 0.9885 44 |
|
VPPFS 0.8298 0.9750 0.8966 40 |
|
PPER1S 1.0000 1.0000 1.0000 42 |
|
SYM 1.0000 0.9474 0.9730 38 |
|
NOUN 0.8824 0.7692 0.8219 39 |
|
PRON 1.0000 0.9677 0.9836 31 |
|
PDEMFS 1.0000 1.0000 1.0000 29 |
|
VPPMP 0.9286 1.0000 0.9630 26 |
|
ADJ 0.9524 0.9091 0.9302 22 |
|
PPER3MP 1.0000 1.0000 1.0000 20 |
|
VPPFP 1.0000 1.0000 1.0000 19 |
|
PPER3FS 1.0000 1.0000 1.0000 18 |
|
MOTINC 0.3333 0.4000 0.3636 15 |
|
PREFS 1.0000 1.0000 1.0000 10 |
|
PPOBJMP 1.0000 0.8000 0.8889 10 |
|
PPOBJFS 0.6250 0.8333 0.7143 6 |
|
INTJ 0.5000 0.6667 0.5714 6 |
|
PART 1.0000 1.0000 1.0000 4 |
|
PDEMMP 1.0000 1.0000 1.0000 3 |
|
PDEMFP 1.0000 1.0000 1.0000 3 |
|
PPER3FP 1.0000 1.0000 1.0000 2 |
|
NUM 1.0000 0.3333 0.5000 3 |
|
PPER2S 1.0000 1.0000 1.0000 2 |
|
PPOBJFP 0.5000 0.5000 0.5000 2 |
|
PRELMS 1.0000 1.0000 1.0000 2 |
|
PINDFS 0.5000 1.0000 0.6667 1 |
|
PINDMP 1.0000 1.0000 1.0000 1 |
|
X 0.0000 0.0000 0.0000 1 |
|
PINDFP 1.0000 1.0000 1.0000 1 |
|
|
|
micro avg 0.9797 0.9797 0.9797 10019 |
|
macro avg 0.9228 0.9230 0.9178 10019 |
|
weighted avg 0.9802 0.9797 0.9798 10019 |
|
samples avg 0.9797 0.9797 0.9797 10019 |
|
|
|
2021-12-31 11:23:43,354 ---------------------------------------------------------------------------------------------------- |
|
|