mariagrandury committed 15 days ago

Commit

1c7d2cb

verified ·

1 Parent(s): d615e1f

End of training

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

README.md +19 -12
config.json +18 -15
logs/events.out.tfevents.1740157634.a2d653e866f9.226.3 +3 -0
logs/events.out.tfevents.1740162891.0a0ba32201a8.2151.21 +3 -0
logs/events.out.tfevents.1740163730.0a0ba32201a8.2151.22 +3 -0
model.safetensors +2 -2
model_stats.json +157 -238
tokenizer.json +2 -2
tokenizer_config.json +1 -1
training_args.bin +2 -2
trial_0/checkpoint-292/config.json +50 -0
trial_0/checkpoint-292/model.safetensors +3 -0
trial_0/checkpoint-292/optimizer.pt +3 -0
trial_0/checkpoint-292/rng_state.pth +3 -0
trial_0/checkpoint-292/scheduler.pt +3 -0
trial_0/checkpoint-292/special_tokens_map.json +37 -0
trial_0/checkpoint-292/tokenizer.json +0 -0
trial_0/checkpoint-292/tokenizer_config.json +58 -0
trial_0/checkpoint-292/trainer_state.json +314 -0
trial_0/checkpoint-292/training_args.bin +3 -0
trial_0/checkpoint-292/vocab.txt +0 -0
trial_0/checkpoint-584/config.json +50 -0
trial_0/checkpoint-584/model.safetensors +3 -0
trial_0/checkpoint-584/optimizer.pt +3 -0
trial_0/checkpoint-584/rng_state.pth +3 -0
trial_0/checkpoint-584/scheduler.pt +3 -0
trial_0/checkpoint-584/special_tokens_map.json +37 -0
trial_0/checkpoint-584/tokenizer.json +0 -0
trial_0/checkpoint-584/tokenizer_config.json +58 -0
trial_0/checkpoint-584/trainer_state.json +595 -0
trial_0/checkpoint-584/training_args.bin +3 -0
trial_0/checkpoint-584/vocab.txt +0 -0
trial_0/checkpoint-876/config.json +50 -0
trial_0/checkpoint-876/model.safetensors +3 -0
trial_0/checkpoint-876/optimizer.pt +3 -0
trial_0/checkpoint-876/rng_state.pth +3 -0
trial_0/checkpoint-876/scheduler.pt +3 -0
trial_0/checkpoint-876/special_tokens_map.json +37 -0
trial_0/checkpoint-876/tokenizer.json +0 -0
trial_0/checkpoint-876/tokenizer_config.json +58 -0
trial_0/checkpoint-876/trainer_state.json +876 -0
trial_0/checkpoint-876/training_args.bin +3 -0
trial_0/checkpoint-876/vocab.txt +0 -0
trial_0/logs/events.out.tfevents.1740158198.a2d653e866f9.226.4 +3 -0
trial_0/logs/events.out.tfevents.1740161296.0a0ba32201a8.2151.0 +3 -0
trial_0/logs/events.out.tfevents.1740161531.0a0ba32201a8.2151.1 +3 -0
trial_0/logs/events.out.tfevents.1740161645.0a0ba32201a8.2151.2 +3 -0
trial_1/checkpoint-146/config.json +50 -0
trial_1/checkpoint-146/model.safetensors +3 -0
trial_1/checkpoint-146/optimizer.pt +3 -0

README.md CHANGED Viewed

@@ -1,8 +1,10 @@
 ---
 library_name: transformers
-base_model: dccuchile/distilbert-base-spanish-uncased
 tags:
 - generated_from_trainer
 model-index:
 - name: bluesky-spanish-classifier
   results: []
@@ -13,10 +15,11 @@ should probably proofread and complete it, then remove this comment. -->
 # bluesky-spanish-classifier
-This model is a fine-tuned version of [dccuchile/distilbert-base-spanish-uncased](https://huggingface.co/dccuchile/distilbert-base-spanish-uncased) on an unknown dataset.
 It achieves the following results on the evaluation set:
-- Loss: 2.2149
-- Classification Report: {'ar': {'precision': 0.125, 'recall': 0.014492753623188406, 'f1-score': 0.025974025974025976, 'support': 207.0}, 'cl': {'precision': 0.0, 'recall': 0.0, 'f1-score': 0.0, 'support': 263.0}, 'co': {'precision': 0.0, 'recall': 0.0, 'f1-score': 0.0, 'support': 171.0}, 'es': {'precision': 0.6666666666666666, 'recall': 0.006024096385542169, 'f1-score': 0.011940298507462687, 'support': 332.0}, 'mx': {'precision': 0.0, 'recall': 0.0, 'f1-score': 0.0, 'support': 203.0}, 'pe': {'precision': 0.03333333333333333, 'recall': 0.006211180124223602, 'f1-score': 0.010471204188481676, 'support': 161.0}, 'pr': {'precision': 0.09401709401709402, 'recall': 0.22, 'f1-score': 0.1317365269461078, 'support': 50.0}, 'uy': {'precision': 0.07073715562174236, 'recall': 0.8260869565217391, 'f1-score': 0.13031550068587106, 'support': 115.0}, 've': {'precision': 0.0, 'recall': 0.0, 'f1-score': 0.0, 'support': 22.0}, 'accuracy': 0.07349081364829396, 'macro avg': {'precision': 0.10997269440431515, 'recall': 0.1192016651838548, 'f1-score': 0.03449306181132769, 'support': 1524.0}, 'weighted avg': {'precision': 0.17415395511637471, 'recall': 0.07349081364829396, 'f1-score': 0.021390928662484977, 'support': 1524.0}}
 ## Model description
@@ -35,20 +38,24 @@ More information needed
 ### Training hyperparameters
 The following hyperparameters were used during training:
-- learning_rate: 2e-05
-- train_batch_size: 4
-- eval_batch_size: 4
 - seed: 42
 - optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
 - lr_scheduler_type: linear
-- lr_scheduler_warmup_steps: 2
-- training_steps: 2
 ### Training results
-| Training Loss | Epoch  | Step | Validation Loss | Classification Report                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                        |
-|:-------------:|:------:|:----:|:---------------:|:--------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------:|
-| 2.2248        | 0.0022 | 2    | 2.2149          | {'ar': {'precision': 0.125, 'recall': 0.014492753623188406, 'f1-score': 0.025974025974025976, 'support': 207.0}, 'cl': {'precision': 0.0, 'recall': 0.0, 'f1-score': 0.0, 'support': 263.0}, 'co': {'precision': 0.0, 'recall': 0.0, 'f1-score': 0.0, 'support': 171.0}, 'es': {'precision': 0.6666666666666666, 'recall': 0.006024096385542169, 'f1-score': 0.011940298507462687, 'support': 332.0}, 'mx': {'precision': 0.0, 'recall': 0.0, 'f1-score': 0.0, 'support': 203.0}, 'pe': {'precision': 0.03333333333333333, 'recall': 0.006211180124223602, 'f1-score': 0.010471204188481676, 'support': 161.0}, 'pr': {'precision': 0.09401709401709402, 'recall': 0.22, 'f1-score': 0.1317365269461078, 'support': 50.0}, 'uy': {'precision': 0.07073715562174236, 'recall': 0.8260869565217391, 'f1-score': 0.13031550068587106, 'support': 115.0}, 've': {'precision': 0.0, 'recall': 0.0, 'f1-score': 0.0, 'support': 22.0}, 'accuracy': 0.07349081364829396, 'macro avg': {'precision': 0.10997269440431515, 'recall': 0.1192016651838548, 'f1-score': 0.03449306181132769, 'support': 1524.0}, 'weighted avg': {'precision': 0.17415395511637471, 'recall': 0.07349081364829396, 'f1-score': 0.021390928662484977, 'support': 1524.0}} |
 ### Framework versions

 ---
 library_name: transformers
+base_model: dccuchile/bert-base-spanish-wwm-uncased
 tags:
 - generated_from_trainer
+metrics:
+- f1
 model-index:
 - name: bluesky-spanish-classifier
   results: []
 # bluesky-spanish-classifier
+This model is a fine-tuned version of [dccuchile/bert-base-spanish-wwm-uncased](https://huggingface.co/dccuchile/bert-base-spanish-wwm-uncased) on an unknown dataset.
 It achieves the following results on the evaluation set:
+- Loss: 2.3731
+- Classification Report: {'ar': {'precision': 0.4898785425101215, 'recall': 0.32180851063829785, 'f1-score': 0.3884430176565008, 'support': 376.0}, 'cl': {'precision': 0.3626666666666667, 'recall': 0.4722222222222222, 'f1-score': 0.41025641025641024, 'support': 576.0}, 'co': {'precision': 0.34656084656084657, 'recall': 0.3808139534883721, 'f1-score': 0.3628808864265928, 'support': 344.0}, 'es': {'precision': 0.4630738522954092, 'recall': 0.427255985267035, 'f1-score': 0.4444444444444444, 'support': 543.0}, 'mx': {'precision': 0.43380855397148677, 'recall': 0.43917525773195876, 'f1-score': 0.4364754098360656, 'support': 485.0}, 'pe': {'precision': 0.3769968051118211, 'recall': 0.3390804597701149, 'f1-score': 0.35703479576399394, 'support': 348.0}, 'pr': {'precision': 0.5736434108527132, 'recall': 0.7326732673267327, 'f1-score': 0.6434782608695652, 'support': 101.0}, 'uy': {'precision': 0.35096153846153844, 'recall': 0.3201754385964912, 'f1-score': 0.3348623853211009, 'support': 228.0}, 've': {'precision': 0.16666666666666666, 'recall': 0.045454545454545456, 'f1-score': 0.07142857142857142, 'support': 22.0}, 'accuracy': 0.4085345683096262, 'macro avg': {'precision': 0.39602854256636333, 'recall': 0.38651773783286336, 'f1-score': 0.3832560202225828, 'support': 3023.0}, 'weighted avg': {'precision': 0.4124949665181113, 'recall': 0.4085345683096262, 'f1-score': 0.40601279016852304, 'support': 3023.0}}
+- F1: 0.3833
 ## Model description
 ### Training hyperparameters
 The following hyperparameters were used during training:
+- learning_rate: 2.8600231011639855e-05
+- train_batch_size: 8
+- eval_batch_size: 8
 - seed: 42
 - optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
 - lr_scheduler_type: linear
+- lr_scheduler_warmup_ratio: 0.11531859504380029
+- num_epochs: 5
 ### Training results
+| Training Loss | Epoch | Step | Validation Loss | Classification Report                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                              | F1     |
+|:-------------:|:-----:|:----:|:---------------:|:--------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------:|:------:|
+| 1.7603        | 1.0   | 882  | 1.7406          | {'ar': {'precision': 0.35516372795969775, 'recall': 0.375, 'f1-score': 0.3648124191461837, 'support': 376.0}, 'cl': {'precision': 0.3016759776536313, 'recall': 0.28125, 'f1-score': 0.29110512129380056, 'support': 576.0}, 'co': {'precision': 0.3670886075949367, 'recall': 0.25290697674418605, 'f1-score': 0.29948364888123924, 'support': 344.0}, 'es': {'precision': 0.3584905660377358, 'recall': 0.4548802946593002, 'f1-score': 0.400974025974026, 'support': 543.0}, 'mx': {'precision': 0.32465753424657534, 'recall': 0.488659793814433, 'f1-score': 0.39012345679012345, 'support': 485.0}, 'pe': {'precision': 0.3958333333333333, 'recall': 0.27298850574712646, 'f1-score': 0.3231292517006803, 'support': 348.0}, 'pr': {'precision': 0.5631067961165048, 'recall': 0.5742574257425742, 'f1-score': 0.5686274509803921, 'support': 101.0}, 'uy': {'precision': 0.4666666666666667, 'recall': 0.18421052631578946, 'f1-score': 0.2641509433962264, 'support': 228.0}, 've': {'precision': 0.0, 'recall': 0.0, 'f1-score': 0.0, 'support': 22.0}, 'accuracy': 0.3536222295732716, 'macro avg': {'precision': 0.34807591217878686, 'recall': 0.3204615025581566, 'f1-score': 0.32248959090696355, 'support': 3023.0}, 'weighted avg': {'precision': 0.35948675942105285, 'recall': 0.3536222295732716, 'f1-score': 0.3456546260541325, 'support': 3023.0}}                                                                          | 0.3225 |
+| 1.4223        | 2.0   | 1764 | 1.6758          | {'ar': {'precision': 0.4349315068493151, 'recall': 0.3377659574468085, 'f1-score': 0.38023952095808383, 'support': 376.0}, 'cl': {'precision': 0.336996336996337, 'recall': 0.3194444444444444, 'f1-score': 0.32798573975044565, 'support': 576.0}, 'co': {'precision': 0.36333333333333334, 'recall': 0.3168604651162791, 'f1-score': 0.3385093167701863, 'support': 344.0}, 'es': {'precision': 0.38980716253443526, 'recall': 0.5211786372007366, 'f1-score': 0.44602048857368004, 'support': 543.0}, 'mx': {'precision': 0.35246995994659547, 'recall': 0.5443298969072164, 'f1-score': 0.42787682333873583, 'support': 485.0}, 'pe': {'precision': 0.44308943089430897, 'recall': 0.3132183908045977, 'f1-score': 0.367003367003367, 'support': 348.0}, 'pr': {'precision': 0.759493670886076, 'recall': 0.594059405940594, 'f1-score': 0.6666666666666666, 'support': 101.0}, 'uy': {'precision': 0.5542168674698795, 'recall': 0.20175438596491227, 'f1-score': 0.2958199356913183, 'support': 228.0}, 've': {'precision': 1.0, 'recall': 0.09090909090909091, 'f1-score': 0.16666666666666666, 'support': 22.0}, 'accuracy': 0.3916639100231558, 'macro avg': {'precision': 0.5149264743233645, 'recall': 0.35994674163718665, 'f1-score': 0.3796431694910167, 'support': 3023.0}, 'weighted avg': {'precision': 0.4116802685001794, 'recall': 0.3916639100231558, 'f1-score': 0.3851176158170783, 'support': 3023.0}}                     | 0.3796 |
+| 0.9068        | 3.0   | 2646 | 1.9523          | {'ar': {'precision': 0.39574468085106385, 'recall': 0.4946808510638298, 'f1-score': 0.4397163120567376, 'support': 376.0}, 'cl': {'precision': 0.35144927536231885, 'recall': 0.3368055555555556, 'f1-score': 0.34397163120567376, 'support': 576.0}, 'co': {'precision': 0.31555555555555553, 'recall': 0.4127906976744186, 'f1-score': 0.35768261964735515, 'support': 344.0}, 'es': {'precision': 0.47113163972286376, 'recall': 0.3756906077348066, 'f1-score': 0.4180327868852459, 'support': 543.0}, 'mx': {'precision': 0.43680709534368073, 'recall': 0.4061855670103093, 'f1-score': 0.42094017094017094, 'support': 485.0}, 'pe': {'precision': 0.38661710037174724, 'recall': 0.2988505747126437, 'f1-score': 0.3371150729335494, 'support': 348.0}, 'pr': {'precision': 0.64, 'recall': 0.6336633663366337, 'f1-score': 0.6368159203980099, 'support': 101.0}, 'uy': {'precision': 0.30662020905923343, 'recall': 0.38596491228070173, 'f1-score': 0.341747572815534, 'support': 228.0}, 've': {'precision': 0.18181818181818182, 'recall': 0.09090909090909091, 'f1-score': 0.12121212121212122, 'support': 22.0}, 'accuracy': 0.3906715183592458, 'macro avg': {'precision': 0.3873048597871828, 'recall': 0.3817268025864433, 'f1-score': 0.37969268978826637, 'support': 3023.0}, 'weighted avg': {'precision': 0.3971399185993649, 'recall': 0.3906715183592458, 'f1-score': 0.3902981034934984, 'support': 3023.0}}              | 0.3797 |
+| 0.4818        | 4.0   | 3528 | 2.3731          | {'ar': {'precision': 0.4898785425101215, 'recall': 0.32180851063829785, 'f1-score': 0.3884430176565008, 'support': 376.0}, 'cl': {'precision': 0.3626666666666667, 'recall': 0.4722222222222222, 'f1-score': 0.41025641025641024, 'support': 576.0}, 'co': {'precision': 0.34656084656084657, 'recall': 0.3808139534883721, 'f1-score': 0.3628808864265928, 'support': 344.0}, 'es': {'precision': 0.4630738522954092, 'recall': 0.427255985267035, 'f1-score': 0.4444444444444444, 'support': 543.0}, 'mx': {'precision': 0.43380855397148677, 'recall': 0.43917525773195876, 'f1-score': 0.4364754098360656, 'support': 485.0}, 'pe': {'precision': 0.3769968051118211, 'recall': 0.3390804597701149, 'f1-score': 0.35703479576399394, 'support': 348.0}, 'pr': {'precision': 0.5736434108527132, 'recall': 0.7326732673267327, 'f1-score': 0.6434782608695652, 'support': 101.0}, 'uy': {'precision': 0.35096153846153844, 'recall': 0.3201754385964912, 'f1-score': 0.3348623853211009, 'support': 228.0}, 've': {'precision': 0.16666666666666666, 'recall': 0.045454545454545456, 'f1-score': 0.07142857142857142, 'support': 22.0}, 'accuracy': 0.4085345683096262, 'macro avg': {'precision': 0.39602854256636333, 'recall': 0.38651773783286336, 'f1-score': 0.3832560202225828, 'support': 3023.0}, 'weighted avg': {'precision': 0.4124949665181113, 'recall': 0.4085345683096262, 'f1-score': 0.40601279016852304, 'support': 3023.0}} | 0.3833 |
+| 0.2357        | 5.0   | 4410 | 2.7721          | {'ar': {'precision': 0.42168674698795183, 'recall': 0.3723404255319149, 'f1-score': 0.3954802259887006, 'support': 376.0}, 'cl': {'precision': 0.38753799392097266, 'recall': 0.4427083333333333, 'f1-score': 0.413290113452188, 'support': 576.0}, 'co': {'precision': 0.35051546391752575, 'recall': 0.3953488372093023, 'f1-score': 0.37158469945355194, 'support': 344.0}, 'es': {'precision': 0.4642857142857143, 'recall': 0.40699815837937386, 'f1-score': 0.4337585868498528, 'support': 543.0}, 'mx': {'precision': 0.43089430894308944, 'recall': 0.43711340206185567, 'f1-score': 0.43398157625383826, 'support': 485.0}, 'pe': {'precision': 0.3407960199004975, 'recall': 0.3936781609195402, 'f1-score': 0.36533333333333334, 'support': 348.0}, 'pr': {'precision': 0.6601941747572816, 'recall': 0.6732673267326733, 'f1-score': 0.6666666666666666, 'support': 101.0}, 'uy': {'precision': 0.40853658536585363, 'recall': 0.29385964912280704, 'f1-score': 0.34183673469387754, 'support': 228.0}, 've': {'precision': 0.0, 'recall': 0.0, 'f1-score': 0.0, 'support': 22.0}, 'accuracy': 0.40886536553092956, 'macro avg': {'precision': 0.3849385564532096, 'recall': 0.3794793659212001, 'f1-score': 0.38021465963244544, 'support': 3023.0}, 'weighted avg': {'precision': 0.41080624270175103, 'recall': 0.40886536553092956, 'f1-score': 0.4078732692419294, 'support': 3023.0}}                                            | 0.3802 |
 ### Framework versions

config.json CHANGED Viewed

@@ -1,13 +1,14 @@
 {
-  "_name_or_path": "dccuchile/distilbert-base-spanish-uncased",
-  "activation": "gelu",
   "architectures": [
-    "DistilBertForSequenceClassification"
   ],
-  "attention_dropout": 0.1,
-  "dim": 768,
-  "dropout": 0.1,
-  "hidden_dim": 3072,
   "id2label": {
     "0": "ar",
     "1": "cl",
@@ -20,6 +21,7 @@
     "8": "ve"
   },
   "initializer_range": 0.02,
   "label2id": {
     "ar": 0,
     "cl": 1,
@@ -31,17 +33,18 @@
     "uy": 7,
     "ve": 8
   },
   "max_position_embeddings": 512,
-  "model_type": "distilbert",
-  "n_heads": 12,
-  "n_layers": 6,
-  "pad_token_id": 0,
   "problem_type": "single_label_classification",
-  "qa_dropout": 0.1,
-  "seq_classif_dropout": 0.2,
-  "sinusoidal_pos_embds": true,
-  "tie_weights_": true,
   "torch_dtype": "float32",
   "transformers_version": "4.48.3",
   "vocab_size": 31002
 }

 {
+  "_name_or_path": "dccuchile/bert-base-spanish-wwm-uncased",
   "architectures": [
+    "BertForSequenceClassification"
   ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
   "id2label": {
     "0": "ar",
     "1": "cl",
     "8": "ve"
   },
   "initializer_range": 0.02,
+  "intermediate_size": 3072,
   "label2id": {
     "ar": 0,
     "cl": 1,
     "uy": 7,
     "ve": 8
   },
+  "layer_norm_eps": 1e-12,
   "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "output_past": true,
+  "pad_token_id": 1,
+  "position_embedding_type": "absolute",
   "problem_type": "single_label_classification",
   "torch_dtype": "float32",
   "transformers_version": "4.48.3",
+  "type_vocab_size": 2,
+  "use_cache": true,
   "vocab_size": 31002
 }

logs/events.out.tfevents.1740157634.a2d653e866f9.226.3 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:646126b025c968bf4bd3116e12b41d96bfb11ffd3e476cc70526ebb920ce8b86
+size 354

logs/events.out.tfevents.1740162891.0a0ba32201a8.2151.21 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7ab77507abc6135face2f24050935579841c0edd04ed429b2b14a790d9de3346
+size 100428

logs/events.out.tfevents.1740163730.0a0ba32201a8.2151.22 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5c9e1f0c540ff78c3cd5ed026bc180b0a9e5b858cf3411c46ddbc70bd2f355ef
+size 405

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2e9ad0f28c73e32d964399d0a61f45d861c8a1af2235599dd7b8c5d38517ce4a
-size 269328660

 version https://git-lfs.github.com/spec/v1
+oid sha256:9640bf7ca7b6a541089109fcdb8dd4b103d14e514f0b0b70e6032897467855b5
+size 439454740

model_stats.json CHANGED Viewed

@@ -1,177 +1,96 @@
 {
   "dataset": {
-    "splits": {
       "train": {
-        "num_examples": 3553,
-        "features": [
-          "author",
-          "country",
-          "post_text",
-          "created_at",
-          "likes",
-          "quotes",
-          "replies",
-          "reposts",
-          "post_id",
-          "lang",
-          "tags",
-          "image_links",
-          "profile_info",
-          "processed_text",
-          "__index_level_0__"
-        ],
-        "first_example": {
-          "author": "apalet.bsky.social",
-          "country": "cl",
-          "post_text": "Me lloran los ojos sin pedir permiso ni razón.",
-          "created_at": "2024-12-31T01:15:04.751Z",
-          "likes": 8,
-          "quotes": 0,
-          "replies": 1,
-          "reposts": 0,
-          "post_id": "at://did:plc:y4bvfcu7wrx7jlyjg6qglqzl/app.bsky.feed.post/3lekuofg3xk2v",
-          "lang": "es",
-          "tags": "",
-          "image_links": "",
-          "profile_info": {
-            "description": "Leo y olvido \nwww.laurel.cl\nhttps://revistadossier.udp.cl",
-            "display_name": "Andrea Palet",
-            "feed_uri": null,
-            "followers_count": 1355,
-            "follows_count": 304,
-            "indexed_at": "2024-11-30T20:22:38.048Z",
-            "posts_count": 515
-          },
-          "processed_text": "lloran ojos pedir permiso razón",
-          "__index_level_0__": 4653
         },
-        "country_distribution": {
-          "ar": {
-            "count": 483,
-            "percentage": 13.594145792288206
-          },
-          "cl": {
-            "count": 614,
-            "percentage": 17.28117084154236
-          },
-          "co": {
-            "count": 399,
-            "percentage": 11.229946524064172
-          },
-          "es": {
-            "count": 774,
-            "percentage": 21.784407542921475
-          },
-          "mx": {
-            "count": 473,
-            "percentage": 13.312693498452013
-          },
-          "pe": {
-            "count": 376,
-            "percentage": 10.582606248240923
-          },
-          "pr": {
-            "count": 117,
-            "percentage": 3.2929918378834784
-          },
-          "uy": {
-            "count": 267,
-            "percentage": 7.5147762454264
-          },
-          "ve": {
-            "count": 50,
-            "percentage": 1.407261469180974
-          }
         }
       },
       "test": {
-        "num_examples": 1524,
-        "features": [
-          "author",
-          "country",
-          "post_text",
-          "created_at",
-          "likes",
-          "quotes",
-          "replies",
-          "reposts",
-          "post_id",
-          "lang",
-          "tags",
-          "image_links",
-          "profile_info",
-          "processed_text",
-          "__index_level_0__"
-        ],
-        "first_example": {
-          "author": "rpalomino.bsky.social",
-          "country": "pe",
-          "post_text": "Dos libros que he estado esperando leer hace mucho.",
-          "created_at": "2024-12-25T16:32:48.934Z",
-          "likes": 2,
-          "quotes": 0,
-          "replies": 1,
-          "reposts": 0,
-          "post_id": "at://did:plc:65xzu4se42blbypbgmki3xxv/app.bsky.feed.post/3le5f5vxtmc2h",
-          "lang": "es",
-          "tags": "",
-          "image_links": "",
-          "profile_info": {
-            "description": "Literatura y sociedad.",
-            "display_name": "Roy Palomino",
-            "feed_uri": null,
-            "followers_count": 174,
-            "follows_count": 283,
-            "indexed_at": "2024-11-25T05:12:19.445Z",
-            "posts_count": 90
-          },
-          "processed_text": "libros esperando leer",
-          "__index_level_0__": 3477
         },
-        "country_distribution": {
-          "ar": {
-            "count": 207,
-            "percentage": 13.582677165354331
-          },
-          "cl": {
-            "count": 263,
-            "percentage": 17.25721784776903
-          },
-          "co": {
-            "count": 171,
-            "percentage": 11.220472440944881
-          },
-          "es": {
-            "count": 332,
-            "percentage": 21.784776902887142
-          },
-          "mx": {
-            "count": 203,
-            "percentage": 13.32020997375328
-          },
-          "pe": {
-            "count": 161,
-            "percentage": 10.564304461942257
-          },
-          "pr": {
-            "count": 50,
-            "percentage": 3.2808398950131235
-          },
-          "uy": {
-            "count": 115,
-            "percentage": 7.545931758530183
-          },
-          "ve": {
-            "count": 22,
-            "percentage": 1.4435695538057742
-          }
         }
       }
     },
-    "processed": {
-      "train_examples": 3553,
-      "test_examples": 1524
-    }
   },
   "model": {
     "name": "dccuchile/distilbert-base-spanish-uncased",
@@ -185,152 +104,152 @@
     "hub_url": "https://huggingface.co/None/bluesky-spanish-classifier"
   },
   "training": {
-    "runtime_seconds": 97.8884,
-    "loss": 2.1454918384552,
-    "steps_per_second": 0.02
   },
   "evaluation": {
     "ar": {
-      "precision": 0.10526315789473684,
-      "recall": 0.08695652173913043,
-      "f1-score": 0.09523809523809523,
       "support": 207.0
     },
     "cl": {
-      "precision": 0.17346938775510204,
-      "recall": 0.19391634980988592,
-      "f1-score": 0.18312387791741472,
       "support": 263.0
     },
     "co": {
-      "precision": 0.06451612903225806,
-      "recall": 0.011695906432748537,
-      "f1-score": 0.019801980198019802,
       "support": 171.0
     },
     "es": {
-      "precision": 0.24783362218370883,
-      "recall": 0.4307228915662651,
-      "f1-score": 0.3146314631463146,
       "support": 332.0
     },
     "mx": {
-      "precision": 0.15086206896551724,
-      "recall": 0.1724137931034483,
-      "f1-score": 0.16091954022988506,
       "support": 203.0
     },
     "pe": {
-      "precision": 0.061946902654867256,
-      "recall": 0.043478260869565216,
-      "f1-score": 0.051094890510948905,
       "support": 161.0
     },
     "pr": {
-      "precision": 0.5,
-      "recall": 0.02,
-      "f1-score": 0.038461538461538464,
       "support": 50.0
     },
     "uy": {
-      "precision": 0.3181818181818182,
-      "recall": 0.06086956521739131,
-      "f1-score": 0.10218978102189781,
       "support": 115.0
     },
     "ve": {
-      "precision": 0.012195121951219513,
-      "recall": 0.045454545454545456,
-      "f1-score": 0.019230769230769232,
       "support": 22.0
     },
-    "accuracy": 0.17388451443569553,
     "macro avg": {
-      "precision": 0.18158535651324753,
-      "recall": 0.11838975935477558,
-      "f1-score": 0.10941021510609822,
       "support": 1524.0
     },
     "weighted avg": {
-      "precision": 0.1726919923848946,
-      "recall": 0.17388451443569553,
-      "f1-score": 0.151384890214964,
       "support": 1524.0
     },
     "final": {
-      "eval_loss": 2.181152582168579,
       "eval_classification_report": {
         "ar": {
-          "precision": 0.10526315789473684,
-          "recall": 0.08695652173913043,
-          "f1-score": 0.09523809523809523,
           "support": 207.0
         },
         "cl": {
-          "precision": 0.17346938775510204,
-          "recall": 0.19391634980988592,
-          "f1-score": 0.18312387791741472,
           "support": 263.0
         },
         "co": {
-          "precision": 0.06451612903225806,
-          "recall": 0.011695906432748537,
-          "f1-score": 0.019801980198019802,
           "support": 171.0
         },
         "es": {
-          "precision": 0.24783362218370883,
-          "recall": 0.4307228915662651,
-          "f1-score": 0.3146314631463146,
           "support": 332.0
         },
         "mx": {
-          "precision": 0.15086206896551724,
-          "recall": 0.1724137931034483,
-          "f1-score": 0.16091954022988506,
           "support": 203.0
         },
         "pe": {
-          "precision": 0.061946902654867256,
-          "recall": 0.043478260869565216,
-          "f1-score": 0.051094890510948905,
           "support": 161.0
         },
         "pr": {
-          "precision": 0.5,
-          "recall": 0.02,
-          "f1-score": 0.038461538461538464,
           "support": 50.0
         },
         "uy": {
-          "precision": 0.3181818181818182,
-          "recall": 0.06086956521739131,
-          "f1-score": 0.10218978102189781,
           "support": 115.0
         },
         "ve": {
-          "precision": 0.012195121951219513,
-          "recall": 0.045454545454545456,
-          "f1-score": 0.019230769230769232,
           "support": 22.0
         },
-        "accuracy": 0.17388451443569553,
         "macro avg": {
-          "precision": 0.18158535651324753,
-          "recall": 0.11838975935477558,
-          "f1-score": 0.10941021510609822,
           "support": 1524.0
         },
         "weighted avg": {
-          "precision": 0.1726919923848946,
-          "recall": 0.17388451443569553,
-          "f1-score": 0.151384890214964,
           "support": 1524.0
         }
       },
-      "eval_runtime": 97.6642,
-      "eval_samples_per_second": 15.604,
-      "eval_steps_per_second": 3.901,
       "epoch": 0.0022497187851518562
     }
   }

 {
   "dataset": {
+    "train_size": 3553,
+    "test_size": 1524,
+    "country_distribution": {
       "train": {
+        "ar": {
+          "count": 483,
+          "percentage": 13.594145792288206
+        },
+        "cl": {
+          "count": 614,
+          "percentage": 17.28117084154236
+        },
+        "co": {
+          "count": 399,
+          "percentage": 11.229946524064172
+        },
+        "es": {
+          "count": 774,
+          "percentage": 21.784407542921475
+        },
+        "mx": {
+          "count": 473,
+          "percentage": 13.312693498452013
         },
+        "pe": {
+          "count": 376,
+          "percentage": 10.582606248240923
+        },
+        "pr": {
+          "count": 117,
+          "percentage": 3.2929918378834784
+        },
+        "uy": {
+          "count": 267,
+          "percentage": 7.5147762454264
+        },
+        "ve": {
+          "count": 50,
+          "percentage": 1.407261469180974
         }
       },
       "test": {
+        "ar": {
+          "count": 207,
+          "percentage": 13.582677165354331
         },
+        "cl": {
+          "count": 263,
+          "percentage": 17.25721784776903
+        },
+        "co": {
+          "count": 171,
+          "percentage": 11.220472440944881
+        },
+        "es": {
+          "count": 332,
+          "percentage": 21.784776902887142
+        },
+        "mx": {
+          "count": 203,
+          "percentage": 13.32020997375328
+        },
+        "pe": {
+          "count": 161,
+          "percentage": 10.564304461942257
+        },
+        "pr": {
+          "count": 50,
+          "percentage": 3.2808398950131235
+        },
+        "uy": {
+          "count": 115,
+          "percentage": 7.545931758530183
+        },
+        "ve": {
+          "count": 22,
+          "percentage": 1.4435695538057742
         }
       }
     },
+    "unique_countries": [
+      "ar",
+      "cl",
+      "co",
+      "es",
+      "mx",
+      "pe",
+      "pr",
+      "uy",
+      "ve"
+    ]
   },
   "model": {
     "name": "dccuchile/distilbert-base-spanish-uncased",
     "hub_url": "https://huggingface.co/None/bluesky-spanish-classifier"
   },
   "training": {
+    "runtime_seconds": 105.9611,
+    "loss": 2.257941484451294,
+    "steps_per_second": 0.019
   },
   "evaluation": {
     "ar": {
+      "precision": 0.125,
+      "recall": 0.014492753623188406,
+      "f1-score": 0.025974025974025976,
       "support": 207.0
     },
     "cl": {
+      "precision": 0.0,
+      "recall": 0.0,
+      "f1-score": 0.0,
       "support": 263.0
     },
     "co": {
+      "precision": 0.0,
+      "recall": 0.0,
+      "f1-score": 0.0,
       "support": 171.0
     },
     "es": {
+      "precision": 0.6666666666666666,
+      "recall": 0.006024096385542169,
+      "f1-score": 0.011940298507462687,
       "support": 332.0
     },
     "mx": {
+      "precision": 0.0,
+      "recall": 0.0,
+      "f1-score": 0.0,
       "support": 203.0
     },
     "pe": {
+      "precision": 0.03333333333333333,
+      "recall": 0.006211180124223602,
+      "f1-score": 0.010471204188481676,
       "support": 161.0
     },
     "pr": {
+      "precision": 0.09401709401709402,
+      "recall": 0.22,
+      "f1-score": 0.1317365269461078,
       "support": 50.0
     },
     "uy": {
+      "precision": 0.07073715562174236,
+      "recall": 0.8260869565217391,
+      "f1-score": 0.13031550068587106,
       "support": 115.0
     },
     "ve": {
+      "precision": 0.0,
+      "recall": 0.0,
+      "f1-score": 0.0,
       "support": 22.0
     },
+    "accuracy": 0.07349081364829396,
     "macro avg": {
+      "precision": 0.10997269440431515,
+      "recall": 0.1192016651838548,
+      "f1-score": 0.03449306181132769,
       "support": 1524.0
     },
     "weighted avg": {
+      "precision": 0.17415395511637471,
+      "recall": 0.07349081364829396,
+      "f1-score": 0.021390928662484977,
       "support": 1524.0
     },
     "final": {
+      "eval_loss": 2.2149105072021484,
       "eval_classification_report": {
         "ar": {
+          "precision": 0.125,
+          "recall": 0.014492753623188406,
+          "f1-score": 0.025974025974025976,
           "support": 207.0
         },
         "cl": {
+          "precision": 0.0,
+          "recall": 0.0,
+          "f1-score": 0.0,
           "support": 263.0
         },
         "co": {
+          "precision": 0.0,
+          "recall": 0.0,
+          "f1-score": 0.0,
           "support": 171.0
         },
         "es": {
+          "precision": 0.6666666666666666,
+          "recall": 0.006024096385542169,
+          "f1-score": 0.011940298507462687,
           "support": 332.0
         },
         "mx": {
+          "precision": 0.0,
+          "recall": 0.0,
+          "f1-score": 0.0,
           "support": 203.0
         },
         "pe": {
+          "precision": 0.03333333333333333,
+          "recall": 0.006211180124223602,
+          "f1-score": 0.010471204188481676,
           "support": 161.0
         },
         "pr": {
+          "precision": 0.09401709401709402,
+          "recall": 0.22,
+          "f1-score": 0.1317365269461078,
           "support": 50.0
         },
         "uy": {
+          "precision": 0.07073715562174236,
+          "recall": 0.8260869565217391,
+          "f1-score": 0.13031550068587106,
           "support": 115.0
         },
         "ve": {
+          "precision": 0.0,
+          "recall": 0.0,
+          "f1-score": 0.0,
           "support": 22.0
         },
+        "accuracy": 0.07349081364829396,
         "macro avg": {
+          "precision": 0.10997269440431515,
+          "recall": 0.1192016651838548,
+          "f1-score": 0.03449306181132769,
           "support": 1524.0
         },
         "weighted avg": {
+          "precision": 0.17415395511637471,
+          "recall": 0.07349081364829396,
+          "f1-score": 0.021390928662484977,
           "support": 1524.0
         }
       },
+      "eval_runtime": 98.563,
+      "eval_samples_per_second": 15.462,
+      "eval_steps_per_second": 3.866,
       "epoch": 0.0022497187851518562
     }
   }

tokenizer.json CHANGED Viewed

@@ -2,13 +2,13 @@
   "version": "1.0",
   "truncation": {
     "direction": "Right",
-    "max_length": 32,
     "strategy": "LongestFirst",
     "stride": 0
   },
   "padding": {
     "strategy": {
-      "Fixed": 32
     },
     "direction": "Right",
     "pad_to_multiple_of": null,

   "version": "1.0",
   "truncation": {
     "direction": "Right",
+    "max_length": 64,
     "strategy": "LongestFirst",
     "stride": 0
   },
   "padding": {
     "strategy": {
+      "Fixed": 64
     },
     "direction": "Right",
     "pad_to_multiple_of": null,

tokenizer_config.json CHANGED Viewed

@@ -53,6 +53,6 @@
   "sep_token": "[SEP]",
   "strip_accents": false,
   "tokenize_chinese_chars": true,
-  "tokenizer_class": "DistilBertTokenizer",
   "unk_token": "[UNK]"
 }

   "sep_token": "[SEP]",
   "strip_accents": false,
   "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
   "unk_token": "[UNK]"
 }

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6a931bb071306bc2c9f6731ed0c069d5875fa5eab471d84947b67f65d2ef43f3
-size 5368

 version https://git-lfs.github.com/spec/v1
+oid sha256:a2de174b6ea17c52db95df91a80925879ae293fdc8fa93e84445ba29d1a5e95b
+size 5432

trial_0/checkpoint-292/config.json ADDED Viewed

	@@ -0,0 +1,50 @@

+{
+  "_name_or_path": "dccuchile/bert-base-spanish-wwm-uncased",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "ar",
+    "1": "cl",
+    "2": "co",
+    "3": "es",
+    "4": "mx",
+    "5": "pe",
+    "6": "pr",
+    "7": "uy",
+    "8": "ve"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "ar": 0,
+    "cl": 1,
+    "co": 2,
+    "es": 3,
+    "mx": 4,
+    "pe": 5,
+    "pr": 6,
+    "uy": 7,
+    "ve": 8
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "output_past": true,
+  "pad_token_id": 1,
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.48.3",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 31002
+}

trial_0/checkpoint-292/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:76e0b013258938faa56136402a7e40a933eef90038e3f931c5780cf4f69b10bd
+size 439454740

trial_0/checkpoint-292/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:751bd43e029cbd1d226e60e6a4fd7af47fee03b3990b3f6a8ecbc3ec83eeba06
+size 879030522

trial_0/checkpoint-292/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b0df68380976b6dbabd78e6cbea5eb7a814681ecd61ae85ed04b274788a2e922
+size 14244

trial_0/checkpoint-292/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1778d089cccff46f89357266568881d0aa63539ed46bc3a93cfb7fba7fc007c3
+size 1064

trial_0/checkpoint-292/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,37 @@

+{
+  "cls_token": {
+    "content": "[CLS]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "mask_token": {
+    "content": "[MASK]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "[PAD]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "sep_token": {
+    "content": "[SEP]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "unk_token": {
+    "content": "[UNK]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
+}

trial_0/checkpoint-292/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

trial_0/checkpoint-292/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,58 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "3": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "4": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "5": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": false,
+  "cls_token": "[CLS]",
+  "do_basic_tokenize": true,
+  "do_lower_case": true,
+  "extra_special_tokens": {},
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "never_split": null,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": false,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "unk_token": "[UNK]"
+}

trial_0/checkpoint-292/trainer_state.json ADDED Viewed

	@@ -0,0 +1,314 @@

+{
+  "best_metric": 0.2140692864641761,
+  "best_model_checkpoint": "/content/drive/MyDrive/model_outputs/trial_0/checkpoint-292",
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 292,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.03424657534246575,
+      "grad_norm": 8.432939529418945,
+      "learning_rate": 8.18270817933484e-07,
+      "loss": 2.2234,
+      "step": 10
+    },
+    {
+      "epoch": 0.0684931506849315,
+      "grad_norm": 8.3140230178833,
+      "learning_rate": 1.636541635866968e-06,
+      "loss": 2.2403,
+      "step": 20
+    },
+    {
+      "epoch": 0.10273972602739725,
+      "grad_norm": 7.506945610046387,
+      "learning_rate": 2.454812453800452e-06,
+      "loss": 2.2297,
+      "step": 30
+    },
+    {
+      "epoch": 0.136986301369863,
+      "grad_norm": 8.531285285949707,
+      "learning_rate": 3.273083271733936e-06,
+      "loss": 2.1823,
+      "step": 40
+    },
+    {
+      "epoch": 0.17123287671232876,
+      "grad_norm": 7.951968669891357,
+      "learning_rate": 4.091354089667421e-06,
+      "loss": 2.1696,
+      "step": 50
+    },
+    {
+      "epoch": 0.2054794520547945,
+      "grad_norm": 8.328391075134277,
+      "learning_rate": 4.909624907600904e-06,
+      "loss": 2.1415,
+      "step": 60
+    },
+    {
+      "epoch": 0.23972602739726026,
+      "grad_norm": 7.337668418884277,
+      "learning_rate": 5.727895725534388e-06,
+      "loss": 2.1206,
+      "step": 70
+    },
+    {
+      "epoch": 0.273972602739726,
+      "grad_norm": 7.09800386428833,
+      "learning_rate": 6.546166543467872e-06,
+      "loss": 2.0949,
+      "step": 80
+    },
+    {
+      "epoch": 0.3082191780821918,
+      "grad_norm": 6.549777507781982,
+      "learning_rate": 7.364437361401356e-06,
+      "loss": 2.076,
+      "step": 90
+    },
+    {
+      "epoch": 0.3424657534246575,
+      "grad_norm": 7.464539051055908,
+      "learning_rate": 8.182708179334841e-06,
+      "loss": 2.096,
+      "step": 100
+    },
+    {
+      "epoch": 0.3767123287671233,
+      "grad_norm": 6.982883930206299,
+      "learning_rate": 9.000978997268324e-06,
+      "loss": 2.0615,
+      "step": 110
+    },
+    {
+      "epoch": 0.410958904109589,
+      "grad_norm": 7.149113655090332,
+      "learning_rate": 9.819249815201808e-06,
+      "loss": 2.0785,
+      "step": 120
+    },
+    {
+      "epoch": 0.4452054794520548,
+      "grad_norm": 6.507534503936768,
+      "learning_rate": 1.0637520633135292e-05,
+      "loss": 2.0865,
+      "step": 130
+    },
+    {
+      "epoch": 0.4794520547945205,
+      "grad_norm": 6.1932196617126465,
+      "learning_rate": 1.1455791451068777e-05,
+      "loss": 2.0533,
+      "step": 140
+    },
+    {
+      "epoch": 0.5136986301369864,
+      "grad_norm": 7.072916507720947,
+      "learning_rate": 1.1783771409556479e-05,
+      "loss": 2.0613,
+      "step": 150
+    },
+    {
+      "epoch": 0.547945205479452,
+      "grad_norm": 8.155049324035645,
+      "learning_rate": 1.1621460508598402e-05,
+      "loss": 2.0284,
+      "step": 160
+    },
+    {
+      "epoch": 0.5821917808219178,
+      "grad_norm": 9.3668851852417,
+      "learning_rate": 1.1459149607640322e-05,
+      "loss": 2.0137,
+      "step": 170
+    },
+    {
+      "epoch": 0.6164383561643836,
+      "grad_norm": 8.165146827697754,
+      "learning_rate": 1.1296838706682245e-05,
+      "loss": 1.9835,
+      "step": 180
+    },
+    {
+      "epoch": 0.6506849315068494,
+      "grad_norm": 9.0431547164917,
+      "learning_rate": 1.1134527805724166e-05,
+      "loss": 1.9934,
+      "step": 190
+    },
+    {
+      "epoch": 0.684931506849315,
+      "grad_norm": 8.92784309387207,
+      "learning_rate": 1.0972216904766088e-05,
+      "loss": 2.0081,
+      "step": 200
+    },
+    {
+      "epoch": 0.7191780821917808,
+      "grad_norm": 9.184441566467285,
+      "learning_rate": 1.0809906003808009e-05,
+      "loss": 1.9567,
+      "step": 210
+    },
+    {
+      "epoch": 0.7534246575342466,
+      "grad_norm": 10.262762069702148,
+      "learning_rate": 1.0647595102849931e-05,
+      "loss": 1.966,
+      "step": 220
+    },
+    {
+      "epoch": 0.7876712328767124,
+      "grad_norm": 7.367489337921143,
+      "learning_rate": 1.0485284201891854e-05,
+      "loss": 2.051,
+      "step": 230
+    },
+    {
+      "epoch": 0.821917808219178,
+      "grad_norm": 8.76405143737793,
+      "learning_rate": 1.0322973300933776e-05,
+      "loss": 2.0785,
+      "step": 240
+    },
+    {
+      "epoch": 0.8561643835616438,
+      "grad_norm": 7.100874900817871,
+      "learning_rate": 1.0160662399975697e-05,
+      "loss": 1.9977,
+      "step": 250
+    },
+    {
+      "epoch": 0.8904109589041096,
+      "grad_norm": 8.239387512207031,
+      "learning_rate": 9.998351499017618e-06,
+      "loss": 2.0099,
+      "step": 260
+    },
+    {
+      "epoch": 0.9246575342465754,
+      "grad_norm": 7.704412460327148,
+      "learning_rate": 9.83604059805954e-06,
+      "loss": 1.9851,
+      "step": 270
+    },
+    {
+      "epoch": 0.958904109589041,
+      "grad_norm": 7.8163652420043945,
+      "learning_rate": 9.673729697101463e-06,
+      "loss": 2.0085,
+      "step": 280
+    },
+    {
+      "epoch": 0.9931506849315068,
+      "grad_norm": 8.153071403503418,
+      "learning_rate": 9.511418796143383e-06,
+      "loss": 1.9962,
+      "step": 290
+    },
+    {
+      "epoch": 1.0,
+      "eval_classification_report": {
+        "accuracy": 0.2375,
+        "ar": {
+          "f1-score": 0.0622568093385214,
+          "precision": 0.1568627450980392,
+          "recall": 0.038834951456310676,
+          "support": 206.0
+        },
+        "cl": {
+          "f1-score": 0.2011173184357542,
+          "precision": 0.16901408450704225,
+          "recall": 0.2482758620689655,
+          "support": 290.0
+        },
+        "co": {
+          "f1-score": 0.31543624161073824,
+          "precision": 0.23383084577114427,
+          "recall": 0.4845360824742268,
+          "support": 291.0
+        },
+        "es": {
+          "f1-score": 0.27364185110663986,
+          "precision": 0.3119266055045872,
+          "recall": 0.24372759856630824,
+          "support": 279.0
+        },
+        "macro avg": {
+          "f1-score": 0.2140692864641761,
+          "precision": 0.24922489036795273,
+          "recall": 0.22042150190811827,
+          "support": 2000.0
+        },
+        "mx": {
+          "f1-score": 0.22950819672131148,
+          "precision": 0.28426395939086296,
+          "recall": 0.19243986254295534,
+          "support": 291.0
+        },
+        "pe": {
+          "f1-score": 0.10610079575596817,
+          "precision": 0.23255813953488372,
+          "recall": 0.06872852233676977,
+          "support": 291.0
+        },
+        "pr": {
+          "f1-score": 0.5030674846625767,
+          "precision": 0.6612903225806451,
+          "recall": 0.40594059405940597,
+          "support": 101.0
+        },
+        "uy": {
+          "f1-score": 0.2354948805460751,
+          "precision": 0.19327731092436976,
+          "recall": 0.30131004366812225,
+          "support": 229.0
+        },
+        "ve": {
+          "f1-score": 0.0,
+          "precision": 0.0,
+          "recall": 0.0,
+          "support": 22.0
+        },
+        "weighted avg": {
+          "f1-score": 0.22084365412222065,
+          "precision": 0.24892308331106963,
+          "recall": 0.2375,
+          "support": 2000.0
+        }
+      },
+      "eval_f1": 0.2140692864641761,
+      "eval_loss": 1.964627742767334,
+      "eval_runtime": 3.948,
+      "eval_samples_per_second": 506.591,
+      "eval_steps_per_second": 31.662,
+      "step": 292
+    }
+  ],
+  "logging_steps": 10,
+  "max_steps": 876,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 306938335993344.0,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": null
+}

trial_0/checkpoint-292/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cf983bab71d39717083fd85c30b7e0fd950e8d457e647f61a7ff596cb390b138
+size 5368

trial_0/checkpoint-292/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

trial_0/checkpoint-584/config.json ADDED Viewed

	@@ -0,0 +1,50 @@

+{
+  "_name_or_path": "dccuchile/bert-base-spanish-wwm-uncased",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "ar",
+    "1": "cl",
+    "2": "co",
+    "3": "es",
+    "4": "mx",
+    "5": "pe",
+    "6": "pr",
+    "7": "uy",
+    "8": "ve"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "ar": 0,
+    "cl": 1,
+    "co": 2,
+    "es": 3,
+    "mx": 4,
+    "pe": 5,
+    "pr": 6,
+    "uy": 7,
+    "ve": 8
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "output_past": true,
+  "pad_token_id": 1,
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.48.3",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 31002
+}

trial_0/checkpoint-584/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c4bd824eba668c9f99dbdde707cc6253632a9e5404c4c7bef800e5dba0b97408
+size 439454740

trial_0/checkpoint-584/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d9e5a12946127f3bcd02446e83b50c11c5b9bd0d42c2769ab3843e2416a6ea45
+size 879030522

trial_0/checkpoint-584/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:29298f33af39c877ad364d333a5cea911258abeb5e708833407727da7ed21d36
+size 14244

trial_0/checkpoint-584/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b3ae5ac764505bf16f8c0111375ef98ea91c30113225dcd6204117dc37e31e3b
+size 1064

trial_0/checkpoint-584/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,37 @@

+{
+  "cls_token": {
+    "content": "[CLS]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "mask_token": {
+    "content": "[MASK]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "[PAD]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "sep_token": {
+    "content": "[SEP]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "unk_token": {
+    "content": "[UNK]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
+}

trial_0/checkpoint-584/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

trial_0/checkpoint-584/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,58 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "3": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "4": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "5": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": false,
+  "cls_token": "[CLS]",
+  "do_basic_tokenize": true,
+  "do_lower_case": true,
+  "extra_special_tokens": {},
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "never_split": null,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": false,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "unk_token": "[UNK]"
+}

trial_0/checkpoint-584/trainer_state.json ADDED Viewed

	@@ -0,0 +1,595 @@

+{
+  "best_metric": 0.28404923689784706,
+  "best_model_checkpoint": "/content/drive/MyDrive/model_outputs/trial_0/checkpoint-584",
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 584,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.03424657534246575,
+      "grad_norm": 8.432939529418945,
+      "learning_rate": 8.18270817933484e-07,
+      "loss": 2.2234,
+      "step": 10
+    },
+    {
+      "epoch": 0.0684931506849315,
+      "grad_norm": 8.3140230178833,
+      "learning_rate": 1.636541635866968e-06,
+      "loss": 2.2403,
+      "step": 20
+    },
+    {
+      "epoch": 0.10273972602739725,
+      "grad_norm": 7.506945610046387,
+      "learning_rate": 2.454812453800452e-06,
+      "loss": 2.2297,
+      "step": 30
+    },
+    {
+      "epoch": 0.136986301369863,
+      "grad_norm": 8.531285285949707,
+      "learning_rate": 3.273083271733936e-06,
+      "loss": 2.1823,
+      "step": 40
+    },
+    {
+      "epoch": 0.17123287671232876,
+      "grad_norm": 7.951968669891357,
+      "learning_rate": 4.091354089667421e-06,
+      "loss": 2.1696,
+      "step": 50
+    },
+    {
+      "epoch": 0.2054794520547945,
+      "grad_norm": 8.328391075134277,
+      "learning_rate": 4.909624907600904e-06,
+      "loss": 2.1415,
+      "step": 60
+    },
+    {
+      "epoch": 0.23972602739726026,
+      "grad_norm": 7.337668418884277,
+      "learning_rate": 5.727895725534388e-06,
+      "loss": 2.1206,
+      "step": 70
+    },
+    {
+      "epoch": 0.273972602739726,
+      "grad_norm": 7.09800386428833,
+      "learning_rate": 6.546166543467872e-06,
+      "loss": 2.0949,
+      "step": 80
+    },
+    {
+      "epoch": 0.3082191780821918,
+      "grad_norm": 6.549777507781982,
+      "learning_rate": 7.364437361401356e-06,
+      "loss": 2.076,
+      "step": 90
+    },
+    {
+      "epoch": 0.3424657534246575,
+      "grad_norm": 7.464539051055908,
+      "learning_rate": 8.182708179334841e-06,
+      "loss": 2.096,
+      "step": 100
+    },
+    {
+      "epoch": 0.3767123287671233,
+      "grad_norm": 6.982883930206299,
+      "learning_rate": 9.000978997268324e-06,
+      "loss": 2.0615,
+      "step": 110
+    },
+    {
+      "epoch": 0.410958904109589,
+      "grad_norm": 7.149113655090332,
+      "learning_rate": 9.819249815201808e-06,
+      "loss": 2.0785,
+      "step": 120
+    },
+    {
+      "epoch": 0.4452054794520548,
+      "grad_norm": 6.507534503936768,
+      "learning_rate": 1.0637520633135292e-05,
+      "loss": 2.0865,
+      "step": 130
+    },
+    {
+      "epoch": 0.4794520547945205,
+      "grad_norm": 6.1932196617126465,
+      "learning_rate": 1.1455791451068777e-05,
+      "loss": 2.0533,
+      "step": 140
+    },
+    {
+      "epoch": 0.5136986301369864,
+      "grad_norm": 7.072916507720947,
+      "learning_rate": 1.1783771409556479e-05,
+      "loss": 2.0613,
+      "step": 150
+    },
+    {
+      "epoch": 0.547945205479452,
+      "grad_norm": 8.155049324035645,
+      "learning_rate": 1.1621460508598402e-05,
+      "loss": 2.0284,
+      "step": 160
+    },
+    {
+      "epoch": 0.5821917808219178,
+      "grad_norm": 9.3668851852417,
+      "learning_rate": 1.1459149607640322e-05,
+      "loss": 2.0137,
+      "step": 170
+    },
+    {
+      "epoch": 0.6164383561643836,
+      "grad_norm": 8.165146827697754,
+      "learning_rate": 1.1296838706682245e-05,
+      "loss": 1.9835,
+      "step": 180
+    },
+    {
+      "epoch": 0.6506849315068494,
+      "grad_norm": 9.0431547164917,
+      "learning_rate": 1.1134527805724166e-05,
+      "loss": 1.9934,
+      "step": 190
+    },
+    {
+      "epoch": 0.684931506849315,
+      "grad_norm": 8.92784309387207,
+      "learning_rate": 1.0972216904766088e-05,
+      "loss": 2.0081,
+      "step": 200
+    },
+    {
+      "epoch": 0.7191780821917808,
+      "grad_norm": 9.184441566467285,
+      "learning_rate": 1.0809906003808009e-05,
+      "loss": 1.9567,
+      "step": 210
+    },
+    {
+      "epoch": 0.7534246575342466,
+      "grad_norm": 10.262762069702148,
+      "learning_rate": 1.0647595102849931e-05,
+      "loss": 1.966,
+      "step": 220
+    },
+    {
+      "epoch": 0.7876712328767124,
+      "grad_norm": 7.367489337921143,
+      "learning_rate": 1.0485284201891854e-05,
+      "loss": 2.051,
+      "step": 230
+    },
+    {
+      "epoch": 0.821917808219178,
+      "grad_norm": 8.76405143737793,
+      "learning_rate": 1.0322973300933776e-05,
+      "loss": 2.0785,
+      "step": 240
+    },
+    {
+      "epoch": 0.8561643835616438,
+      "grad_norm": 7.100874900817871,
+      "learning_rate": 1.0160662399975697e-05,
+      "loss": 1.9977,
+      "step": 250
+    },
+    {
+      "epoch": 0.8904109589041096,
+      "grad_norm": 8.239387512207031,
+      "learning_rate": 9.998351499017618e-06,
+      "loss": 2.0099,
+      "step": 260
+    },
+    {
+      "epoch": 0.9246575342465754,
+      "grad_norm": 7.704412460327148,
+      "learning_rate": 9.83604059805954e-06,
+      "loss": 1.9851,
+      "step": 270
+    },
+    {
+      "epoch": 0.958904109589041,
+      "grad_norm": 7.8163652420043945,
+      "learning_rate": 9.673729697101463e-06,
+      "loss": 2.0085,
+      "step": 280
+    },
+    {
+      "epoch": 0.9931506849315068,
+      "grad_norm": 8.153071403503418,
+      "learning_rate": 9.511418796143383e-06,
+      "loss": 1.9962,
+      "step": 290
+    },
+    {
+      "epoch": 1.0,
+      "eval_classification_report": {
+        "accuracy": 0.2375,
+        "ar": {
+          "f1-score": 0.0622568093385214,
+          "precision": 0.1568627450980392,
+          "recall": 0.038834951456310676,
+          "support": 206.0
+        },
+        "cl": {
+          "f1-score": 0.2011173184357542,
+          "precision": 0.16901408450704225,
+          "recall": 0.2482758620689655,
+          "support": 290.0
+        },
+        "co": {
+          "f1-score": 0.31543624161073824,
+          "precision": 0.23383084577114427,
+          "recall": 0.4845360824742268,
+          "support": 291.0
+        },
+        "es": {
+          "f1-score": 0.27364185110663986,
+          "precision": 0.3119266055045872,
+          "recall": 0.24372759856630824,
+          "support": 279.0
+        },
+        "macro avg": {
+          "f1-score": 0.2140692864641761,
+          "precision": 0.24922489036795273,
+          "recall": 0.22042150190811827,
+          "support": 2000.0
+        },
+        "mx": {
+          "f1-score": 0.22950819672131148,
+          "precision": 0.28426395939086296,
+          "recall": 0.19243986254295534,
+          "support": 291.0
+        },
+        "pe": {
+          "f1-score": 0.10610079575596817,
+          "precision": 0.23255813953488372,
+          "recall": 0.06872852233676977,
+          "support": 291.0
+        },
+        "pr": {
+          "f1-score": 0.5030674846625767,
+          "precision": 0.6612903225806451,
+          "recall": 0.40594059405940597,
+          "support": 101.0
+        },
+        "uy": {
+          "f1-score": 0.2354948805460751,
+          "precision": 0.19327731092436976,
+          "recall": 0.30131004366812225,
+          "support": 229.0
+        },
+        "ve": {
+          "f1-score": 0.0,
+          "precision": 0.0,
+          "recall": 0.0,
+          "support": 22.0
+        },
+        "weighted avg": {
+          "f1-score": 0.22084365412222065,
+          "precision": 0.24892308331106963,
+          "recall": 0.2375,
+          "support": 2000.0
+        }
+      },
+      "eval_f1": 0.2140692864641761,
+      "eval_loss": 1.964627742767334,
+      "eval_runtime": 3.948,
+      "eval_samples_per_second": 506.591,
+      "eval_steps_per_second": 31.662,
+      "step": 292
+    },
+    {
+      "epoch": 1.0273972602739727,
+      "grad_norm": 7.403143882751465,
+      "learning_rate": 9.349107895185306e-06,
+      "loss": 1.9144,
+      "step": 300
+    },
+    {
+      "epoch": 1.0616438356164384,
+      "grad_norm": 7.673084735870361,
+      "learning_rate": 9.186796994227228e-06,
+      "loss": 1.8783,
+      "step": 310
+    },
+    {
+      "epoch": 1.095890410958904,
+      "grad_norm": 7.875649452209473,
+      "learning_rate": 9.024486093269149e-06,
+      "loss": 1.9275,
+      "step": 320
+    },
+    {
+      "epoch": 1.13013698630137,
+      "grad_norm": 8.519344329833984,
+      "learning_rate": 8.86217519231107e-06,
+      "loss": 1.9603,
+      "step": 330
+    },
+    {
+      "epoch": 1.1643835616438356,
+      "grad_norm": 11.323283195495605,
+      "learning_rate": 8.699864291352992e-06,
+      "loss": 1.923,
+      "step": 340
+    },
+    {
+      "epoch": 1.1986301369863013,
+      "grad_norm": 8.269103050231934,
+      "learning_rate": 8.537553390394915e-06,
+      "loss": 1.9427,
+      "step": 350
+    },
+    {
+      "epoch": 1.2328767123287672,
+      "grad_norm": 9.630481719970703,
+      "learning_rate": 8.375242489436837e-06,
+      "loss": 1.8944,
+      "step": 360
+    },
+    {
+      "epoch": 1.2671232876712328,
+      "grad_norm": 10.00069808959961,
+      "learning_rate": 8.212931588478758e-06,
+      "loss": 1.8854,
+      "step": 370
+    },
+    {
+      "epoch": 1.3013698630136985,
+      "grad_norm": 10.448683738708496,
+      "learning_rate": 8.05062068752068e-06,
+      "loss": 1.9484,
+      "step": 380
+    },
+    {
+      "epoch": 1.3356164383561644,
+      "grad_norm": 9.772107124328613,
+      "learning_rate": 7.888309786562601e-06,
+      "loss": 1.8663,
+      "step": 390
+    },
+    {
+      "epoch": 1.36986301369863,
+      "grad_norm": 10.358853340148926,
+      "learning_rate": 7.725998885604523e-06,
+      "loss": 1.9082,
+      "step": 400
+    },
+    {
+      "epoch": 1.404109589041096,
+      "grad_norm": 11.836031913757324,
+      "learning_rate": 7.563687984646444e-06,
+      "loss": 1.881,
+      "step": 410
+    },
+    {
+      "epoch": 1.4383561643835616,
+      "grad_norm": 11.461163520812988,
+      "learning_rate": 7.401377083688367e-06,
+      "loss": 1.964,
+      "step": 420
+    },
+    {
+      "epoch": 1.4726027397260273,
+      "grad_norm": 9.836813926696777,
+      "learning_rate": 7.239066182730289e-06,
+      "loss": 1.8552,
+      "step": 430
+    },
+    {
+      "epoch": 1.5068493150684932,
+      "grad_norm": 12.651612281799316,
+      "learning_rate": 7.076755281772211e-06,
+      "loss": 1.8211,
+      "step": 440
+    },
+    {
+      "epoch": 1.541095890410959,
+      "grad_norm": 10.353775024414062,
+      "learning_rate": 6.9144443808141315e-06,
+      "loss": 1.905,
+      "step": 450
+    },
+    {
+      "epoch": 1.5753424657534247,
+      "grad_norm": 9.688141822814941,
+      "learning_rate": 6.752133479856054e-06,
+      "loss": 1.8525,
+      "step": 460
+    },
+    {
+      "epoch": 1.6095890410958904,
+      "grad_norm": 10.979829788208008,
+      "learning_rate": 6.5898225788979756e-06,
+      "loss": 1.8468,
+      "step": 470
+    },
+    {
+      "epoch": 1.643835616438356,
+      "grad_norm": 11.913898468017578,
+      "learning_rate": 6.427511677939898e-06,
+      "loss": 1.8301,
+      "step": 480
+    },
+    {
+      "epoch": 1.678082191780822,
+      "grad_norm": 9.506439208984375,
+      "learning_rate": 6.265200776981819e-06,
+      "loss": 1.9175,
+      "step": 490
+    },
+    {
+      "epoch": 1.7123287671232876,
+      "grad_norm": 11.259939193725586,
+      "learning_rate": 6.102889876023741e-06,
+      "loss": 1.8674,
+      "step": 500
+    },
+    {
+      "epoch": 1.7465753424657535,
+      "grad_norm": 10.506684303283691,
+      "learning_rate": 5.940578975065663e-06,
+      "loss": 1.8201,
+      "step": 510
+    },
+    {
+      "epoch": 1.7808219178082192,
+      "grad_norm": 10.255843162536621,
+      "learning_rate": 5.7782680741075844e-06,
+      "loss": 1.83,
+      "step": 520
+    },
+    {
+      "epoch": 1.8150684931506849,
+      "grad_norm": 10.053559303283691,
+      "learning_rate": 5.615957173149507e-06,
+      "loss": 1.8929,
+      "step": 530
+    },
+    {
+      "epoch": 1.8493150684931505,
+      "grad_norm": 11.122831344604492,
+      "learning_rate": 5.4536462721914285e-06,
+      "loss": 1.8836,
+      "step": 540
+    },
+    {
+      "epoch": 1.8835616438356164,
+      "grad_norm": 10.520340919494629,
+      "learning_rate": 5.29133537123335e-06,
+      "loss": 1.8587,
+      "step": 550
+    },
+    {
+      "epoch": 1.9178082191780823,
+      "grad_norm": 10.444989204406738,
+      "learning_rate": 5.129024470275272e-06,
+      "loss": 1.9133,
+      "step": 560
+    },
+    {
+      "epoch": 1.952054794520548,
+      "grad_norm": 9.19580078125,
+      "learning_rate": 4.966713569317194e-06,
+      "loss": 1.7403,
+      "step": 570
+    },
+    {
+      "epoch": 1.9863013698630136,
+      "grad_norm": 9.467530250549316,
+      "learning_rate": 4.804402668359115e-06,
+      "loss": 1.854,
+      "step": 580
+    },
+    {
+      "epoch": 2.0,
+      "eval_classification_report": {
+        "accuracy": 0.3015,
+        "ar": {
+          "f1-score": 0.20817843866171004,
+          "precision": 0.4444444444444444,
+          "recall": 0.13592233009708737,
+          "support": 206.0
+        },
+        "cl": {
+          "f1-score": 0.24404761904761904,
+          "precision": 0.21465968586387435,
+          "recall": 0.2827586206896552,
+          "support": 290.0
+        },
+        "co": {
+          "f1-score": 0.3091190108191654,
+          "precision": 0.2808988764044944,
+          "recall": 0.3436426116838488,
+          "support": 291.0
+        },
+        "es": {
+          "f1-score": 0.36363636363636365,
+          "precision": 0.31891891891891894,
+          "recall": 0.4229390681003584,
+          "support": 279.0
+        },
+        "macro avg": {
+          "f1-score": 0.28404923689784706,
+          "precision": 0.313232548351025,
+          "recall": 0.28845705885930073,
+          "support": 2000.0
+        },
+        "mx": {
+          "f1-score": 0.3058350100603622,
+          "precision": 0.36893203883495146,
+          "recall": 0.2611683848797251,
+          "support": 291.0
+        },
+        "pe": {
+          "f1-score": 0.23582089552238805,
+          "precision": 0.20844327176781002,
+          "recall": 0.27147766323024053,
+          "support": 291.0
+        },
+        "pr": {
+          "f1-score": 0.5688888888888889,
+          "precision": 0.5161290322580645,
+          "recall": 0.6336633663366337,
+          "support": 101.0
+        },
+        "uy": {
+          "f1-score": 0.3209169054441261,
+          "precision": 0.4666666666666667,
+          "recall": 0.2445414847161572,
+          "support": 229.0
+        },
+        "ve": {
+          "f1-score": 0.0,
+          "precision": 0.0,
+          "recall": 0.0,
+          "support": 22.0
+        },
+        "weighted avg": {
+          "f1-score": 0.29681818157005363,
+          "precision": 0.3257693650891501,
+          "recall": 0.3015,
+          "support": 2000.0
+        }
+      },
+      "eval_f1": 0.28404923689784706,
+      "eval_loss": 1.8588982820510864,
+      "eval_runtime": 3.9624,
+      "eval_samples_per_second": 504.741,
+      "eval_steps_per_second": 31.546,
+      "step": 584
+    }
+  ],
+  "logging_steps": 10,
+  "max_steps": 876,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 613876671986688.0,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": null
+}

trial_0/checkpoint-584/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cf983bab71d39717083fd85c30b7e0fd950e8d457e647f61a7ff596cb390b138
+size 5368

trial_0/checkpoint-584/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

trial_0/checkpoint-876/config.json ADDED Viewed

	@@ -0,0 +1,50 @@

+{
+  "_name_or_path": "dccuchile/bert-base-spanish-wwm-uncased",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "ar",
+    "1": "cl",
+    "2": "co",
+    "3": "es",
+    "4": "mx",
+    "5": "pe",
+    "6": "pr",
+    "7": "uy",
+    "8": "ve"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "ar": 0,
+    "cl": 1,
+    "co": 2,
+    "es": 3,
+    "mx": 4,
+    "pe": 5,
+    "pr": 6,
+    "uy": 7,
+    "ve": 8
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "output_past": true,
+  "pad_token_id": 1,
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.48.3",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 31002
+}

trial_0/checkpoint-876/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cf854bf20a145ed4aea50832d905cbc3b7c185076aa225249307cba72e17e404
+size 439454740

trial_0/checkpoint-876/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a57e2c02488f59dc935a6f5d7b68b0210f98125fd0c15d37ff039eb0f9a9cb9e
+size 879030522

trial_0/checkpoint-876/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a5ec19cccb67f774cb5d9d70fcb09d0964e6b44cd2249c3f0f947bc6c27a2d1c
+size 14244

trial_0/checkpoint-876/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5f3e075f9e406a57a0eebb4f878639933cb4c2996bf03eaa3ac48b55e42597a6
+size 1064

trial_0/checkpoint-876/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,37 @@

+{
+  "cls_token": {
+    "content": "[CLS]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "mask_token": {
+    "content": "[MASK]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "[PAD]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "sep_token": {
+    "content": "[SEP]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "unk_token": {
+    "content": "[UNK]",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
+}

trial_0/checkpoint-876/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

trial_0/checkpoint-876/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,58 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "3": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "4": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "5": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": false,
+  "cls_token": "[CLS]",
+  "do_basic_tokenize": true,
+  "do_lower_case": true,
+  "extra_special_tokens": {},
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "never_split": null,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": false,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "unk_token": "[UNK]"
+}

trial_0/checkpoint-876/trainer_state.json ADDED Viewed

	@@ -0,0 +1,876 @@

+{
+  "best_metric": 0.30473656895821705,
+  "best_model_checkpoint": "/content/drive/MyDrive/model_outputs/trial_0/checkpoint-876",
+  "epoch": 3.0,
+  "eval_steps": 500,
+  "global_step": 876,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.03424657534246575,
+      "grad_norm": 8.432939529418945,
+      "learning_rate": 8.18270817933484e-07,
+      "loss": 2.2234,
+      "step": 10
+    },
+    {
+      "epoch": 0.0684931506849315,
+      "grad_norm": 8.3140230178833,
+      "learning_rate": 1.636541635866968e-06,
+      "loss": 2.2403,
+      "step": 20
+    },
+    {
+      "epoch": 0.10273972602739725,
+      "grad_norm": 7.506945610046387,
+      "learning_rate": 2.454812453800452e-06,
+      "loss": 2.2297,
+      "step": 30
+    },
+    {
+      "epoch": 0.136986301369863,
+      "grad_norm": 8.531285285949707,
+      "learning_rate": 3.273083271733936e-06,
+      "loss": 2.1823,
+      "step": 40
+    },
+    {
+      "epoch": 0.17123287671232876,
+      "grad_norm": 7.951968669891357,
+      "learning_rate": 4.091354089667421e-06,
+      "loss": 2.1696,
+      "step": 50
+    },
+    {
+      "epoch": 0.2054794520547945,
+      "grad_norm": 8.328391075134277,
+      "learning_rate": 4.909624907600904e-06,
+      "loss": 2.1415,
+      "step": 60
+    },
+    {
+      "epoch": 0.23972602739726026,
+      "grad_norm": 7.337668418884277,
+      "learning_rate": 5.727895725534388e-06,
+      "loss": 2.1206,
+      "step": 70
+    },
+    {
+      "epoch": 0.273972602739726,
+      "grad_norm": 7.09800386428833,
+      "learning_rate": 6.546166543467872e-06,
+      "loss": 2.0949,
+      "step": 80
+    },
+    {
+      "epoch": 0.3082191780821918,
+      "grad_norm": 6.549777507781982,
+      "learning_rate": 7.364437361401356e-06,
+      "loss": 2.076,
+      "step": 90
+    },
+    {
+      "epoch": 0.3424657534246575,
+      "grad_norm": 7.464539051055908,
+      "learning_rate": 8.182708179334841e-06,
+      "loss": 2.096,
+      "step": 100
+    },
+    {
+      "epoch": 0.3767123287671233,
+      "grad_norm": 6.982883930206299,
+      "learning_rate": 9.000978997268324e-06,
+      "loss": 2.0615,
+      "step": 110
+    },
+    {
+      "epoch": 0.410958904109589,
+      "grad_norm": 7.149113655090332,
+      "learning_rate": 9.819249815201808e-06,
+      "loss": 2.0785,
+      "step": 120
+    },
+    {
+      "epoch": 0.4452054794520548,
+      "grad_norm": 6.507534503936768,
+      "learning_rate": 1.0637520633135292e-05,
+      "loss": 2.0865,
+      "step": 130
+    },
+    {
+      "epoch": 0.4794520547945205,
+      "grad_norm": 6.1932196617126465,
+      "learning_rate": 1.1455791451068777e-05,
+      "loss": 2.0533,
+      "step": 140
+    },
+    {
+      "epoch": 0.5136986301369864,
+      "grad_norm": 7.072916507720947,
+      "learning_rate": 1.1783771409556479e-05,
+      "loss": 2.0613,
+      "step": 150
+    },
+    {
+      "epoch": 0.547945205479452,
+      "grad_norm": 8.155049324035645,
+      "learning_rate": 1.1621460508598402e-05,
+      "loss": 2.0284,
+      "step": 160
+    },
+    {
+      "epoch": 0.5821917808219178,
+      "grad_norm": 9.3668851852417,
+      "learning_rate": 1.1459149607640322e-05,
+      "loss": 2.0137,
+      "step": 170
+    },
+    {
+      "epoch": 0.6164383561643836,
+      "grad_norm": 8.165146827697754,
+      "learning_rate": 1.1296838706682245e-05,
+      "loss": 1.9835,
+      "step": 180
+    },
+    {
+      "epoch": 0.6506849315068494,
+      "grad_norm": 9.0431547164917,
+      "learning_rate": 1.1134527805724166e-05,
+      "loss": 1.9934,
+      "step": 190
+    },
+    {
+      "epoch": 0.684931506849315,
+      "grad_norm": 8.92784309387207,
+      "learning_rate": 1.0972216904766088e-05,
+      "loss": 2.0081,
+      "step": 200
+    },
+    {
+      "epoch": 0.7191780821917808,
+      "grad_norm": 9.184441566467285,
+      "learning_rate": 1.0809906003808009e-05,
+      "loss": 1.9567,
+      "step": 210
+    },
+    {
+      "epoch": 0.7534246575342466,
+      "grad_norm": 10.262762069702148,
+      "learning_rate": 1.0647595102849931e-05,
+      "loss": 1.966,
+      "step": 220
+    },
+    {
+      "epoch": 0.7876712328767124,
+      "grad_norm": 7.367489337921143,
+      "learning_rate": 1.0485284201891854e-05,
+      "loss": 2.051,
+      "step": 230
+    },
+    {
+      "epoch": 0.821917808219178,
+      "grad_norm": 8.76405143737793,
+      "learning_rate": 1.0322973300933776e-05,
+      "loss": 2.0785,
+      "step": 240
+    },
+    {
+      "epoch": 0.8561643835616438,
+      "grad_norm": 7.100874900817871,
+      "learning_rate": 1.0160662399975697e-05,
+      "loss": 1.9977,
+      "step": 250
+    },
+    {
+      "epoch": 0.8904109589041096,
+      "grad_norm": 8.239387512207031,
+      "learning_rate": 9.998351499017618e-06,
+      "loss": 2.0099,
+      "step": 260
+    },
+    {
+      "epoch": 0.9246575342465754,
+      "grad_norm": 7.704412460327148,
+      "learning_rate": 9.83604059805954e-06,
+      "loss": 1.9851,
+      "step": 270
+    },
+    {
+      "epoch": 0.958904109589041,
+      "grad_norm": 7.8163652420043945,
+      "learning_rate": 9.673729697101463e-06,
+      "loss": 2.0085,
+      "step": 280
+    },
+    {
+      "epoch": 0.9931506849315068,
+      "grad_norm": 8.153071403503418,
+      "learning_rate": 9.511418796143383e-06,
+      "loss": 1.9962,
+      "step": 290
+    },
+    {
+      "epoch": 1.0,
+      "eval_classification_report": {
+        "accuracy": 0.2375,
+        "ar": {
+          "f1-score": 0.0622568093385214,
+          "precision": 0.1568627450980392,
+          "recall": 0.038834951456310676,
+          "support": 206.0
+        },
+        "cl": {
+          "f1-score": 0.2011173184357542,
+          "precision": 0.16901408450704225,
+          "recall": 0.2482758620689655,
+          "support": 290.0
+        },
+        "co": {
+          "f1-score": 0.31543624161073824,
+          "precision": 0.23383084577114427,
+          "recall": 0.4845360824742268,
+          "support": 291.0
+        },
+        "es": {
+          "f1-score": 0.27364185110663986,
+          "precision": 0.3119266055045872,
+          "recall": 0.24372759856630824,
+          "support": 279.0
+        },
+        "macro avg": {
+          "f1-score": 0.2140692864641761,
+          "precision": 0.24922489036795273,
+          "recall": 0.22042150190811827,
+          "support": 2000.0
+        },
+        "mx": {
+          "f1-score": 0.22950819672131148,
+          "precision": 0.28426395939086296,
+          "recall": 0.19243986254295534,
+          "support": 291.0
+        },
+        "pe": {
+          "f1-score": 0.10610079575596817,
+          "precision": 0.23255813953488372,
+          "recall": 0.06872852233676977,
+          "support": 291.0
+        },
+        "pr": {
+          "f1-score": 0.5030674846625767,
+          "precision": 0.6612903225806451,
+          "recall": 0.40594059405940597,
+          "support": 101.0
+        },
+        "uy": {
+          "f1-score": 0.2354948805460751,
+          "precision": 0.19327731092436976,
+          "recall": 0.30131004366812225,
+          "support": 229.0
+        },
+        "ve": {
+          "f1-score": 0.0,
+          "precision": 0.0,
+          "recall": 0.0,
+          "support": 22.0
+        },
+        "weighted avg": {
+          "f1-score": 0.22084365412222065,
+          "precision": 0.24892308331106963,
+          "recall": 0.2375,
+          "support": 2000.0
+        }
+      },
+      "eval_f1": 0.2140692864641761,
+      "eval_loss": 1.964627742767334,
+      "eval_runtime": 3.948,
+      "eval_samples_per_second": 506.591,
+      "eval_steps_per_second": 31.662,
+      "step": 292
+    },
+    {
+      "epoch": 1.0273972602739727,
+      "grad_norm": 7.403143882751465,
+      "learning_rate": 9.349107895185306e-06,
+      "loss": 1.9144,
+      "step": 300
+    },
+    {
+      "epoch": 1.0616438356164384,
+      "grad_norm": 7.673084735870361,
+      "learning_rate": 9.186796994227228e-06,
+      "loss": 1.8783,
+      "step": 310
+    },
+    {
+      "epoch": 1.095890410958904,
+      "grad_norm": 7.875649452209473,
+      "learning_rate": 9.024486093269149e-06,
+      "loss": 1.9275,
+      "step": 320
+    },
+    {
+      "epoch": 1.13013698630137,
+      "grad_norm": 8.519344329833984,
+      "learning_rate": 8.86217519231107e-06,
+      "loss": 1.9603,
+      "step": 330
+    },
+    {
+      "epoch": 1.1643835616438356,
+      "grad_norm": 11.323283195495605,
+      "learning_rate": 8.699864291352992e-06,
+      "loss": 1.923,
+      "step": 340
+    },
+    {
+      "epoch": 1.1986301369863013,
+      "grad_norm": 8.269103050231934,
+      "learning_rate": 8.537553390394915e-06,
+      "loss": 1.9427,
+      "step": 350
+    },
+    {
+      "epoch": 1.2328767123287672,
+      "grad_norm": 9.630481719970703,
+      "learning_rate": 8.375242489436837e-06,
+      "loss": 1.8944,
+      "step": 360
+    },
+    {
+      "epoch": 1.2671232876712328,
+      "grad_norm": 10.00069808959961,
+      "learning_rate": 8.212931588478758e-06,
+      "loss": 1.8854,
+      "step": 370
+    },
+    {
+      "epoch": 1.3013698630136985,
+      "grad_norm": 10.448683738708496,
+      "learning_rate": 8.05062068752068e-06,
+      "loss": 1.9484,
+      "step": 380
+    },
+    {
+      "epoch": 1.3356164383561644,
+      "grad_norm": 9.772107124328613,
+      "learning_rate": 7.888309786562601e-06,
+      "loss": 1.8663,
+      "step": 390
+    },
+    {
+      "epoch": 1.36986301369863,
+      "grad_norm": 10.358853340148926,
+      "learning_rate": 7.725998885604523e-06,
+      "loss": 1.9082,
+      "step": 400
+    },
+    {
+      "epoch": 1.404109589041096,
+      "grad_norm": 11.836031913757324,
+      "learning_rate": 7.563687984646444e-06,
+      "loss": 1.881,
+      "step": 410
+    },
+    {
+      "epoch": 1.4383561643835616,
+      "grad_norm": 11.461163520812988,
+      "learning_rate": 7.401377083688367e-06,
+      "loss": 1.964,
+      "step": 420
+    },
+    {
+      "epoch": 1.4726027397260273,
+      "grad_norm": 9.836813926696777,
+      "learning_rate": 7.239066182730289e-06,
+      "loss": 1.8552,
+      "step": 430
+    },
+    {
+      "epoch": 1.5068493150684932,
+      "grad_norm": 12.651612281799316,
+      "learning_rate": 7.076755281772211e-06,
+      "loss": 1.8211,
+      "step": 440
+    },
+    {
+      "epoch": 1.541095890410959,
+      "grad_norm": 10.353775024414062,
+      "learning_rate": 6.9144443808141315e-06,
+      "loss": 1.905,
+      "step": 450
+    },
+    {
+      "epoch": 1.5753424657534247,
+      "grad_norm": 9.688141822814941,
+      "learning_rate": 6.752133479856054e-06,
+      "loss": 1.8525,
+      "step": 460
+    },
+    {
+      "epoch": 1.6095890410958904,
+      "grad_norm": 10.979829788208008,
+      "learning_rate": 6.5898225788979756e-06,
+      "loss": 1.8468,
+      "step": 470
+    },
+    {
+      "epoch": 1.643835616438356,
+      "grad_norm": 11.913898468017578,
+      "learning_rate": 6.427511677939898e-06,
+      "loss": 1.8301,
+      "step": 480
+    },
+    {
+      "epoch": 1.678082191780822,
+      "grad_norm": 9.506439208984375,
+      "learning_rate": 6.265200776981819e-06,
+      "loss": 1.9175,
+      "step": 490
+    },
+    {
+      "epoch": 1.7123287671232876,
+      "grad_norm": 11.259939193725586,
+      "learning_rate": 6.102889876023741e-06,
+      "loss": 1.8674,
+      "step": 500
+    },
+    {
+      "epoch": 1.7465753424657535,
+      "grad_norm": 10.506684303283691,
+      "learning_rate": 5.940578975065663e-06,
+      "loss": 1.8201,
+      "step": 510
+    },
+    {
+      "epoch": 1.7808219178082192,
+      "grad_norm": 10.255843162536621,
+      "learning_rate": 5.7782680741075844e-06,
+      "loss": 1.83,
+      "step": 520
+    },
+    {
+      "epoch": 1.8150684931506849,
+      "grad_norm": 10.053559303283691,
+      "learning_rate": 5.615957173149507e-06,
+      "loss": 1.8929,
+      "step": 530
+    },
+    {
+      "epoch": 1.8493150684931505,
+      "grad_norm": 11.122831344604492,
+      "learning_rate": 5.4536462721914285e-06,
+      "loss": 1.8836,
+      "step": 540
+    },
+    {
+      "epoch": 1.8835616438356164,
+      "grad_norm": 10.520340919494629,
+      "learning_rate": 5.29133537123335e-06,
+      "loss": 1.8587,
+      "step": 550
+    },
+    {
+      "epoch": 1.9178082191780823,
+      "grad_norm": 10.444989204406738,
+      "learning_rate": 5.129024470275272e-06,
+      "loss": 1.9133,
+      "step": 560
+    },
+    {
+      "epoch": 1.952054794520548,
+      "grad_norm": 9.19580078125,
+      "learning_rate": 4.966713569317194e-06,
+      "loss": 1.7403,
+      "step": 570
+    },
+    {
+      "epoch": 1.9863013698630136,
+      "grad_norm": 9.467530250549316,
+      "learning_rate": 4.804402668359115e-06,
+      "loss": 1.854,
+      "step": 580
+    },
+    {
+      "epoch": 2.0,
+      "eval_classification_report": {
+        "accuracy": 0.3015,
+        "ar": {
+          "f1-score": 0.20817843866171004,
+          "precision": 0.4444444444444444,
+          "recall": 0.13592233009708737,
+          "support": 206.0
+        },
+        "cl": {
+          "f1-score": 0.24404761904761904,
+          "precision": 0.21465968586387435,
+          "recall": 0.2827586206896552,
+          "support": 290.0
+        },
+        "co": {
+          "f1-score": 0.3091190108191654,
+          "precision": 0.2808988764044944,
+          "recall": 0.3436426116838488,
+          "support": 291.0
+        },
+        "es": {
+          "f1-score": 0.36363636363636365,
+          "precision": 0.31891891891891894,
+          "recall": 0.4229390681003584,
+          "support": 279.0
+        },
+        "macro avg": {
+          "f1-score": 0.28404923689784706,
+          "precision": 0.313232548351025,
+          "recall": 0.28845705885930073,
+          "support": 2000.0
+        },
+        "mx": {
+          "f1-score": 0.3058350100603622,
+          "precision": 0.36893203883495146,
+          "recall": 0.2611683848797251,
+          "support": 291.0
+        },
+        "pe": {
+          "f1-score": 0.23582089552238805,
+          "precision": 0.20844327176781002,
+          "recall": 0.27147766323024053,
+          "support": 291.0
+        },
+        "pr": {
+          "f1-score": 0.5688888888888889,
+          "precision": 0.5161290322580645,
+          "recall": 0.6336633663366337,
+          "support": 101.0
+        },
+        "uy": {
+          "f1-score": 0.3209169054441261,
+          "precision": 0.4666666666666667,
+          "recall": 0.2445414847161572,
+          "support": 229.0
+        },
+        "ve": {
+          "f1-score": 0.0,
+          "precision": 0.0,
+          "recall": 0.0,
+          "support": 22.0
+        },
+        "weighted avg": {
+          "f1-score": 0.29681818157005363,
+          "precision": 0.3257693650891501,
+          "recall": 0.3015,
+          "support": 2000.0
+        }
+      },
+      "eval_f1": 0.28404923689784706,
+      "eval_loss": 1.8588982820510864,
+      "eval_runtime": 3.9624,
+      "eval_samples_per_second": 504.741,
+      "eval_steps_per_second": 31.546,
+      "step": 584
+    },
+    {
+      "epoch": 2.0205479452054793,
+      "grad_norm": 10.664342880249023,
+      "learning_rate": 4.642091767401037e-06,
+      "loss": 1.7675,
+      "step": 590
+    },
+    {
+      "epoch": 2.0547945205479454,
+      "grad_norm": 10.18624210357666,
+      "learning_rate": 4.479780866442959e-06,
+      "loss": 1.7303,
+      "step": 600
+    },
+    {
+      "epoch": 2.089041095890411,
+      "grad_norm": 9.922106742858887,
+      "learning_rate": 4.3174699654848806e-06,
+      "loss": 1.6809,
+      "step": 610
+    },
+    {
+      "epoch": 2.1232876712328768,
+      "grad_norm": 10.778169631958008,
+      "learning_rate": 4.155159064526802e-06,
+      "loss": 1.6858,
+      "step": 620
+    },
+    {
+      "epoch": 2.1575342465753424,
+      "grad_norm": 11.85101318359375,
+      "learning_rate": 3.992848163568725e-06,
+      "loss": 1.7164,
+      "step": 630
+    },
+    {
+      "epoch": 2.191780821917808,
+      "grad_norm": 10.55038833618164,
+      "learning_rate": 3.830537262610646e-06,
+      "loss": 1.7627,
+      "step": 640
+    },
+    {
+      "epoch": 2.2260273972602738,
+      "grad_norm": 12.37063217163086,
+      "learning_rate": 3.6682263616525683e-06,
+      "loss": 1.7254,
+      "step": 650
+    },
+    {
+      "epoch": 2.26027397260274,
+      "grad_norm": 12.823184967041016,
+      "learning_rate": 3.5059154606944894e-06,
+      "loss": 1.6745,
+      "step": 660
+    },
+    {
+      "epoch": 2.2945205479452055,
+      "grad_norm": 10.982261657714844,
+      "learning_rate": 3.3436045597364115e-06,
+      "loss": 1.6329,
+      "step": 670
+    },
+    {
+      "epoch": 2.328767123287671,
+      "grad_norm": 11.901023864746094,
+      "learning_rate": 3.181293658778333e-06,
+      "loss": 1.7054,
+      "step": 680
+    },
+    {
+      "epoch": 2.363013698630137,
+      "grad_norm": 12.643646240234375,
+      "learning_rate": 3.018982757820255e-06,
+      "loss": 1.6988,
+      "step": 690
+    },
+    {
+      "epoch": 2.3972602739726026,
+      "grad_norm": 11.213497161865234,
+      "learning_rate": 2.8566718568621767e-06,
+      "loss": 1.6856,
+      "step": 700
+    },
+    {
+      "epoch": 2.4315068493150687,
+      "grad_norm": 13.69401741027832,
+      "learning_rate": 2.6943609559040983e-06,
+      "loss": 1.7865,
+      "step": 710
+    },
+    {
+      "epoch": 2.4657534246575343,
+      "grad_norm": 11.204819679260254,
+      "learning_rate": 2.5320500549460203e-06,
+      "loss": 1.6012,
+      "step": 720
+    },
+    {
+      "epoch": 2.5,
+      "grad_norm": 11.135315895080566,
+      "learning_rate": 2.369739153987942e-06,
+      "loss": 1.7297,
+      "step": 730
+    },
+    {
+      "epoch": 2.5342465753424657,
+      "grad_norm": 11.281685829162598,
+      "learning_rate": 2.207428253029864e-06,
+      "loss": 1.7066,
+      "step": 740
+    },
+    {
+      "epoch": 2.5684931506849313,
+      "grad_norm": 12.174514770507812,
+      "learning_rate": 2.0451173520717856e-06,
+      "loss": 1.7291,
+      "step": 750
+    },
+    {
+      "epoch": 2.602739726027397,
+      "grad_norm": 11.84288501739502,
+      "learning_rate": 1.8828064511137074e-06,
+      "loss": 1.7143,
+      "step": 760
+    },
+    {
+      "epoch": 2.636986301369863,
+      "grad_norm": 13.132065773010254,
+      "learning_rate": 1.7204955501556292e-06,
+      "loss": 1.6739,
+      "step": 770
+    },
+    {
+      "epoch": 2.671232876712329,
+      "grad_norm": 10.684150695800781,
+      "learning_rate": 1.5581846491975508e-06,
+      "loss": 1.7677,
+      "step": 780
+    },
+    {
+      "epoch": 2.7054794520547945,
+      "grad_norm": 10.924251556396484,
+      "learning_rate": 1.3958737482394726e-06,
+      "loss": 1.7319,
+      "step": 790
+    },
+    {
+      "epoch": 2.73972602739726,
+      "grad_norm": 11.701458930969238,
+      "learning_rate": 1.2335628472813945e-06,
+      "loss": 1.633,
+      "step": 800
+    },
+    {
+      "epoch": 2.7739726027397262,
+      "grad_norm": 15.176057815551758,
+      "learning_rate": 1.0712519463233163e-06,
+      "loss": 1.7776,
+      "step": 810
+    },
+    {
+      "epoch": 2.808219178082192,
+      "grad_norm": 11.823851585388184,
+      "learning_rate": 9.08941045365238e-07,
+      "loss": 1.6718,
+      "step": 820
+    },
+    {
+      "epoch": 2.8424657534246576,
+      "grad_norm": 16.096837997436523,
+      "learning_rate": 7.466301444071598e-07,
+      "loss": 1.8125,
+      "step": 830
+    },
+    {
+      "epoch": 2.8767123287671232,
+      "grad_norm": 14.548500061035156,
+      "learning_rate": 5.843192434490816e-07,
+      "loss": 1.6709,
+      "step": 840
+    },
+    {
+      "epoch": 2.910958904109589,
+      "grad_norm": 14.510014533996582,
+      "learning_rate": 4.2200834249100337e-07,
+      "loss": 1.7332,
+      "step": 850
+    },
+    {
+      "epoch": 2.9452054794520546,
+      "grad_norm": 12.800880432128906,
+      "learning_rate": 2.5969744153292514e-07,
+      "loss": 1.656,
+      "step": 860
+    },
+    {
+      "epoch": 2.9794520547945207,
+      "grad_norm": 11.786734580993652,
+      "learning_rate": 9.738654057484693e-08,
+      "loss": 1.6054,
+      "step": 870
+    },
+    {
+      "epoch": 3.0,
+      "eval_classification_report": {
+        "accuracy": 0.321,
+        "ar": {
+          "f1-score": 0.24539877300613497,
+          "precision": 0.3333333333333333,
+          "recall": 0.1941747572815534,
+          "support": 206.0
+        },
+        "cl": {
+          "f1-score": 0.22151898734177214,
+          "precision": 0.2046783625730994,
+          "recall": 0.2413793103448276,
+          "support": 290.0
+        },
+        "co": {
+          "f1-score": 0.327212020033389,
+          "precision": 0.3181818181818182,
+          "recall": 0.33676975945017185,
+          "support": 291.0
+        },
+        "es": {
+          "f1-score": 0.39095315024232635,
+          "precision": 0.3558823529411765,
+          "recall": 0.4336917562724014,
+          "support": 279.0
+        },
+        "macro avg": {
+          "f1-score": 0.30473656895821705,
+          "precision": 0.31299377782399707,
+          "recall": 0.3074325006319518,
+          "support": 2000.0
+        },
+        "mx": {
+          "f1-score": 0.36075949367088606,
+          "precision": 0.3343108504398827,
+          "recall": 0.3917525773195876,
+          "support": 291.0
+        },
+        "pe": {
+          "f1-score": 0.23850085178875638,
+          "precision": 0.23648648648648649,
+          "recall": 0.24054982817869416,
+          "support": 291.0
+        },
+        "pr": {
+          "f1-score": 0.616822429906542,
+          "precision": 0.584070796460177,
+          "recall": 0.6534653465346535,
+          "support": 101.0
+        },
+        "uy": {
+          "f1-score": 0.34146341463414637,
+          "precision": 0.45,
+          "recall": 0.27510917030567683,
+          "support": 229.0
+        },
+        "ve": {
+          "f1-score": 0.0,
+          "precision": 0.0,
+          "recall": 0.0,
+          "support": 22.0
+        },
+        "weighted avg": {
+          "f1-score": 0.3169831141081196,
+          "precision": 0.3240243264312071,
+          "recall": 0.321,
+          "support": 2000.0
+        }
+      },
+      "eval_f1": 0.30473656895821705,
+      "eval_loss": 1.8237080574035645,
+      "eval_runtime": 3.9808,
+      "eval_samples_per_second": 502.417,
+      "eval_steps_per_second": 31.401,
+      "step": 876
+    }
+  ],
+  "logging_steps": 10,
+  "max_steps": 876,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 920815007980032.0,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": null
+}

trial_0/checkpoint-876/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cf983bab71d39717083fd85c30b7e0fd950e8d457e647f61a7ff596cb390b138
+size 5368

trial_0/checkpoint-876/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

trial_0/logs/events.out.tfevents.1740158198.a2d653e866f9.226.4 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d93a76ea98cda8f1a1f299c4559552e6ff63b7201898fd12d91c00f7d63ab861
+size 6723

trial_0/logs/events.out.tfevents.1740161296.0a0ba32201a8.2151.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0e04278ab83601bb3ec7661f515626f6d5cc7e973b6bc6ef2761183a848daed5
+size 30179

trial_0/logs/events.out.tfevents.1740161531.0a0ba32201a8.2151.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cc6a4056a5185e518d4124b6179202d83d9aa7b9da6f6957c3776875c2345405
+size 25089

trial_0/logs/events.out.tfevents.1740161645.0a0ba32201a8.2151.2 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:76747c3b41f44365b9f8d4eabb3389f8487d7441a12322dc7488712efccf4d86
+size 405

trial_1/checkpoint-146/config.json ADDED Viewed

	@@ -0,0 +1,50 @@

+{
+  "_name_or_path": "dccuchile/bert-base-spanish-wwm-uncased",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "ar",
+    "1": "cl",
+    "2": "co",
+    "3": "es",
+    "4": "mx",
+    "5": "pe",
+    "6": "pr",
+    "7": "uy",
+    "8": "ve"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "ar": 0,
+    "cl": 1,
+    "co": 2,
+    "es": 3,
+    "mx": 4,
+    "pe": 5,
+    "pr": 6,
+    "uy": 7,
+    "ve": 8
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "output_past": true,
+  "pad_token_id": 1,
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.48.3",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 31002
+}

trial_1/checkpoint-146/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6f148025042e8766377f58bd5b2cb8ab568f58cfee85f2f67d50d7b13949b896
+size 439454740

trial_1/checkpoint-146/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d5b16f9046371de70837c5fcfbbb97032ca47fd7b0f2f5f70b053c6733259e41
+size 879030522