daccuong2002 committed on Jul 19

Commit

1e49d2a

•

1 Parent(s): 4aff16e

Upload folder using huggingface_hub

Browse files

Files changed (19) hide show

README.md +36 -0
added_tokens.json +3 -0
bpe.codes +0 -0
checkpoint-3318/config.json +46 -0
checkpoint-3318/model.safetensors +3 -0
checkpoint-3318/optimizer.pt +3 -0
checkpoint-3318/rng_state.pth +3 -0
checkpoint-3318/scheduler.pt +3 -0
checkpoint-3318/trainer_state.json +1020 -0
checkpoint-3318/training_args.bin +3 -0
config.json +46 -0
model.safetensors +3 -0
runs/Jul19_08-08-26_r-daccuong2002-runmay3-jzutjz7y-f713d-ewa9l/events.out.tfevents.1721376507.r-daccuong2002-runmay3-jzutjz7y-f713d-ewa9l.98.0 +2 -2
runs/Jul19_08-08-26_r-daccuong2002-runmay3-jzutjz7y-f713d-ewa9l/events.out.tfevents.1721396576.r-daccuong2002-runmay3-jzutjz7y-f713d-ewa9l.98.1 +3 -0
special_tokens_map.json +9 -0
tokenizer_config.json +54 -0
training_args.bin +3 -0
training_params.json +30 -0
vocab.txt +0 -0

README.md ADDED Viewed

	@@ -0,0 +1,36 @@

+---
+tags:
+- autotrain
+- text-classification
+base_model: vinai/phobert-base-v2
+widget:
+- text: "I love AutoTrain"
+---
+# Model Trained Using AutoTrain
+- Problem type: Text Classification
+## Validation Metrics
+loss: 0.3279833495616913
+f1_macro: 0.876649943334319
+f1_micro: 0.9077217308152044
+f1_weighted: 0.9087694078887676
+precision_macro: 0.8488349060784007
+precision_micro: 0.9077217308152044
+precision_weighted: 0.9121960695781595
+recall_macro: 0.9108354827796887
+recall_micro: 0.9077217308152044
+recall_weighted: 0.9077217308152044
+accuracy: 0.9077217308152044

added_tokens.json ADDED Viewed

	@@ -0,0 +1,3 @@

+{
+  "<mask>": 64000
+}

bpe.codes ADDED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-3318/config.json ADDED Viewed

	@@ -0,0 +1,46 @@

+{
+  "_name_or_path": "vinai/phobert-base-v2",
+  "_num_labels": 6,
+  "architectures": [
+    "RobertaForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "bos_token_id": 0,
+  "classifier_dropout": null,
+  "eos_token_id": 2,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "2733522",
+    "1": "2733534",
+    "2": "2733540",
+    "3": "2733546",
+    "4": "2733552",
+    "5": "2733570"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "2733522": 0,
+    "2733534": 1,
+    "2733540": 2,
+    "2733546": 3,
+    "2733552": 4,
+    "2733570": 5
+  },
+  "layer_norm_eps": 1e-05,
+  "max_position_embeddings": 258,
+  "model_type": "roberta",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 1,
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "tokenizer_class": "PhobertTokenizer",
+  "torch_dtype": "float32",
+  "transformers_version": "4.42.2",
+  "type_vocab_size": 1,
+  "use_cache": true,
+  "vocab_size": 64001
+}

checkpoint-3318/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6a7f3216c6c1b6968f4f4281cf1783c8a31a1b4bfab39a5c662e9187b46dd9a4
+size 540035688

checkpoint-3318/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c19526db84c55352b658c866c30e730017626871256e7e12c7b10b866f0a5f54
+size 1080185594

checkpoint-3318/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ee3e85b34fcc1f3e72b38b7a9e71564fc210aedb1f14a96c4fe8318c124f297d
+size 13990

checkpoint-3318/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1c1e7c83cf538fc428c3e82626883d7aafd057626237481ba3d141d2e7e4f6e7
+size 1064

checkpoint-3318/trainer_state.json ADDED Viewed

	@@ -0,0 +1,1020 @@

+{
+  "best_metric": 0.3279833495616913,
+  "best_model_checkpoint": "PhoBert-MultiLabel-KMeans/checkpoint-3318",
+  "epoch": 3.0,
+  "eval_steps": 500,
+  "global_step": 3318,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.022603978300180832,
+      "grad_norm": 3.841909170150757,
+      "learning_rate": 3.765060240963856e-06,
+      "loss": 1.7878,
+      "step": 25
+    },
+    {
+      "epoch": 0.045207956600361664,
+      "grad_norm": 2.6476118564605713,
+      "learning_rate": 7.530120481927712e-06,
+      "loss": 1.7541,
+      "step": 50
+    },
+    {
+      "epoch": 0.06781193490054249,
+      "grad_norm": 3.1488897800445557,
+      "learning_rate": 1.1295180722891567e-05,
+      "loss": 1.7143,
+      "step": 75
+    },
+    {
+      "epoch": 0.09041591320072333,
+      "grad_norm": 3.9978089332580566,
+      "learning_rate": 1.5060240963855424e-05,
+      "loss": 1.6553,
+      "step": 100
+    },
+    {
+      "epoch": 0.11301989150090416,
+      "grad_norm": 4.824118614196777,
+      "learning_rate": 1.882530120481928e-05,
+      "loss": 1.5607,
+      "step": 125
+    },
+    {
+      "epoch": 0.13562386980108498,
+      "grad_norm": 4.588301658630371,
+      "learning_rate": 2.2590361445783133e-05,
+      "loss": 1.4288,
+      "step": 150
+    },
+    {
+      "epoch": 0.15822784810126583,
+      "grad_norm": 14.850578308105469,
+      "learning_rate": 2.635542168674699e-05,
+      "loss": 1.2511,
+      "step": 175
+    },
+    {
+      "epoch": 0.18083182640144665,
+      "grad_norm": 11.93288516998291,
+      "learning_rate": 3.012048192771085e-05,
+      "loss": 1.1645,
+      "step": 200
+    },
+    {
+      "epoch": 0.20343580470162748,
+      "grad_norm": 10.374913215637207,
+      "learning_rate": 3.38855421686747e-05,
+      "loss": 1.1245,
+      "step": 225
+    },
+    {
+      "epoch": 0.22603978300180833,
+      "grad_norm": 5.814253330230713,
+      "learning_rate": 3.765060240963856e-05,
+      "loss": 1.1271,
+      "step": 250
+    },
+    {
+      "epoch": 0.24864376130198915,
+      "grad_norm": 19.154064178466797,
+      "learning_rate": 4.141566265060241e-05,
+      "loss": 1.0359,
+      "step": 275
+    },
+    {
+      "epoch": 0.27124773960216997,
+      "grad_norm": 12.057534217834473,
+      "learning_rate": 4.5180722891566266e-05,
+      "loss": 0.9842,
+      "step": 300
+    },
+    {
+      "epoch": 0.2938517179023508,
+      "grad_norm": 5.480999946594238,
+      "learning_rate": 4.8945783132530124e-05,
+      "loss": 1.165,
+      "step": 325
+    },
+    {
+      "epoch": 0.31645569620253167,
+      "grad_norm": 27.02998924255371,
+      "learning_rate": 4.969859343603483e-05,
+      "loss": 1.0626,
+      "step": 350
+    },
+    {
+      "epoch": 0.33905967450271246,
+      "grad_norm": 8.911443710327148,
+      "learning_rate": 4.927997320830543e-05,
+      "loss": 0.9147,
+      "step": 375
+    },
+    {
+      "epoch": 0.3616636528028933,
+      "grad_norm": 7.904396057128906,
+      "learning_rate": 4.886135298057603e-05,
+      "loss": 0.8824,
+      "step": 400
+    },
+    {
+      "epoch": 0.38426763110307416,
+      "grad_norm": 40.34563064575195,
+      "learning_rate": 4.844273275284662e-05,
+      "loss": 0.9151,
+      "step": 425
+    },
+    {
+      "epoch": 0.40687160940325495,
+      "grad_norm": 11.78642749786377,
+      "learning_rate": 4.8024112525117214e-05,
+      "loss": 0.9926,
+      "step": 450
+    },
+    {
+      "epoch": 0.4294755877034358,
+      "grad_norm": 8.729843139648438,
+      "learning_rate": 4.760549229738781e-05,
+      "loss": 0.8049,
+      "step": 475
+    },
+    {
+      "epoch": 0.45207956600361665,
+      "grad_norm": 3.0259087085723877,
+      "learning_rate": 4.718687206965841e-05,
+      "loss": 0.9043,
+      "step": 500
+    },
+    {
+      "epoch": 0.47468354430379744,
+      "grad_norm": 3.1441285610198975,
+      "learning_rate": 4.676825184192901e-05,
+      "loss": 1.024,
+      "step": 525
+    },
+    {
+      "epoch": 0.4972875226039783,
+      "grad_norm": 297.1407775878906,
+      "learning_rate": 4.63496316141996e-05,
+      "loss": 0.7747,
+      "step": 550
+    },
+    {
+      "epoch": 0.5198915009041591,
+      "grad_norm": 21.502670288085938,
+      "learning_rate": 4.5931011386470195e-05,
+      "loss": 1.106,
+      "step": 575
+    },
+    {
+      "epoch": 0.5424954792043399,
+      "grad_norm": 7.8344340324401855,
+      "learning_rate": 4.551239115874079e-05,
+      "loss": 0.9031,
+      "step": 600
+    },
+    {
+      "epoch": 0.5650994575045208,
+      "grad_norm": 9.26258373260498,
+      "learning_rate": 4.509377093101139e-05,
+      "loss": 0.9796,
+      "step": 625
+    },
+    {
+      "epoch": 0.5877034358047016,
+      "grad_norm": 21.926687240600586,
+      "learning_rate": 4.467515070328199e-05,
+      "loss": 0.8663,
+      "step": 650
+    },
+    {
+      "epoch": 0.6103074141048824,
+      "grad_norm": 17.36395263671875,
+      "learning_rate": 4.425653047555258e-05,
+      "loss": 0.866,
+      "step": 675
+    },
+    {
+      "epoch": 0.6329113924050633,
+      "grad_norm": 9.919265747070312,
+      "learning_rate": 4.3837910247823175e-05,
+      "loss": 0.8074,
+      "step": 700
+    },
+    {
+      "epoch": 0.6555153707052441,
+      "grad_norm": 15.072575569152832,
+      "learning_rate": 4.3419290020093775e-05,
+      "loss": 0.9021,
+      "step": 725
+    },
+    {
+      "epoch": 0.6781193490054249,
+      "grad_norm": 2.6935675144195557,
+      "learning_rate": 4.300066979236437e-05,
+      "loss": 0.8359,
+      "step": 750
+    },
+    {
+      "epoch": 0.7007233273056058,
+      "grad_norm": 2.398829698562622,
+      "learning_rate": 4.258204956463496e-05,
+      "loss": 0.8454,
+      "step": 775
+    },
+    {
+      "epoch": 0.7233273056057866,
+      "grad_norm": 1.5908894538879395,
+      "learning_rate": 4.216342933690556e-05,
+      "loss": 0.7676,
+      "step": 800
+    },
+    {
+      "epoch": 0.7459312839059674,
+      "grad_norm": 12.428017616271973,
+      "learning_rate": 4.1744809109176155e-05,
+      "loss": 0.8397,
+      "step": 825
+    },
+    {
+      "epoch": 0.7685352622061483,
+      "grad_norm": 8.742015838623047,
+      "learning_rate": 4.1326188881446755e-05,
+      "loss": 0.8207,
+      "step": 850
+    },
+    {
+      "epoch": 0.7911392405063291,
+      "grad_norm": 16.055889129638672,
+      "learning_rate": 4.090756865371735e-05,
+      "loss": 0.7526,
+      "step": 875
+    },
+    {
+      "epoch": 0.8137432188065099,
+      "grad_norm": 2.839799642562866,
+      "learning_rate": 4.048894842598794e-05,
+      "loss": 0.6883,
+      "step": 900
+    },
+    {
+      "epoch": 0.8363471971066908,
+      "grad_norm": 30.43299102783203,
+      "learning_rate": 4.007032819825854e-05,
+      "loss": 0.9797,
+      "step": 925
+    },
+    {
+      "epoch": 0.8589511754068716,
+      "grad_norm": 3.6067237854003906,
+      "learning_rate": 3.965170797052914e-05,
+      "loss": 0.7248,
+      "step": 950
+    },
+    {
+      "epoch": 0.8815551537070524,
+      "grad_norm": 1.6388925313949585,
+      "learning_rate": 3.9233087742799736e-05,
+      "loss": 0.9144,
+      "step": 975
+    },
+    {
+      "epoch": 0.9041591320072333,
+      "grad_norm": 1.7512284517288208,
+      "learning_rate": 3.881446751507033e-05,
+      "loss": 0.8286,
+      "step": 1000
+    },
+    {
+      "epoch": 0.9267631103074141,
+      "grad_norm": 1.7240828275680542,
+      "learning_rate": 3.839584728734092e-05,
+      "loss": 0.8361,
+      "step": 1025
+    },
+    {
+      "epoch": 0.9493670886075949,
+      "grad_norm": 12.430205345153809,
+      "learning_rate": 3.797722705961152e-05,
+      "loss": 0.8154,
+      "step": 1050
+    },
+    {
+      "epoch": 0.9719710669077758,
+      "grad_norm": 2.2587053775787354,
+      "learning_rate": 3.755860683188212e-05,
+      "loss": 0.7517,
+      "step": 1075
+    },
+    {
+      "epoch": 0.9945750452079566,
+      "grad_norm": 4.7276105880737305,
+      "learning_rate": 3.7139986604152716e-05,
+      "loss": 0.7314,
+      "step": 1100
+    },
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.8646904135787712,
+      "eval_f1_macro": 0.7969114035222423,
+      "eval_f1_micro": 0.8646904135787712,
+      "eval_f1_weighted": 0.8686677177148115,
+      "eval_loss": 0.474561870098114,
+      "eval_precision_macro": 0.7463296033587281,
+      "eval_precision_micro": 0.8646904135787712,
+      "eval_precision_weighted": 0.8811279472143232,
+      "eval_recall_macro": 0.8754275642409685,
+      "eval_recall_micro": 0.8646904135787712,
+      "eval_recall_weighted": 0.8646904135787712,
+      "eval_runtime": 684.5188,
+      "eval_samples_per_second": 6.111,
+      "eval_steps_per_second": 0.383,
+      "step": 1106
+    },
+    {
+      "epoch": 1.0171790235081375,
+      "grad_norm": 4.729485988616943,
+      "learning_rate": 3.672136637642331e-05,
+      "loss": 0.7628,
+      "step": 1125
+    },
+    {
+      "epoch": 1.0397830018083183,
+      "grad_norm": 13.282486915588379,
+      "learning_rate": 3.63027461486939e-05,
+      "loss": 0.7394,
+      "step": 1150
+    },
+    {
+      "epoch": 1.062386980108499,
+      "grad_norm": 9.316232681274414,
+      "learning_rate": 3.58841259209645e-05,
+      "loss": 0.677,
+      "step": 1175
+    },
+    {
+      "epoch": 1.0849909584086799,
+      "grad_norm": 4.590908050537109,
+      "learning_rate": 3.54655056932351e-05,
+      "loss": 0.9049,
+      "step": 1200
+    },
+    {
+      "epoch": 1.1075949367088607,
+      "grad_norm": 7.4369988441467285,
+      "learning_rate": 3.5046885465505696e-05,
+      "loss": 0.8201,
+      "step": 1225
+    },
+    {
+      "epoch": 1.1301989150090417,
+      "grad_norm": 46.419105529785156,
+      "learning_rate": 3.462826523777629e-05,
+      "loss": 0.7825,
+      "step": 1250
+    },
+    {
+      "epoch": 1.1528028933092225,
+      "grad_norm": 11.992456436157227,
+      "learning_rate": 3.420964501004689e-05,
+      "loss": 0.6292,
+      "step": 1275
+    },
+    {
+      "epoch": 1.1754068716094033,
+      "grad_norm": 5.902411460876465,
+      "learning_rate": 3.379102478231748e-05,
+      "loss": 0.7238,
+      "step": 1300
+    },
+    {
+      "epoch": 1.198010849909584,
+      "grad_norm": 0.5739479660987854,
+      "learning_rate": 3.3372404554588077e-05,
+      "loss": 0.6716,
+      "step": 1325
+    },
+    {
+      "epoch": 1.2206148282097649,
+      "grad_norm": 39.53816604614258,
+      "learning_rate": 3.295378432685868e-05,
+      "loss": 0.9233,
+      "step": 1350
+    },
+    {
+      "epoch": 1.2432188065099457,
+      "grad_norm": 6.763810157775879,
+      "learning_rate": 3.253516409912927e-05,
+      "loss": 0.7302,
+      "step": 1375
+    },
+    {
+      "epoch": 1.2658227848101267,
+      "grad_norm": 13.701122283935547,
+      "learning_rate": 3.211654387139987e-05,
+      "loss": 0.7074,
+      "step": 1400
+    },
+    {
+      "epoch": 1.2884267631103075,
+      "grad_norm": 3.521284580230713,
+      "learning_rate": 3.1697923643670464e-05,
+      "loss": 0.7279,
+      "step": 1425
+    },
+    {
+      "epoch": 1.3110307414104883,
+      "grad_norm": 1.2048885822296143,
+      "learning_rate": 3.127930341594106e-05,
+      "loss": 0.6119,
+      "step": 1450
+    },
+    {
+      "epoch": 1.333634719710669,
+      "grad_norm": 1.5905373096466064,
+      "learning_rate": 3.086068318821165e-05,
+      "loss": 0.639,
+      "step": 1475
+    },
+    {
+      "epoch": 1.3562386980108498,
+      "grad_norm": 3.3090178966522217,
+      "learning_rate": 3.0442062960482254e-05,
+      "loss": 0.7074,
+      "step": 1500
+    },
+    {
+      "epoch": 1.3788426763110309,
+      "grad_norm": 1.7795202732086182,
+      "learning_rate": 3.002344273275285e-05,
+      "loss": 0.6383,
+      "step": 1525
+    },
+    {
+      "epoch": 1.4014466546112117,
+      "grad_norm": 10.706816673278809,
+      "learning_rate": 2.9604822505023444e-05,
+      "loss": 0.7385,
+      "step": 1550
+    },
+    {
+      "epoch": 1.4240506329113924,
+      "grad_norm": 11.373717308044434,
+      "learning_rate": 2.918620227729404e-05,
+      "loss": 0.7328,
+      "step": 1575
+    },
+    {
+      "epoch": 1.4466546112115732,
+      "grad_norm": 1.1606653928756714,
+      "learning_rate": 2.8767582049564634e-05,
+      "loss": 0.7943,
+      "step": 1600
+    },
+    {
+      "epoch": 1.469258589511754,
+      "grad_norm": 4.997502326965332,
+      "learning_rate": 2.8348961821835234e-05,
+      "loss": 0.7762,
+      "step": 1625
+    },
+    {
+      "epoch": 1.4918625678119348,
+      "grad_norm": 10.411747932434082,
+      "learning_rate": 2.793034159410583e-05,
+      "loss": 0.6818,
+      "step": 1650
+    },
+    {
+      "epoch": 1.5144665461121156,
+      "grad_norm": 1.0002527236938477,
+      "learning_rate": 2.7511721366376424e-05,
+      "loss": 0.4924,
+      "step": 1675
+    },
+    {
+      "epoch": 1.5370705244122966,
+      "grad_norm": 1.6328582763671875,
+      "learning_rate": 2.709310113864702e-05,
+      "loss": 0.7116,
+      "step": 1700
+    },
+    {
+      "epoch": 1.5596745027124774,
+      "grad_norm": 3.9850947856903076,
+      "learning_rate": 2.6674480910917614e-05,
+      "loss": 0.7846,
+      "step": 1725
+    },
+    {
+      "epoch": 1.5822784810126582,
+      "grad_norm": 12.702369689941406,
+      "learning_rate": 2.625586068318821e-05,
+      "loss": 0.6727,
+      "step": 1750
+    },
+    {
+      "epoch": 1.604882459312839,
+      "grad_norm": 22.720844268798828,
+      "learning_rate": 2.583724045545881e-05,
+      "loss": 0.6354,
+      "step": 1775
+    },
+    {
+      "epoch": 1.6274864376130198,
+      "grad_norm": 7.914674282073975,
+      "learning_rate": 2.5418620227729404e-05,
+      "loss": 0.8122,
+      "step": 1800
+    },
+    {
+      "epoch": 1.6500904159132008,
+      "grad_norm": 10.155131340026855,
+      "learning_rate": 2.5e-05,
+      "loss": 0.5847,
+      "step": 1825
+    },
+    {
+      "epoch": 1.6726943942133814,
+      "grad_norm": 4.096177577972412,
+      "learning_rate": 2.4581379772270598e-05,
+      "loss": 0.6681,
+      "step": 1850
+    },
+    {
+      "epoch": 1.6952983725135624,
+      "grad_norm": 1.1155363321304321,
+      "learning_rate": 2.4162759544541195e-05,
+      "loss": 0.5517,
+      "step": 1875
+    },
+    {
+      "epoch": 1.7179023508137432,
+      "grad_norm": 0.886872410774231,
+      "learning_rate": 2.3744139316811788e-05,
+      "loss": 0.6529,
+      "step": 1900
+    },
+    {
+      "epoch": 1.740506329113924,
+      "grad_norm": 45.21336364746094,
+      "learning_rate": 2.3325519089082385e-05,
+      "loss": 0.7317,
+      "step": 1925
+    },
+    {
+      "epoch": 1.763110307414105,
+      "grad_norm": 2.183527946472168,
+      "learning_rate": 2.290689886135298e-05,
+      "loss": 0.5836,
+      "step": 1950
+    },
+    {
+      "epoch": 1.7857142857142856,
+      "grad_norm": 9.820974349975586,
+      "learning_rate": 2.2488278633623578e-05,
+      "loss": 0.717,
+      "step": 1975
+    },
+    {
+      "epoch": 1.8083182640144666,
+      "grad_norm": 2.521716594696045,
+      "learning_rate": 2.2069658405894175e-05,
+      "loss": 0.665,
+      "step": 2000
+    },
+    {
+      "epoch": 1.8309222423146474,
+      "grad_norm": 43.333824157714844,
+      "learning_rate": 2.1651038178164772e-05,
+      "loss": 0.4805,
+      "step": 2025
+    },
+    {
+      "epoch": 1.8535262206148282,
+      "grad_norm": 1.851754069328308,
+      "learning_rate": 2.1232417950435365e-05,
+      "loss": 0.6131,
+      "step": 2050
+    },
+    {
+      "epoch": 1.8761301989150092,
+      "grad_norm": 1.0132567882537842,
+      "learning_rate": 2.0813797722705962e-05,
+      "loss": 0.6625,
+      "step": 2075
+    },
+    {
+      "epoch": 1.8987341772151898,
+      "grad_norm": 18.15288543701172,
+      "learning_rate": 2.039517749497656e-05,
+      "loss": 0.692,
+      "step": 2100
+    },
+    {
+      "epoch": 1.9213381555153708,
+      "grad_norm": 2.7393548488616943,
+      "learning_rate": 1.9976557267247152e-05,
+      "loss": 0.8157,
+      "step": 2125
+    },
+    {
+      "epoch": 1.9439421338155516,
+      "grad_norm": 2.785061836242676,
+      "learning_rate": 1.9557937039517752e-05,
+      "loss": 0.6455,
+      "step": 2150
+    },
+    {
+      "epoch": 1.9665461121157324,
+      "grad_norm": 7.032905578613281,
+      "learning_rate": 1.9139316811788345e-05,
+      "loss": 0.673,
+      "step": 2175
+    },
+    {
+      "epoch": 1.9891500904159132,
+      "grad_norm": 6.695957660675049,
+      "learning_rate": 1.8720696584058942e-05,
+      "loss": 0.6465,
+      "step": 2200
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.8864451350705236,
+      "eval_f1_macro": 0.8559865482684758,
+      "eval_f1_micro": 0.8864451350705236,
+      "eval_f1_weighted": 0.8885254655749029,
+      "eval_loss": 0.3843747675418854,
+      "eval_precision_macro": 0.8270066883752536,
+      "eval_precision_micro": 0.8864451350705236,
+      "eval_precision_weighted": 0.8971130501570121,
+      "eval_recall_macro": 0.8950094171847649,
+      "eval_recall_micro": 0.8864451350705236,
+      "eval_recall_weighted": 0.8864451350705236,
+      "eval_runtime": 708.9221,
+      "eval_samples_per_second": 5.901,
+      "eval_steps_per_second": 0.37,
+      "step": 2212
+    },
+    {
+      "epoch": 2.011754068716094,
+      "grad_norm": 0.2900655269622803,
+      "learning_rate": 1.830207635632954e-05,
+      "loss": 0.4926,
+      "step": 2225
+    },
+    {
+      "epoch": 2.034358047016275,
+      "grad_norm": 0.25579121708869934,
+      "learning_rate": 1.7883456128600136e-05,
+      "loss": 0.5601,
+      "step": 2250
+    },
+    {
+      "epoch": 2.0569620253164556,
+      "grad_norm": 10.494261741638184,
+      "learning_rate": 1.746483590087073e-05,
+      "loss": 0.4779,
+      "step": 2275
+    },
+    {
+      "epoch": 2.0795660036166366,
+      "grad_norm": 2.495044231414795,
+      "learning_rate": 1.704621567314133e-05,
+      "loss": 0.6575,
+      "step": 2300
+    },
+    {
+      "epoch": 2.102169981916817,
+      "grad_norm": 19.166954040527344,
+      "learning_rate": 1.6627595445411922e-05,
+      "loss": 0.5641,
+      "step": 2325
+    },
+    {
+      "epoch": 2.124773960216998,
+      "grad_norm": 6.6829915046691895,
+      "learning_rate": 1.620897521768252e-05,
+      "loss": 0.6266,
+      "step": 2350
+    },
+    {
+      "epoch": 2.147377938517179,
+      "grad_norm": 18.80038070678711,
+      "learning_rate": 1.5790354989953116e-05,
+      "loss": 0.6087,
+      "step": 2375
+    },
+    {
+      "epoch": 2.1699819168173597,
+      "grad_norm": 32.67726135253906,
+      "learning_rate": 1.537173476222371e-05,
+      "loss": 0.8013,
+      "step": 2400
+    },
+    {
+      "epoch": 2.1925858951175408,
+      "grad_norm": 4.437242031097412,
+      "learning_rate": 1.4953114534494308e-05,
+      "loss": 0.6542,
+      "step": 2425
+    },
+    {
+      "epoch": 2.2151898734177213,
+      "grad_norm": 7.463759899139404,
+      "learning_rate": 1.4534494306764904e-05,
+      "loss": 0.5717,
+      "step": 2450
+    },
+    {
+      "epoch": 2.2377938517179023,
+      "grad_norm": 4.608203411102295,
+      "learning_rate": 1.41158740790355e-05,
+      "loss": 0.5789,
+      "step": 2475
+    },
+    {
+      "epoch": 2.2603978300180834,
+      "grad_norm": 1.7395381927490234,
+      "learning_rate": 1.3697253851306096e-05,
+      "loss": 0.5181,
+      "step": 2500
+    },
+    {
+      "epoch": 2.283001808318264,
+      "grad_norm": 21.39842414855957,
+      "learning_rate": 1.3278633623576691e-05,
+      "loss": 0.5867,
+      "step": 2525
+    },
+    {
+      "epoch": 2.305605786618445,
+      "grad_norm": 15.271064758300781,
+      "learning_rate": 1.2860013395847286e-05,
+      "loss": 0.62,
+      "step": 2550
+    },
+    {
+      "epoch": 2.3282097649186255,
+      "grad_norm": 1.706192135810852,
+      "learning_rate": 1.2441393168117885e-05,
+      "loss": 0.6125,
+      "step": 2575
+    },
+    {
+      "epoch": 2.3508137432188065,
+      "grad_norm": 0.2807926833629608,
+      "learning_rate": 1.202277294038848e-05,
+      "loss": 0.6651,
+      "step": 2600
+    },
+    {
+      "epoch": 2.3734177215189876,
+      "grad_norm": 1.556008219718933,
+      "learning_rate": 1.1604152712659077e-05,
+      "loss": 0.4651,
+      "step": 2625
+    },
+    {
+      "epoch": 2.396021699819168,
+      "grad_norm": 13.534441947937012,
+      "learning_rate": 1.1185532484929673e-05,
+      "loss": 0.6178,
+      "step": 2650
+    },
+    {
+      "epoch": 2.418625678119349,
+      "grad_norm": 29.2789249420166,
+      "learning_rate": 1.0766912257200268e-05,
+      "loss": 0.5291,
+      "step": 2675
+    },
+    {
+      "epoch": 2.4412296564195297,
+      "grad_norm": 37.51542663574219,
+      "learning_rate": 1.0348292029470865e-05,
+      "loss": 0.5774,
+      "step": 2700
+    },
+    {
+      "epoch": 2.4638336347197107,
+      "grad_norm": 0.8940380215644836,
+      "learning_rate": 9.92967180174146e-06,
+      "loss": 0.6371,
+      "step": 2725
+    },
+    {
+      "epoch": 2.4864376130198913,
+      "grad_norm": 0.25459304451942444,
+      "learning_rate": 9.511051574012057e-06,
+      "loss": 0.5044,
+      "step": 2750
+    },
+    {
+      "epoch": 2.5090415913200723,
+      "grad_norm": 2.767826795578003,
+      "learning_rate": 9.092431346282652e-06,
+      "loss": 0.4203,
+      "step": 2775
+    },
+    {
+      "epoch": 2.5316455696202533,
+      "grad_norm": 1.5824614763259888,
+      "learning_rate": 8.673811118553249e-06,
+      "loss": 0.6947,
+      "step": 2800
+    },
+    {
+      "epoch": 2.554249547920434,
+      "grad_norm": 1.1196787357330322,
+      "learning_rate": 8.255190890823845e-06,
+      "loss": 0.6688,
+      "step": 2825
+    },
+    {
+      "epoch": 2.576853526220615,
+      "grad_norm": 0.9682297706604004,
+      "learning_rate": 7.83657066309444e-06,
+      "loss": 0.4147,
+      "step": 2850
+    },
+    {
+      "epoch": 2.599457504520796,
+      "grad_norm": 6.9166579246521,
+      "learning_rate": 7.417950435365037e-06,
+      "loss": 0.6114,
+      "step": 2875
+    },
+    {
+      "epoch": 2.6220614828209765,
+      "grad_norm": 2.9561591148376465,
+      "learning_rate": 6.999330207635633e-06,
+      "loss": 0.6869,
+      "step": 2900
+    },
+    {
+      "epoch": 2.644665461121157,
+      "grad_norm": 19.65010643005371,
+      "learning_rate": 6.58070997990623e-06,
+      "loss": 0.5901,
+      "step": 2925
+    },
+    {
+      "epoch": 2.667269439421338,
+      "grad_norm": 10.092483520507812,
+      "learning_rate": 6.162089752176826e-06,
+      "loss": 0.7184,
+      "step": 2950
+    },
+    {
+      "epoch": 2.689873417721519,
+      "grad_norm": 5.880400657653809,
+      "learning_rate": 5.7434695244474216e-06,
+      "loss": 0.4771,
+      "step": 2975
+    },
+    {
+      "epoch": 2.7124773960216997,
+      "grad_norm": 0.9661037921905518,
+      "learning_rate": 5.3248492967180175e-06,
+      "loss": 0.4992,
+      "step": 3000
+    },
+    {
+      "epoch": 2.7350813743218807,
+      "grad_norm": 20.191679000854492,
+      "learning_rate": 4.906229068988614e-06,
+      "loss": 0.6437,
+      "step": 3025
+    },
+    {
+      "epoch": 2.7576853526220617,
+      "grad_norm": 35.344791412353516,
+      "learning_rate": 4.487608841259209e-06,
+      "loss": 0.5925,
+      "step": 3050
+    },
+    {
+      "epoch": 2.7802893309222423,
+      "grad_norm": 5.644791126251221,
+      "learning_rate": 4.068988613529806e-06,
+      "loss": 0.574,
+      "step": 3075
+    },
+    {
+      "epoch": 2.8028933092224233,
+      "grad_norm": 8.687640190124512,
+      "learning_rate": 3.650368385800402e-06,
+      "loss": 0.5918,
+      "step": 3100
+    },
+    {
+      "epoch": 2.825497287522604,
+      "grad_norm": 19.680980682373047,
+      "learning_rate": 3.231748158070998e-06,
+      "loss": 0.6377,
+      "step": 3125
+    },
+    {
+      "epoch": 2.848101265822785,
+      "grad_norm": 0.16842712461948395,
+      "learning_rate": 2.813127930341594e-06,
+      "loss": 0.5109,
+      "step": 3150
+    },
+    {
+      "epoch": 2.8707052441229655,
+      "grad_norm": 1.1660349369049072,
+      "learning_rate": 2.3945077026121904e-06,
+      "loss": 0.4715,
+      "step": 3175
+    },
+    {
+      "epoch": 2.8933092224231465,
+      "grad_norm": 7.041762351989746,
+      "learning_rate": 1.9758874748827863e-06,
+      "loss": 0.5119,
+      "step": 3200
+    },
+    {
+      "epoch": 2.9159132007233275,
+      "grad_norm": 27.925931930541992,
+      "learning_rate": 1.5572672471533826e-06,
+      "loss": 0.5079,
+      "step": 3225
+    },
+    {
+      "epoch": 2.938517179023508,
+      "grad_norm": 1.633520483970642,
+      "learning_rate": 1.1386470194239785e-06,
+      "loss": 0.5943,
+      "step": 3250
+    },
+    {
+      "epoch": 2.961121157323689,
+      "grad_norm": 9.762001991271973,
+      "learning_rate": 7.200267916945747e-07,
+      "loss": 0.5058,
+      "step": 3275
+    },
+    {
+      "epoch": 2.9837251356238697,
+      "grad_norm": 23.335742950439453,
+      "learning_rate": 3.014065639651708e-07,
+      "loss": 0.3955,
+      "step": 3300
+    },
+    {
+      "epoch": 3.0,
+      "eval_accuracy": 0.9077217308152044,
+      "eval_f1_macro": 0.876649943334319,
+      "eval_f1_micro": 0.9077217308152044,
+      "eval_f1_weighted": 0.9087694078887676,
+      "eval_loss": 0.3279833495616913,
+      "eval_precision_macro": 0.8488349060784007,
+      "eval_precision_micro": 0.9077217308152044,
+      "eval_precision_weighted": 0.9121960695781595,
+      "eval_recall_macro": 0.9108354827796887,
+      "eval_recall_micro": 0.9077217308152044,
+      "eval_recall_weighted": 0.9077217308152044,
+      "eval_runtime": 724.2824,
+      "eval_samples_per_second": 5.775,
+      "eval_steps_per_second": 0.362,
+      "step": 3318
+    }
+  ],
+  "logging_steps": 25,
+  "max_steps": 3318,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "EarlyStoppingCallback": {
+      "args": {
+        "early_stopping_patience": 5,
+        "early_stopping_threshold": 0.01
+      },
+      "attributes": {
+        "early_stopping_patience_counter": 0
+      }
+    },
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 1745080968172032.0,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-3318/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:17e5f83b009843f296ef4182ec608574cca58674a944f1cb348ab1701e2ab785
+size 5176

config.json ADDED Viewed

	@@ -0,0 +1,46 @@

+{
+  "_name_or_path": "vinai/phobert-base-v2",
+  "_num_labels": 6,
+  "architectures": [
+    "RobertaForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "bos_token_id": 0,
+  "classifier_dropout": null,
+  "eos_token_id": 2,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "2733522",
+    "1": "2733534",
+    "2": "2733540",
+    "3": "2733546",
+    "4": "2733552",
+    "5": "2733570"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "2733522": 0,
+    "2733534": 1,
+    "2733540": 2,
+    "2733546": 3,
+    "2733552": 4,
+    "2733570": 5
+  },
+  "layer_norm_eps": 1e-05,
+  "max_position_embeddings": 258,
+  "model_type": "roberta",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 1,
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "tokenizer_class": "PhobertTokenizer",
+  "torch_dtype": "float32",
+  "transformers_version": "4.42.2",
+  "type_vocab_size": 1,
+  "use_cache": true,
+  "vocab_size": 64001
+}

model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6a7f3216c6c1b6968f4f4281cf1783c8a31a1b4bfab39a5c662e9187b46dd9a4
+size 540035688

runs/Jul19_08-08-26_r-daccuong2002-runmay3-jzutjz7y-f713d-ewa9l/events.out.tfevents.1721376507.r-daccuong2002-runmay3-jzutjz7y-f713d-ewa9l.98.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c2557800a6e5455865380571ab102aabe12ce6f4e19a0b1cbad949eb0ec6b07f
-size 33907

 version https://git-lfs.github.com/spec/v1
+oid sha256:0ea7075d60e5d8c86a82e10ce18fdbb1621203473819b2990d6b7b4747daa8dd
+size 35938

runs/Jul19_08-08-26_r-daccuong2002-runmay3-jzutjz7y-f713d-ewa9l/events.out.tfevents.1721396576.r-daccuong2002-runmay3-jzutjz7y-f713d-ewa9l.98.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f5043cb141674666e4c7ce9d902bc524d80589143e16617006468bee1e681bd5
+size 921

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+  "bos_token": "<s>",
+  "cls_token": "<s>",
+  "eos_token": "</s>",
+  "mask_token": "<mask>",
+  "pad_token": "<pad>",
+  "sep_token": "</s>",
+  "unk_token": "<unk>"
+}

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,54 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "<pad>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "3": {
+      "content": "<unk>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "64000": {
+      "content": "<mask>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "bos_token": "<s>",
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "<s>",
+  "eos_token": "</s>",
+  "mask_token": "<mask>",
+  "model_max_length": 1000000000000000019884624838656,
+  "pad_token": "<pad>",
+  "sep_token": "</s>",
+  "tokenizer_class": "PhobertTokenizer",
+  "unk_token": "<unk>"
+}

training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:17e5f83b009843f296ef4182ec608574cca58674a944f1cb348ab1701e2ab785
+size 5176

training_params.json ADDED Viewed

	@@ -0,0 +1,30 @@

+{
+    "data_path": "PhoBert-MultiLabel-KMeans/autotrain-data",
+    "model": "vinai/phobert-base-v2",
+    "lr": 5e-05,
+    "epochs": 3,
+    "max_seq_length": 128,
+    "batch_size": 8,
+    "warmup_ratio": 0.1,
+    "gradient_accumulation": 1,
+    "optimizer": "adamw_torch",
+    "scheduler": "linear",
+    "weight_decay": 0.0,
+    "max_grad_norm": 1.0,
+    "seed": 42,
+    "train_split": "train",
+    "valid_split": "validation",
+    "text_column": "autotrain_text",
+    "target_column": "autotrain_label",
+    "logging_steps": -1,
+    "project_name": "PhoBert-MultiLabel-KMeans",
+    "auto_find_batch_size": false,
+    "mixed_precision": "fp16",
+    "save_total_limit": 1,
+    "push_to_hub": true,
+    "eval_strategy": "epoch",
+    "username": "daccuong2002",
+    "log": "tensorboard",
+    "early_stopping_patience": 5,
+    "early_stopping_threshold": 0.01
+}

vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff