ana-grassmann committed on
Commit
da94d09
1 Parent(s): 98af408

Training in progress, epoch 3

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c94bab8bfe5a92c902d1f1d8b917b3d93ab8a362ccae74283bdbc734d8a71f75
3
  size 437958648
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2b3893bc5c1641a53328a59ad528b6ad791ffce6b15bae27923c6df32b6e355
3
  size 437958648
run-1/checkpoint-416/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:70a5b54d3a4c3e347067d556c03039c86bdd4c26a269820cbb61f4070d7c464a
3
  size 437958648
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2b3893bc5c1641a53328a59ad528b6ad791ffce6b15bae27923c6df32b6e355
3
  size 437958648
run-1/checkpoint-416/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2e71d18a10ac192119328a5a3a626b0de77b3a5f16dae3ecf545fd0fcfc8e04e
3
  size 876038394
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d4163b58ed0781e9f4ce6458eaf24a1b4186a707539bc5ed2c7da5d0d74c7ee
3
  size 876038394
run-1/checkpoint-416/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9c690fa67a0ceb6c4695472a312dafbfeb413d5c06e12d40e9597a7c5b52c4a2
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b706c7fbc4a0983687f5222b1b6a989d9602a44e64f9f99e1f0554195bd2e2ce
3
  size 14244
run-1/checkpoint-416/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f68652183e32efef3b3da15b6778d033ddb2a871b87f23d3c1e3e0c51356089d
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d790a67d9e999d13f888af660baaed57194a30755bfcd0c6c4f98e7622cfa962
3
  size 1064
run-1/checkpoint-416/trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 0.9801677651288196,
3
- "best_model_checkpoint": "bert-base-uncased-finetuned-spam-real/run-1/checkpoint-416",
4
  "epoch": 3.9808612440191387,
5
  "eval_steps": 500,
6
  "global_step": 416,
@@ -10,38 +10,38 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "eval_accuracy": 0.9651887357699221,
14
- "eval_loss": 0.1194479838013649,
15
- "eval_runtime": 512.5403,
16
- "eval_samples_per_second": 32.563,
17
- "eval_steps_per_second": 4.072,
18
  "step": 104
19
  },
20
  {
21
  "epoch": 2.0,
22
- "eval_accuracy": 0.9775314559616537,
23
- "eval_loss": 0.07069126516580582,
24
- "eval_runtime": 511.5618,
25
- "eval_samples_per_second": 32.626,
26
- "eval_steps_per_second": 4.08,
27
  "step": 209
28
  },
29
  {
30
  "epoch": 3.0,
31
- "eval_accuracy": 0.9791491911324146,
32
- "eval_loss": 0.08672985434532166,
33
- "eval_runtime": 540.0361,
34
- "eval_samples_per_second": 30.905,
35
- "eval_steps_per_second": 3.865,
36
  "step": 313
37
  },
38
  {
39
  "epoch": 3.98,
40
- "eval_accuracy": 0.9801677651288196,
41
- "eval_loss": 0.08871355652809143,
42
- "eval_runtime": 507.4158,
43
- "eval_samples_per_second": 32.892,
44
- "eval_steps_per_second": 4.113,
45
  "step": 416
46
  }
47
  ],
@@ -54,9 +54,9 @@
54
  "train_batch_size": 16,
55
  "trial_name": null,
56
  "trial_params": {
57
- "learning_rate": 3.7633342814387334e-05,
58
  "num_train_epochs": 4,
59
  "per_device_train_batch_size": 16,
60
- "seed": 23
61
  }
62
  }
 
1
  {
2
+ "best_metric": 0.9815458358298382,
3
+ "best_model_checkpoint": "bert-base-uncased-finetuned-spam-real/run-1/checkpoint-313",
4
  "epoch": 3.9808612440191387,
5
  "eval_steps": 500,
6
  "global_step": 416,
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "eval_accuracy": 0.9563211503894548,
14
+ "eval_loss": 0.12384964525699615,
15
+ "eval_runtime": 129.3277,
16
+ "eval_samples_per_second": 129.052,
17
+ "eval_steps_per_second": 16.137,
18
  "step": 104
19
  },
20
  {
21
  "epoch": 2.0,
22
+ "eval_accuracy": 0.9778909526662672,
23
+ "eval_loss": 0.08387715369462967,
24
+ "eval_runtime": 129.286,
25
+ "eval_samples_per_second": 129.094,
26
+ "eval_steps_per_second": 16.143,
27
  "step": 209
28
  },
29
  {
30
  "epoch": 3.0,
31
+ "eval_accuracy": 0.9815458358298382,
32
+ "eval_loss": 0.0810588002204895,
33
+ "eval_runtime": 129.453,
34
+ "eval_samples_per_second": 128.927,
35
+ "eval_steps_per_second": 16.122,
36
  "step": 313
37
  },
38
  {
39
  "epoch": 3.98,
40
+ "eval_accuracy": 0.9811264230077891,
41
+ "eval_loss": 0.08734230697154999,
42
+ "eval_runtime": 129.3665,
43
+ "eval_samples_per_second": 129.013,
44
+ "eval_steps_per_second": 16.132,
45
  "step": 416
46
  }
47
  ],
 
54
  "train_batch_size": 16,
55
  "trial_name": null,
56
  "trial_params": {
57
+ "learning_rate": 3.8529031222986405e-05,
58
  "num_train_epochs": 4,
59
  "per_device_train_batch_size": 16,
60
+ "seed": 15
61
  }
62
  }
run-1/checkpoint-416/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1e70c6e682ff4679414666a12647b55c4e70bdccf653d9bd96a7a5f7ed2f6901
3
  size 4920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce75d5540cb596dd16321fe0e65b087c9f94fe8fe674dc64d250843c11bb8d7e
3
  size 4920
runs/Apr14_18-31-48_6ec9497f7a76/events.out.tfevents.1713119999.6ec9497f7a76.2144.1 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a51bff3b45a46812e84d3de1114d5efab85011d29e109c2ab252699ad5074af2
3
- size 5602
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8ca57b51faba3411d9ade1d1eca2c05f5a120520b4a53d12405a619b8732526
3
+ size 6279