cruiser committed on
Commit
fad9e3b
1 Parent(s): 895c12e

Training in progress, epoch 2

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:558fc6c74444158434ea7e5a2abbd7e4bfc87c1409f9ad5653126032a8ce79a6
3
  size 535707205
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e02a2a46a6028315105719ef1e304b4cee34b75184f0950cbdb412fd507ad0d6
3
  size 535707205
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:87175da7d5baa1888c80066cbd1b9d34c063f51f5205572230cbfdac03bb57f6
3
  size 267858605
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02b16c32b9d60477848a19c4c437f69a66f810ff9f81f01989f2ba6b664912fc
3
  size 267858605
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1afa4fb390fed62209a33ec31502a83421450b5e725ed87b9f6a0e5a6fe43e4a
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec413b9ccb2e7bf299f05612d1ea984d788cd968b214a3f7972297c05d91216b
3
  size 14575
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8887e02a63197212eb08e6268a00af8c32453672a22c577dcf1de8bc5e2b976a
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7524676a9651ec8c0d685a583a2fce1a7529148810db182eac434accbd0d75cb
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 1.8788982629776,
3
- "best_model_checkpoint": "distilbert_weight_decay_final_metrics/checkpoint-1718",
4
- "epoch": 1.0,
5
- "global_step": 1718,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -34,11 +34,39 @@
34
  "eval_samples_per_second": 437.119,
35
  "eval_steps_per_second": 27.335,
36
  "step": 1718
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
37
  }
38
  ],
39
  "max_steps": 34360,
40
  "num_train_epochs": 20,
41
- "total_flos": 782117510345820.0,
42
  "trial_name": null,
43
  "trial_params": null
44
  }
 
1
  {
2
+ "best_metric": 1.7166885137557983,
3
+ "best_model_checkpoint": "distilbert_weight_decay_final_metrics/checkpoint-3436",
4
+ "epoch": 2.0,
5
+ "global_step": 3436,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
34
  "eval_samples_per_second": 437.119,
35
  "eval_steps_per_second": 27.335,
36
  "step": 1718
37
+ },
38
+ {
39
+ "epoch": 1.16,
40
+ "learning_rate": 1.8835855646100117e-05,
41
+ "loss": 0.0387,
42
+ "step": 2000
43
+ },
44
+ {
45
+ "epoch": 1.46,
46
+ "learning_rate": 1.8544819557625148e-05,
47
+ "loss": 0.0449,
48
+ "step": 2500
49
+ },
50
+ {
51
+ "epoch": 1.75,
52
+ "learning_rate": 1.825378346915018e-05,
53
+ "loss": 0.0541,
54
+ "step": 3000
55
+ },
56
+ {
57
+ "epoch": 2.0,
58
+ "eval_accuracy": 0.7744765138653085,
59
+ "eval_f1": 0.778056670029498,
60
+ "eval_loss": 1.7166885137557983,
61
+ "eval_runtime": 8.1001,
62
+ "eval_samples_per_second": 436.288,
63
+ "eval_steps_per_second": 27.283,
64
+ "step": 3436
65
  }
66
  ],
67
  "max_steps": 34360,
68
  "num_train_epochs": 20,
69
+ "total_flos": 1564235020691640.0,
70
  "trial_name": null,
71
  "trial_params": null
72
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:87175da7d5baa1888c80066cbd1b9d34c063f51f5205572230cbfdac03bb57f6
3
  size 267858605
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02b16c32b9d60477848a19c4c437f69a66f810ff9f81f01989f2ba6b664912fc
3
  size 267858605
runs/May01_06-16-39_af1ffd0a72ec/events.out.tfevents.1682921804.af1ffd0a72ec.975.12 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:35b858d16e7e1ee6f802bbf7937d9ef1d6f8a782d4582bb785862815821d379c
3
- size 5027
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:892bf393fe72c8f7e6e594606d26c338b7c07340da58d54a7449d7822afb3b10
3
+ size 5867