usamaaleem99tech commited on
Commit
5769f60
1 Parent(s): 320996e

Training in progress, epoch 0

Browse files
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 9.6,
3
- "total_flos": 5.876119984612147e+16,
4
- "train_loss": 0.3996999263763428,
5
- "train_runtime": 229.426,
6
- "train_samples_per_second": 10.722,
7
- "train_steps_per_second": 0.262
8
  }
 
1
  {
2
+ "epoch": 8.89,
3
+ "total_flos": 5.786635923932774e+16,
4
+ "train_loss": 0.40318952401479086,
5
+ "train_runtime": 239.9675,
6
+ "train_samples_per_second": 10.876,
7
+ "train_steps_per_second": 0.25
8
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e18401ae79f0eb7980f71ec062b3dab0bd2d7a2e12d76c839c8151a1579228c9
3
  size 110397937
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e460638b4d529c4454281722190369db834fad322c2165720fc7bd2fe8c983f0
3
  size 110397937
runs/Jul19_18-55-35_d59d7adac7e1/events.out.tfevents.1689792946.d59d7adac7e1.10517.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1642621abf8512365c7bc99bdd1b0081aaef1b9b8dde72351cee2b4a226489bf
3
+ size 4832
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 9.6,
3
- "total_flos": 5.876119984612147e+16,
4
- "train_loss": 0.3996999263763428,
5
- "train_runtime": 229.426,
6
- "train_samples_per_second": 10.722,
7
- "train_steps_per_second": 0.262
8
  }
 
1
  {
2
+ "epoch": 8.89,
3
+ "total_flos": 5.786635923932774e+16,
4
+ "train_loss": 0.40318952401479086,
5
+ "train_runtime": 239.9675,
6
+ "train_samples_per_second": 10.876,
7
+ "train_steps_per_second": 0.25
8
  }
trainer_state.json CHANGED
@@ -1,151 +1,142 @@
1
  {
2
- "best_metric": 0.9545454545454546,
3
- "best_model_checkpoint": "segformer-class-classWeights-augmentation/checkpoint-31",
4
- "epoch": 9.6,
5
  "global_step": 60,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
- "epoch": 0.96,
12
- "eval_accuracy": 0.4772727272727273,
13
- "eval_loss": 0.9944368600845337,
14
- "eval_runtime": 1.008,
15
- "eval_samples_per_second": 43.653,
16
- "eval_steps_per_second": 4.961,
17
  "step": 6
18
  },
19
  {
20
- "epoch": 1.6,
21
  "learning_rate": 4.62962962962963e-05,
22
- "loss": 1.0159,
23
  "step": 10
24
  },
25
  {
26
- "epoch": 1.92,
27
- "eval_accuracy": 0.75,
28
- "eval_loss": 0.694824755191803,
29
- "eval_runtime": 0.9891,
30
- "eval_samples_per_second": 44.486,
31
- "eval_steps_per_second": 5.055,
32
- "step": 12
33
  },
34
  {
35
- "epoch": 2.88,
36
- "eval_accuracy": 0.9318181818181818,
37
- "eval_loss": 0.34167394042015076,
38
- "eval_runtime": 0.985,
39
- "eval_samples_per_second": 44.669,
40
- "eval_steps_per_second": 5.076,
41
- "step": 18
42
  },
43
  {
44
- "epoch": 3.2,
45
- "learning_rate": 3.7037037037037037e-05,
46
- "loss": 0.5444,
 
 
 
47
  "step": 20
48
  },
49
  {
50
  "epoch": 4.0,
51
- "eval_accuracy": 0.9090909090909091,
52
- "eval_loss": 0.26416999101638794,
53
- "eval_runtime": 1.3817,
54
- "eval_samples_per_second": 31.845,
55
- "eval_steps_per_second": 3.619,
56
- "step": 25
57
  },
58
  {
59
- "epoch": 4.8,
60
  "learning_rate": 2.777777777777778e-05,
61
- "loss": 0.2331,
62
  "step": 30
63
  },
64
  {
65
- "epoch": 4.96,
66
- "eval_accuracy": 0.9545454545454546,
67
- "eval_loss": 0.09864511340856552,
68
- "eval_runtime": 1.0085,
69
- "eval_samples_per_second": 43.627,
70
- "eval_steps_per_second": 4.958,
71
- "step": 31
72
  },
73
  {
74
- "epoch": 5.92,
75
- "eval_accuracy": 0.9545454545454546,
76
- "eval_loss": 0.17346793413162231,
77
- "eval_runtime": 1.0084,
78
- "eval_samples_per_second": 43.634,
79
- "eval_steps_per_second": 4.958,
80
- "step": 37
81
  },
82
  {
83
- "epoch": 6.4,
84
- "learning_rate": 1.8518518518518518e-05,
85
- "loss": 0.2596,
 
 
 
86
  "step": 40
87
  },
88
  {
89
- "epoch": 6.88,
90
- "eval_accuracy": 0.9545454545454546,
91
- "eval_loss": 0.1091495230793953,
92
- "eval_runtime": 1.383,
93
- "eval_samples_per_second": 31.815,
94
- "eval_steps_per_second": 3.615,
95
- "step": 43
96
  },
97
  {
98
- "epoch": 8.0,
99
  "learning_rate": 9.259259259259259e-06,
100
- "loss": 0.1737,
101
  "step": 50
102
  },
103
  {
104
  "epoch": 8.0,
105
- "eval_accuracy": 0.9545454545454546,
106
- "eval_loss": 0.0685076043009758,
107
- "eval_runtime": 1.013,
108
- "eval_samples_per_second": 43.435,
109
- "eval_steps_per_second": 4.936,
110
- "step": 50
111
- },
112
- {
113
- "epoch": 8.96,
114
- "eval_accuracy": 0.9545454545454546,
115
- "eval_loss": 0.09951713681221008,
116
- "eval_runtime": 1.0006,
117
- "eval_samples_per_second": 43.975,
118
- "eval_steps_per_second": 4.997,
119
- "step": 56
120
  },
121
  {
122
- "epoch": 9.6,
123
  "learning_rate": 0.0,
124
- "loss": 0.1716,
125
  "step": 60
126
  },
127
  {
128
- "epoch": 9.6,
129
- "eval_accuracy": 0.9545454545454546,
130
- "eval_loss": 0.09269092231988907,
131
- "eval_runtime": 1.0041,
132
- "eval_samples_per_second": 43.822,
133
- "eval_steps_per_second": 4.98,
134
  "step": 60
135
  },
136
  {
137
- "epoch": 9.6,
138
  "step": 60,
139
- "total_flos": 5.876119984612147e+16,
140
- "train_loss": 0.3996999263763428,
141
- "train_runtime": 229.426,
142
- "train_samples_per_second": 10.722,
143
- "train_steps_per_second": 0.262
144
  }
145
  ],
146
  "max_steps": 60,
147
  "num_train_epochs": 10,
148
- "total_flos": 5.876119984612147e+16,
149
  "trial_name": null,
150
  "trial_params": null
151
  }
 
1
  {
2
+ "best_metric": 0.9310344827586207,
3
+ "best_model_checkpoint": "segformer-class-classWeights-augmentation/checkpoint-40",
4
+ "epoch": 8.88888888888889,
5
  "global_step": 60,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
+ "epoch": 0.89,
12
+ "eval_accuracy": 0.5862068965517241,
13
+ "eval_loss": 1.0178804397583008,
14
+ "eval_runtime": 1.1426,
15
+ "eval_samples_per_second": 25.38,
16
+ "eval_steps_per_second": 2.626,
17
  "step": 6
18
  },
19
  {
20
+ "epoch": 1.48,
21
  "learning_rate": 4.62962962962963e-05,
22
+ "loss": 0.9897,
23
  "step": 10
24
  },
25
  {
26
+ "epoch": 1.93,
27
+ "eval_accuracy": 0.7241379310344828,
28
+ "eval_loss": 0.760027289390564,
29
+ "eval_runtime": 0.8084,
30
+ "eval_samples_per_second": 35.874,
31
+ "eval_steps_per_second": 3.711,
32
+ "step": 13
33
  },
34
  {
35
+ "epoch": 2.96,
36
+ "learning_rate": 3.7037037037037037e-05,
37
+ "loss": 0.5848,
38
+ "step": 20
 
 
 
39
  },
40
  {
41
+ "epoch": 2.96,
42
+ "eval_accuracy": 0.5862068965517241,
43
+ "eval_loss": 0.8368268609046936,
44
+ "eval_runtime": 1.6581,
45
+ "eval_samples_per_second": 17.49,
46
+ "eval_steps_per_second": 1.809,
47
  "step": 20
48
  },
49
  {
50
  "epoch": 4.0,
51
+ "eval_accuracy": 0.8620689655172413,
52
+ "eval_loss": 0.4708000719547272,
53
+ "eval_runtime": 0.8189,
54
+ "eval_samples_per_second": 35.414,
55
+ "eval_steps_per_second": 3.663,
56
+ "step": 27
57
  },
58
  {
59
+ "epoch": 4.44,
60
  "learning_rate": 2.777777777777778e-05,
61
+ "loss": 0.2747,
62
  "step": 30
63
  },
64
  {
65
+ "epoch": 4.89,
66
+ "eval_accuracy": 0.896551724137931,
67
+ "eval_loss": 0.37271812558174133,
68
+ "eval_runtime": 0.8067,
69
+ "eval_samples_per_second": 35.951,
70
+ "eval_steps_per_second": 3.719,
71
+ "step": 33
72
  },
73
  {
74
+ "epoch": 5.93,
75
+ "learning_rate": 1.8518518518518518e-05,
76
+ "loss": 0.2259,
77
+ "step": 40
 
 
 
78
  },
79
  {
80
+ "epoch": 5.93,
81
+ "eval_accuracy": 0.9310344827586207,
82
+ "eval_loss": 0.3100181221961975,
83
+ "eval_runtime": 1.1422,
84
+ "eval_samples_per_second": 25.389,
85
+ "eval_steps_per_second": 2.626,
86
  "step": 40
87
  },
88
  {
89
+ "epoch": 6.96,
90
+ "eval_accuracy": 0.9310344827586207,
91
+ "eval_loss": 0.22938820719718933,
92
+ "eval_runtime": 0.7944,
93
+ "eval_samples_per_second": 36.504,
94
+ "eval_steps_per_second": 3.776,
95
+ "step": 47
96
  },
97
  {
98
+ "epoch": 7.41,
99
  "learning_rate": 9.259259259259259e-06,
100
+ "loss": 0.1596,
101
  "step": 50
102
  },
103
  {
104
  "epoch": 8.0,
105
+ "eval_accuracy": 0.896551724137931,
106
+ "eval_loss": 0.26314061880111694,
107
+ "eval_runtime": 1.212,
108
+ "eval_samples_per_second": 23.927,
109
+ "eval_steps_per_second": 2.475,
110
+ "step": 54
 
 
 
 
 
 
 
 
 
111
  },
112
  {
113
+ "epoch": 8.89,
114
  "learning_rate": 0.0,
115
+ "loss": 0.1844,
116
  "step": 60
117
  },
118
  {
119
+ "epoch": 8.89,
120
+ "eval_accuracy": 0.9310344827586207,
121
+ "eval_loss": 0.26064130663871765,
122
+ "eval_runtime": 0.8176,
123
+ "eval_samples_per_second": 35.469,
124
+ "eval_steps_per_second": 3.669,
125
  "step": 60
126
  },
127
  {
128
+ "epoch": 8.89,
129
  "step": 60,
130
+ "total_flos": 5.786635923932774e+16,
131
+ "train_loss": 0.40318952401479086,
132
+ "train_runtime": 239.9675,
133
+ "train_samples_per_second": 10.876,
134
+ "train_steps_per_second": 0.25
135
  }
136
  ],
137
  "max_steps": 60,
138
  "num_train_epochs": 10,
139
+ "total_flos": 5.786635923932774e+16,
140
  "trial_name": null,
141
  "trial_params": null
142
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:81dc38e5245c5a8cf5460d3e360997b3861cc2a3b09ccf88c9dd38ff9fc6e1b9
3
  size 4027
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:840a4f8531ac04e05197743d10bdcafb29a5988b65b7d8acdadb673e998891a0
3
  size 4027