jvadlamudi2 committed on
Commit
619c48e
1 Parent(s): df3bc58

Training in progress, epoch 1

Browse files
all_results.json CHANGED
@@ -6,8 +6,8 @@
6
  "eval_samples_per_second": 65.767,
7
  "eval_steps_per_second": 2.349,
8
  "total_flos": 2.071360882398044e+17,
9
- "train_loss": 0.5642238571530297,
10
- "train_runtime": 242.7921,
11
- "train_samples_per_second": 11.009,
12
- "train_steps_per_second": 0.086
13
  }
 
6
  "eval_samples_per_second": 65.767,
7
  "eval_steps_per_second": 2.349,
8
  "total_flos": 2.071360882398044e+17,
9
+ "train_loss": 0.5111370115053087,
10
+ "train_runtime": 228.9442,
11
+ "train_samples_per_second": 11.675,
12
+ "train_steps_per_second": 0.092
13
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c26a23d997b8165baea51a13246c69af462e27a0c5ff581cebee6f018c21b3c1
3
  size 343268717
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03553b005cca996a8f3f9348ec2d19b5814dc0106f855e29bfd7f06c01a530f3
3
  size 343268717
runs/Jul20_22-51-27_fcbe542fc008/events.out.tfevents.1689894625.fcbe542fc008.53766.16 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9d2bdaab907dff1ddc317331f386036bf16f8c6f1854e562108f04a733bd078
3
+ size 4472
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 3.0,
3
  "total_flos": 2.071360882398044e+17,
4
- "train_loss": 0.5642238571530297,
5
- "train_runtime": 242.7921,
6
- "train_samples_per_second": 11.009,
7
- "train_steps_per_second": 0.086
8
  }
 
1
  {
2
  "epoch": 3.0,
3
  "total_flos": 2.071360882398044e+17,
4
+ "train_loss": 0.5111370115053087,
5
+ "train_runtime": 228.9442,
6
+ "train_samples_per_second": 11.675,
7
+ "train_steps_per_second": 0.092
8
  }
trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 0.6995515695067265,
3
- "best_model_checkpoint": "vit-base-patch16-224-jvadlamudi2/checkpoint-14",
4
  "epoch": 3.0,
5
  "global_step": 21,
6
  "is_hyper_param_search": false,
@@ -9,51 +9,51 @@
9
  "log_history": [
10
  {
11
  "epoch": 1.0,
12
- "eval_accuracy": 0.695067264573991,
13
- "eval_loss": 0.5611284971237183,
14
- "eval_runtime": 3.5824,
15
- "eval_samples_per_second": 62.248,
16
- "eval_steps_per_second": 1.954,
17
  "step": 7
18
  },
19
  {
20
  "epoch": 1.43,
21
  "learning_rate": 3.055555555555556e-05,
22
- "loss": 0.5947,
23
  "step": 10
24
  },
25
  {
26
  "epoch": 2.0,
27
- "eval_accuracy": 0.6995515695067265,
28
- "eval_loss": 0.5539332032203674,
29
- "eval_runtime": 3.3759,
30
- "eval_samples_per_second": 66.056,
31
- "eval_steps_per_second": 2.073,
32
  "step": 14
33
  },
34
  {
35
  "epoch": 2.86,
36
  "learning_rate": 2.777777777777778e-06,
37
- "loss": 0.5369,
38
  "step": 20
39
  },
40
  {
41
  "epoch": 3.0,
42
- "eval_accuracy": 0.672645739910314,
43
- "eval_loss": 0.5587254762649536,
44
- "eval_runtime": 3.5944,
45
- "eval_samples_per_second": 62.041,
46
- "eval_steps_per_second": 1.947,
47
  "step": 21
48
  },
49
  {
50
  "epoch": 3.0,
51
  "step": 21,
52
  "total_flos": 2.071360882398044e+17,
53
- "train_loss": 0.5642238571530297,
54
- "train_runtime": 242.7921,
55
- "train_samples_per_second": 11.009,
56
- "train_steps_per_second": 0.086
57
  }
58
  ],
59
  "max_steps": 21,
 
1
  {
2
+ "best_metric": 0.8295964125560538,
3
+ "best_model_checkpoint": "vit-base-patch16-224-jvadlamudi2/checkpoint-7",
4
  "epoch": 3.0,
5
  "global_step": 21,
6
  "is_hyper_param_search": false,
 
9
  "log_history": [
10
  {
11
  "epoch": 1.0,
12
+ "eval_accuracy": 0.8295964125560538,
13
+ "eval_loss": 0.49411410093307495,
14
+ "eval_runtime": 3.3119,
15
+ "eval_samples_per_second": 67.333,
16
+ "eval_steps_per_second": 2.114,
17
  "step": 7
18
  },
19
  {
20
  "epoch": 1.43,
21
  "learning_rate": 3.055555555555556e-05,
22
+ "loss": 0.5365,
23
  "step": 10
24
  },
25
  {
26
  "epoch": 2.0,
27
+ "eval_accuracy": 0.8071748878923767,
28
+ "eval_loss": 0.5048662424087524,
29
+ "eval_runtime": 3.5367,
30
+ "eval_samples_per_second": 63.054,
31
+ "eval_steps_per_second": 1.979,
32
  "step": 14
33
  },
34
  {
35
  "epoch": 2.86,
36
  "learning_rate": 2.777777777777778e-06,
37
+ "loss": 0.4893,
38
  "step": 20
39
  },
40
  {
41
  "epoch": 3.0,
42
+ "eval_accuracy": 0.7982062780269058,
43
+ "eval_loss": 0.5039920806884766,
44
+ "eval_runtime": 3.3683,
45
+ "eval_samples_per_second": 66.205,
46
+ "eval_steps_per_second": 2.078,
47
  "step": 21
48
  },
49
  {
50
  "epoch": 3.0,
51
  "step": 21,
52
  "total_flos": 2.071360882398044e+17,
53
+ "train_loss": 0.5111370115053087,
54
+ "train_runtime": 228.9442,
55
+ "train_samples_per_second": 11.675,
56
+ "train_steps_per_second": 0.092
57
  }
58
  ],
59
  "max_steps": 21,