kiranshivaraju committed on
Commit
3d97af6
·
verified ·
1 Parent(s): 84cb16e

End of training

Browse files
README.md CHANGED
@@ -18,7 +18,7 @@ should probably proofread and complete it, then remove this comment. -->
18
 
19
  This model is a fine-tuned version of [facebook/convnext-xlarge-224-22k-1k](https://huggingface.co/facebook/convnext-xlarge-224-22k-1k) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
- - Loss: 0.0001
22
  - Recall: 1.0
23
 
24
  ## Model description
 
18
 
19
  This model is a fine-tuned version of [facebook/convnext-xlarge-224-22k-1k](https://huggingface.co/facebook/convnext-xlarge-224-22k-1k) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
+ - Loss: 0.0104
22
  - Recall: 1.0
23
 
24
  ## Model description
all_results.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 5.0,
3
+ "eval_loss": 0.010405209846794605,
4
+ "eval_recall": 1.0,
5
+ "eval_runtime": 1.6733,
6
+ "eval_samples_per_second": 75.897,
7
+ "eval_steps_per_second": 2.39,
8
+ "total_flos": 1.7954512873784525e+18,
9
+ "train_loss": 0.025862085550195642,
10
+ "train_runtime": 258.3025,
11
+ "train_samples_per_second": 22.106,
12
+ "train_steps_per_second": 0.174
13
+ }
eval_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 5.0,
3
+ "eval_loss": 0.010405209846794605,
4
+ "eval_recall": 1.0,
5
+ "eval_runtime": 1.6733,
6
+ "eval_samples_per_second": 75.897,
7
+ "eval_steps_per_second": 2.39
8
+ }
runs/Nov23_02-36-39_9254754ac219/events.out.tfevents.1732329738.9254754ac219.483.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:844c01e56407f425f39b4422ff69e724adea3801c9c3f0e7d5e817805206c4a7
3
+ size 403
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 5.0,
3
+ "total_flos": 1.7954512873784525e+18,
4
+ "train_loss": 0.025862085550195642,
5
+ "train_runtime": 258.3025,
6
+ "train_samples_per_second": 22.106,
7
+ "train_steps_per_second": 0.174
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,115 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 1.0,
3
+ "best_model_checkpoint": "convnext-xlarge-224-22k-1k-v13/checkpoint-9",
4
+ "epoch": 5.0,
5
+ "eval_steps": 500,
6
+ "global_step": 45,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 1.0,
13
+ "eval_loss": 0.010405209846794605,
14
+ "eval_recall": 1.0,
15
+ "eval_runtime": 1.6504,
16
+ "eval_samples_per_second": 76.95,
17
+ "eval_steps_per_second": 2.424,
18
+ "step": 9
19
+ },
20
+ {
21
+ "epoch": 1.1111111111111112,
22
+ "grad_norm": 12.378776550292969,
23
+ "learning_rate": 4.375e-05,
24
+ "loss": 0.0652,
25
+ "step": 10
26
+ },
27
+ {
28
+ "epoch": 2.0,
29
+ "eval_loss": 0.027809349820017815,
30
+ "eval_recall": 0.9857142857142858,
31
+ "eval_runtime": 1.6348,
32
+ "eval_samples_per_second": 77.684,
33
+ "eval_steps_per_second": 2.447,
34
+ "step": 18
35
+ },
36
+ {
37
+ "epoch": 2.2222222222222223,
38
+ "grad_norm": 232.1143035888672,
39
+ "learning_rate": 3.125e-05,
40
+ "loss": 0.03,
41
+ "step": 20
42
+ },
43
+ {
44
+ "epoch": 3.0,
45
+ "eval_loss": 0.0006994050927460194,
46
+ "eval_recall": 1.0,
47
+ "eval_runtime": 1.6323,
48
+ "eval_samples_per_second": 77.806,
49
+ "eval_steps_per_second": 2.451,
50
+ "step": 27
51
+ },
52
+ {
53
+ "epoch": 3.3333333333333335,
54
+ "grad_norm": 61.44147872924805,
55
+ "learning_rate": 1.8750000000000002e-05,
56
+ "loss": 0.0156,
57
+ "step": 30
58
+ },
59
+ {
60
+ "epoch": 4.0,
61
+ "eval_loss": 0.00015087063366081566,
62
+ "eval_recall": 1.0,
63
+ "eval_runtime": 1.6426,
64
+ "eval_samples_per_second": 77.318,
65
+ "eval_steps_per_second": 2.435,
66
+ "step": 36
67
+ },
68
+ {
69
+ "epoch": 4.444444444444445,
70
+ "grad_norm": 0.5121456384658813,
71
+ "learning_rate": 6.25e-06,
72
+ "loss": 0.0042,
73
+ "step": 40
74
+ },
75
+ {
76
+ "epoch": 5.0,
77
+ "eval_loss": 0.00012451241491362453,
78
+ "eval_recall": 1.0,
79
+ "eval_runtime": 1.7523,
80
+ "eval_samples_per_second": 72.476,
81
+ "eval_steps_per_second": 2.283,
82
+ "step": 45
83
+ },
84
+ {
85
+ "epoch": 5.0,
86
+ "step": 45,
87
+ "total_flos": 1.7954512873784525e+18,
88
+ "train_loss": 0.025862085550195642,
89
+ "train_runtime": 258.3025,
90
+ "train_samples_per_second": 22.106,
91
+ "train_steps_per_second": 0.174
92
+ }
93
+ ],
94
+ "logging_steps": 10,
95
+ "max_steps": 45,
96
+ "num_input_tokens_seen": 0,
97
+ "num_train_epochs": 5,
98
+ "save_steps": 500,
99
+ "stateful_callbacks": {
100
+ "TrainerControl": {
101
+ "args": {
102
+ "should_epoch_stop": false,
103
+ "should_evaluate": false,
104
+ "should_log": false,
105
+ "should_save": true,
106
+ "should_training_stop": true
107
+ },
108
+ "attributes": {}
109
+ }
110
+ },
111
+ "total_flos": 1.7954512873784525e+18,
112
+ "train_batch_size": 32,
113
+ "trial_name": null,
114
+ "trial_params": null
115
+ }