fayetitchenal committed on
Commit
9ec95fd
1 Parent(s): 36a2996

Training in progress, step 2250, checkpoint

Browse files
checkpoint-2250/config.json ADDED
@@ -0,0 +1,92 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "nvidia/mit-b5",
3
+ "architectures": [
4
+ "SegformerForSemanticSegmentation"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.0,
7
+ "classifier_dropout_prob": 0.1,
8
+ "decoder_hidden_size": 768,
9
+ "depths": [
10
+ 3,
11
+ 6,
12
+ 40,
13
+ 3
14
+ ],
15
+ "downsampling_rates": [
16
+ 1,
17
+ 4,
18
+ 8,
19
+ 16
20
+ ],
21
+ "drop_path_rate": 0.1,
22
+ "hidden_act": "gelu",
23
+ "hidden_dropout_prob": 0.0,
24
+ "hidden_sizes": [
25
+ 64,
26
+ 128,
27
+ 320,
28
+ 512
29
+ ],
30
+ "id2label": {
31
+ "0": "background",
32
+ "1": "double_plant",
33
+ "2": "drydown",
34
+ "3": "endrow",
35
+ "4": "nutrient_deficiency",
36
+ "5": "planter_skip",
37
+ "6": "water",
38
+ "7": "waterway",
39
+ "8": "weed_cluster"
40
+ },
41
+ "image_size": 224,
42
+ "initializer_range": 0.02,
43
+ "label2id": {
44
+ "background": 0,
45
+ "double_plant": 1,
46
+ "drydown": 2,
47
+ "endrow": 3,
48
+ "nutrient_deficiency": 4,
49
+ "planter_skip": 5,
50
+ "water": 6,
51
+ "waterway": 7,
52
+ "weed_cluster": 8
53
+ },
54
+ "layer_norm_eps": 1e-06,
55
+ "mlp_ratios": [
56
+ 4,
57
+ 4,
58
+ 4,
59
+ 4
60
+ ],
61
+ "model_type": "segformer",
62
+ "num_attention_heads": [
63
+ 1,
64
+ 2,
65
+ 5,
66
+ 8
67
+ ],
68
+ "num_channels": 4,
69
+ "num_encoder_blocks": 4,
70
+ "patch_sizes": [
71
+ 7,
72
+ 3,
73
+ 3,
74
+ 3
75
+ ],
76
+ "reshape_last_stage": true,
77
+ "semantic_loss_ignore_index": 255,
78
+ "sr_ratios": [
79
+ 8,
80
+ 4,
81
+ 2,
82
+ 1
83
+ ],
84
+ "strides": [
85
+ 4,
86
+ 2,
87
+ 2,
88
+ 2
89
+ ],
90
+ "torch_dtype": "float32",
91
+ "transformers_version": "4.40.2"
92
+ }
checkpoint-2250/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5a7c9e0b23f21da5d0c0df2d9fe01b7b36387ced02aed77cb295ebaffdb3a05
3
+ size 338562516
checkpoint-2250/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99e4c20582f5d1ba20d6e101473033a5735f5b740d6979fae2b3e8fbce3aa0c7
3
+ size 677518143
checkpoint-2250/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02e2f68ae443f87cd8b308d1de9bf381a9c5361dae9e57aad905042d7e0b6f2d
3
+ size 14575
checkpoint-2250/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f9f829a642e00fe87154fe7e5b3f0f2bf2dc021a22e30606de0337e8dd4418c
3
+ size 563
checkpoint-2250/trainer_state.json ADDED
@@ -0,0 +1,165 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 1.0,
5
+ "eval_steps": 500,
6
+ "global_step": 2250,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.2222222222222222,
13
+ "grad_norm": 11.793246269226074,
14
+ "learning_rate": 2.2222222222222223e-05,
15
+ "loss": 3.818,
16
+ "step": 500
17
+ },
18
+ {
19
+ "epoch": 0.2222222222222222,
20
+ "eval_accuracy_background": 0.19581472704788175,
21
+ "eval_accuracy_double_plant": 0.09380215019766877,
22
+ "eval_accuracy_drydown": 0.7107036127331178,
23
+ "eval_accuracy_endrow": 0.02059395079032939,
24
+ "eval_accuracy_nutrient_deficiency": 0.8348166019686053,
25
+ "eval_accuracy_planter_skip": 0.09523015915808461,
26
+ "eval_accuracy_water": 0.9933604093368263,
27
+ "eval_accuracy_waterway": 0.5081417568068439,
28
+ "eval_accuracy_weed_cluster": 0.8598379016004754,
29
+ "eval_iou_background": 0.18808867925529232,
30
+ "eval_iou_double_plant": 0.06203210246822897,
31
+ "eval_iou_drydown": 0.40717237628074626,
32
+ "eval_iou_endrow": 0.0177635377630849,
33
+ "eval_iou_nutrient_deficiency": 0.24616684931318317,
34
+ "eval_iou_planter_skip": 0.08719568132734196,
35
+ "eval_iou_water": 0.2711830537857341,
36
+ "eval_iou_waterway": 0.11493665271237699,
37
+ "eval_iou_weed_cluster": 0.15174042308492286,
38
+ "eval_loss": 3.0543487071990967,
39
+ "eval_mean_accuracy": 0.47914458551553707,
40
+ "eval_mean_iou": 0.1718088173323235,
41
+ "eval_overall_accuracy": 0.3698257009825982,
42
+ "eval_runtime": 233.3045,
43
+ "eval_samples_per_second": 12.182,
44
+ "eval_steps_per_second": 1.526,
45
+ "step": 500
46
+ },
47
+ {
48
+ "epoch": 0.4444444444444444,
49
+ "grad_norm": 18.055360794067383,
50
+ "learning_rate": 4.4444444444444447e-05,
51
+ "loss": 3.0561,
52
+ "step": 1000
53
+ },
54
+ {
55
+ "epoch": 0.4444444444444444,
56
+ "eval_accuracy_background": 0.33281217700519594,
57
+ "eval_accuracy_double_plant": 0.6079763269177568,
58
+ "eval_accuracy_drydown": 0.7946684041913001,
59
+ "eval_accuracy_endrow": 0.349301342050525,
60
+ "eval_accuracy_nutrient_deficiency": 0.7314999843672831,
61
+ "eval_accuracy_planter_skip": 0.6712138070986369,
62
+ "eval_accuracy_water": 0.995121665952459,
63
+ "eval_accuracy_waterway": 0.5701844801294333,
64
+ "eval_accuracy_weed_cluster": 0.5467936481137453,
65
+ "eval_iou_background": 0.3071003729227365,
66
+ "eval_iou_double_plant": 0.05692166554215038,
67
+ "eval_iou_drydown": 0.45070670178291583,
68
+ "eval_iou_endrow": 0.12562451540796912,
69
+ "eval_iou_nutrient_deficiency": 0.2946294028718886,
70
+ "eval_iou_planter_skip": 0.13924388642718094,
71
+ "eval_iou_water": 0.2832997795518204,
72
+ "eval_iou_waterway": 0.10604657522478783,
73
+ "eval_iou_weed_cluster": 0.21995946645651349,
74
+ "eval_loss": 2.7527103424072266,
75
+ "eval_mean_accuracy": 0.6221746484251484,
76
+ "eval_mean_iou": 0.2203924851319959,
77
+ "eval_overall_accuracy": 0.4604543823237725,
78
+ "eval_runtime": 234.4163,
79
+ "eval_samples_per_second": 12.124,
80
+ "eval_steps_per_second": 1.519,
81
+ "step": 1000
82
+ },
83
+ {
84
+ "epoch": 0.6666666666666666,
85
+ "grad_norm": 17.42981719970703,
86
+ "learning_rate": 6.666666666666667e-05,
87
+ "loss": 2.8425,
88
+ "step": 1500
89
+ },
90
+ {
91
+ "epoch": 0.6666666666666666,
92
+ "eval_accuracy_background": 0.3979410567243586,
93
+ "eval_accuracy_double_plant": 0.35090828194540236,
94
+ "eval_accuracy_drydown": 0.990671482434014,
95
+ "eval_accuracy_endrow": 0.2249281722842768,
96
+ "eval_accuracy_nutrient_deficiency": 0.64935174422475,
97
+ "eval_accuracy_planter_skip": 0.5494840964457799,
98
+ "eval_accuracy_water": 0.9732364233609112,
99
+ "eval_accuracy_waterway": 0.32217860917602775,
100
+ "eval_accuracy_weed_cluster": 0.4993965740432129,
101
+ "eval_iou_background": 0.3749426436452205,
102
+ "eval_iou_double_plant": 0.1311586100117858,
103
+ "eval_iou_drydown": 0.377378210407481,
104
+ "eval_iou_endrow": 0.10949437953809864,
105
+ "eval_iou_nutrient_deficiency": 0.3194503546667628,
106
+ "eval_iou_planter_skip": 0.2767050562366308,
107
+ "eval_iou_water": 0.33601793640817545,
108
+ "eval_iou_waterway": 0.17211292189101207,
109
+ "eval_iou_weed_cluster": 0.23999589853669023,
110
+ "eval_loss": 2.7259955406188965,
111
+ "eval_mean_accuracy": 0.5508996045154149,
112
+ "eval_mean_iou": 0.2596951123713175,
113
+ "eval_overall_accuracy": 0.5187459341357686,
114
+ "eval_runtime": 234.4997,
115
+ "eval_samples_per_second": 12.119,
116
+ "eval_steps_per_second": 1.518,
117
+ "step": 1500
118
+ },
119
+ {
120
+ "epoch": 0.8888888888888888,
121
+ "grad_norm": 18.323888778686523,
122
+ "learning_rate": 8.888888888888889e-05,
123
+ "loss": 2.812,
124
+ "step": 2000
125
+ },
126
+ {
127
+ "epoch": 0.8888888888888888,
128
+ "eval_accuracy_background": 0.3444616006736896,
129
+ "eval_accuracy_double_plant": 0.2994677094262697,
130
+ "eval_accuracy_drydown": 0.9219474623777996,
131
+ "eval_accuracy_endrow": 0.08748836836582362,
132
+ "eval_accuracy_nutrient_deficiency": 0.8971747201033099,
133
+ "eval_accuracy_planter_skip": 0.4553112332178167,
134
+ "eval_accuracy_water": 0.9835769083095529,
135
+ "eval_accuracy_waterway": 0.3921009308045625,
136
+ "eval_accuracy_weed_cluster": 0.7258725441601974,
137
+ "eval_iou_background": 0.32680002116655066,
138
+ "eval_iou_double_plant": 0.1689556986493995,
139
+ "eval_iou_drydown": 0.4498001115160996,
140
+ "eval_iou_endrow": 0.07367449850616072,
141
+ "eval_iou_nutrient_deficiency": 0.3152010347192682,
142
+ "eval_iou_planter_skip": 0.28500014113702443,
143
+ "eval_iou_water": 0.3018250386605094,
144
+ "eval_iou_waterway": 0.11357719882212529,
145
+ "eval_iou_weed_cluster": 0.2522793183619568,
146
+ "eval_loss": 2.639113187789917,
147
+ "eval_mean_accuracy": 0.5674890530487802,
148
+ "eval_mean_iou": 0.25412367350434384,
149
+ "eval_overall_accuracy": 0.5034953329987246,
150
+ "eval_runtime": 234.7079,
151
+ "eval_samples_per_second": 12.109,
152
+ "eval_steps_per_second": 1.517,
153
+ "step": 2000
154
+ }
155
+ ],
156
+ "logging_steps": 500,
157
+ "max_steps": 22500,
158
+ "num_input_tokens_seen": 0,
159
+ "num_train_epochs": 10,
160
+ "save_steps": 2250,
161
+ "total_flos": 9.581014347153408e+18,
162
+ "train_batch_size": 8,
163
+ "trial_name": null,
164
+ "trial_params": null
165
+ }
checkpoint-2250/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3c8f0a5eca1cc612f308bd7fd6b8ac1dd6fdf10189506591d24427a556fb2bd
3
+ size 4539