diogopaes10 committed on
Commit
bc23f2e
1 Parent(s): b94cb66

End of training

Browse files
checkpoint-2000/config.json DELETED
@@ -1,50 +0,0 @@
1
- {
2
- "_name_or_path": "microsoft/MiniLM-L12-H384-uncased",
3
- "architectures": [
4
- "BertForSequenceClassification"
5
- ],
6
- "attention_probs_dropout_prob": 0.1,
7
- "classifier_dropout": null,
8
- "hidden_act": "gelu",
9
- "hidden_dropout_prob": 0.1,
10
- "hidden_size": 384,
11
- "id2label": {
12
- "0": "Society & Culture",
13
- "1": "Science & Mathematics",
14
- "2": "Health",
15
- "3": "Education & Reference",
16
- "4": "Computers & Internet",
17
- "5": "Sports",
18
- "6": "Business & Finance",
19
- "7": "Entertainment & Music",
20
- "8": "Family & Relationships",
21
- "9": "Politics & Government"
22
- },
23
- "initializer_range": 0.02,
24
- "intermediate_size": 1536,
25
- "label2id": {
26
- "Business & Finance": 6,
27
- "Computers & Internet": 4,
28
- "Education & Reference": 3,
29
- "Entertainment & Music": 7,
30
- "Family & Relationships": 8,
31
- "Health": 2,
32
- "Politics & Government": 9,
33
- "Science & Mathematics": 1,
34
- "Society & Culture": 0,
35
- "Sports": 5
36
- },
37
- "layer_norm_eps": 1e-12,
38
- "max_position_embeddings": 512,
39
- "model_type": "bert",
40
- "num_attention_heads": 12,
41
- "num_hidden_layers": 12,
42
- "pad_token_id": 0,
43
- "position_embedding_type": "absolute",
44
- "problem_type": "single_label_classification",
45
- "torch_dtype": "float32",
46
- "transformers_version": "4.31.0",
47
- "type_vocab_size": 2,
48
- "use_cache": true,
49
- "vocab_size": 30522
50
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoint-2000/optimizer.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:09552910dd7d5ed2eb865c6b30253726e3dcd7aed3588cc97c4702b013630f01
3
- size 267028677
 
 
 
 
checkpoint-2000/pytorch_model.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:294d34cfcdd9a17427a0a09cdf19e071c82e8ce59c34f4fe159d3c5118d1082d
3
- size 133523761
 
 
 
 
checkpoint-2000/rng_state.pth DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:4f48f6150f5133b116ca71b75680965f3b45ab43582cfcc6566086e18896784f
3
- size 14575
 
 
 
 
checkpoint-2000/special_tokens_map.json DELETED
@@ -1,7 +0,0 @@
1
- {
2
- "cls_token": "[CLS]",
3
- "mask_token": "[MASK]",
4
- "pad_token": "[PAD]",
5
- "sep_token": "[SEP]",
6
- "unk_token": "[UNK]"
7
- }
 
 
 
 
 
 
 
 
checkpoint-2000/tokenizer.json DELETED
The diff for this file is too large to render. See raw diff
 
checkpoint-2000/tokenizer_config.json DELETED
@@ -1,15 +0,0 @@
1
- {
2
- "clean_up_tokenization_spaces": true,
3
- "cls_token": "[CLS]",
4
- "do_basic_tokenize": true,
5
- "do_lower_case": true,
6
- "mask_token": "[MASK]",
7
- "model_max_length": 1000000000000000019884624838656,
8
- "never_split": null,
9
- "pad_token": "[PAD]",
10
- "sep_token": "[SEP]",
11
- "strip_accents": null,
12
- "tokenize_chinese_chars": true,
13
- "tokenizer_class": "BertTokenizer",
14
- "unk_token": "[UNK]"
15
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoint-2000/trainer_state.json DELETED
@@ -1,438 +0,0 @@
1
- {
2
- "best_metric": null,
3
- "best_model_checkpoint": null,
4
- "epoch": 8.0,
5
- "global_step": 2000,
6
- "is_hyper_param_search": false,
7
- "is_local_process_zero": true,
8
- "is_world_process_zero": true,
9
- "log_history": [
10
- {
11
- "epoch": 0.0,
12
- "learning_rate": 1.9992e-05,
13
- "loss": 2.3035,
14
- "step": 1
15
- },
16
- {
17
- "epoch": 0.5,
18
- "learning_rate": 1.9e-05,
19
- "loss": 2.1461,
20
- "step": 125
21
- },
22
- {
23
- "epoch": 0.5,
24
- "eval_accuracy": 0.5465,
25
- "eval_disk_space_total": 78.1898422241211,
26
- "eval_disk_space_used": 24.584102630615234,
27
- "eval_f1": 0.4711252488920671,
28
- "eval_gpu_ram_allocated": 0.3996291160583496,
29
- "eval_gpu_ram_cached": 12.9296875,
30
- "eval_gpu_ram_total": 39.56402587890625,
31
- "eval_gpu_utilization": 28,
32
- "eval_loss": 1.8486889600753784,
33
- "eval_precision": 0.5180898369172832,
34
- "eval_recall": 0.5465,
35
- "eval_runtime": 1.5234,
36
- "eval_samples_per_second": 1312.845,
37
- "eval_steps_per_second": 41.355,
38
- "eval_system_ram_total": 83.48074722290039,
39
- "eval_system_ram_used": 3.8797760009765625,
40
- "step": 125
41
- },
42
- {
43
- "epoch": 1.0,
44
- "learning_rate": 1.8e-05,
45
- "loss": 1.6793,
46
- "step": 250
47
- },
48
- {
49
- "epoch": 1.0,
50
- "eval_accuracy": 0.615,
51
- "eval_disk_space_total": 78.1898422241211,
52
- "eval_disk_space_used": 24.584190368652344,
53
- "eval_f1": 0.5799151958404197,
54
- "eval_gpu_ram_allocated": 0.3996119499206543,
55
- "eval_gpu_ram_cached": 12.9296875,
56
- "eval_gpu_ram_total": 39.56402587890625,
57
- "eval_gpu_utilization": 28,
58
- "eval_loss": 1.5279773473739624,
59
- "eval_precision": 0.6206909881233017,
60
- "eval_recall": 0.615,
61
- "eval_runtime": 1.5357,
62
- "eval_samples_per_second": 1302.337,
63
- "eval_steps_per_second": 41.024,
64
- "eval_system_ram_total": 83.48074722290039,
65
- "eval_system_ram_used": 3.8827476501464844,
66
- "step": 250
67
- },
68
- {
69
- "epoch": 1.5,
70
- "learning_rate": 1.7e-05,
71
- "loss": 1.4163,
72
- "step": 375
73
- },
74
- {
75
- "epoch": 1.5,
76
- "eval_accuracy": 0.6675,
77
- "eval_disk_space_total": 78.1898422241211,
78
- "eval_disk_space_used": 24.584190368652344,
79
- "eval_f1": 0.6507803054121275,
80
- "eval_gpu_ram_allocated": 0.3996291160583496,
81
- "eval_gpu_ram_cached": 12.9296875,
82
- "eval_gpu_ram_total": 39.56402587890625,
83
- "eval_gpu_utilization": 28,
84
- "eval_loss": 1.3395830392837524,
85
- "eval_precision": 0.6690538200035159,
86
- "eval_recall": 0.6675,
87
- "eval_runtime": 1.5175,
88
- "eval_samples_per_second": 1317.927,
89
- "eval_steps_per_second": 41.515,
90
- "eval_system_ram_total": 83.48074722290039,
91
- "eval_system_ram_used": 3.883075714111328,
92
- "step": 375
93
- },
94
- {
95
- "epoch": 2.0,
96
- "learning_rate": 1.6000000000000003e-05,
97
- "loss": 1.2855,
98
- "step": 500
99
- },
100
- {
101
- "epoch": 2.0,
102
- "eval_accuracy": 0.6745,
103
- "eval_disk_space_total": 78.1898422241211,
104
- "eval_disk_space_used": 24.584270477294922,
105
- "eval_f1": 0.6633189544214071,
106
- "eval_gpu_ram_allocated": 0.3995933532714844,
107
- "eval_gpu_ram_cached": 12.9296875,
108
- "eval_gpu_ram_total": 39.56402587890625,
109
- "eval_gpu_utilization": 30,
110
- "eval_loss": 1.2413243055343628,
111
- "eval_precision": 0.6741774761001332,
112
- "eval_recall": 0.6745,
113
- "eval_runtime": 1.5166,
114
- "eval_samples_per_second": 1318.761,
115
- "eval_steps_per_second": 41.541,
116
- "eval_system_ram_total": 83.48074722290039,
117
- "eval_system_ram_used": 3.897541046142578,
118
- "step": 500
119
- },
120
- {
121
- "epoch": 2.5,
122
- "learning_rate": 1.5000000000000002e-05,
123
- "loss": 1.1364,
124
- "step": 625
125
- },
126
- {
127
- "epoch": 2.5,
128
- "eval_accuracy": 0.6725,
129
- "eval_disk_space_total": 78.1898422241211,
130
- "eval_disk_space_used": 25.457107543945312,
131
- "eval_f1": 0.665830199533775,
132
- "eval_gpu_ram_allocated": 0.3995990753173828,
133
- "eval_gpu_ram_cached": 12.9296875,
134
- "eval_gpu_ram_total": 39.56402587890625,
135
- "eval_gpu_utilization": 31,
136
- "eval_loss": 1.1794828176498413,
137
- "eval_precision": 0.6758089281502129,
138
- "eval_recall": 0.6725,
139
- "eval_runtime": 1.5306,
140
- "eval_samples_per_second": 1306.704,
141
- "eval_steps_per_second": 41.161,
142
- "eval_system_ram_total": 83.48074722290039,
143
- "eval_system_ram_used": 4.096714019775391,
144
- "step": 625
145
- },
146
- {
147
- "epoch": 3.0,
148
- "learning_rate": 1.4e-05,
149
- "loss": 1.0569,
150
- "step": 750
151
- },
152
- {
153
- "epoch": 3.0,
154
- "eval_accuracy": 0.6845,
155
- "eval_disk_space_total": 78.1898422241211,
156
- "eval_disk_space_used": 25.457260131835938,
157
- "eval_f1": 0.6785417667541389,
158
- "eval_gpu_ram_allocated": 0.3996105194091797,
159
- "eval_gpu_ram_cached": 12.9296875,
160
- "eval_gpu_ram_total": 39.56402587890625,
161
- "eval_gpu_utilization": 29,
162
- "eval_loss": 1.1167317628860474,
163
- "eval_precision": 0.6841220967269329,
164
- "eval_recall": 0.6845,
165
- "eval_runtime": 1.5379,
166
- "eval_samples_per_second": 1300.49,
167
- "eval_steps_per_second": 40.965,
168
- "eval_system_ram_total": 83.48074722290039,
169
- "eval_system_ram_used": 4.092338562011719,
170
- "step": 750
171
- },
172
- {
173
- "epoch": 3.5,
174
- "learning_rate": 1.3000000000000001e-05,
175
- "loss": 0.9596,
176
- "step": 875
177
- },
178
- {
179
- "epoch": 3.5,
180
- "eval_accuracy": 0.698,
181
- "eval_disk_space_total": 78.1898422241211,
182
- "eval_disk_space_used": 25.457298278808594,
183
- "eval_f1": 0.6882774085430846,
184
- "eval_gpu_ram_allocated": 0.3996591567993164,
185
- "eval_gpu_ram_cached": 12.9296875,
186
- "eval_gpu_ram_total": 39.56402587890625,
187
- "eval_gpu_utilization": 29,
188
- "eval_loss": 1.0866354703903198,
189
- "eval_precision": 0.692037318372609,
190
- "eval_recall": 0.698,
191
- "eval_runtime": 1.5638,
192
- "eval_samples_per_second": 1278.976,
193
- "eval_steps_per_second": 40.288,
194
- "eval_system_ram_total": 83.48074722290039,
195
- "eval_system_ram_used": 3.876514434814453,
196
- "step": 875
197
- },
198
- {
199
- "epoch": 4.0,
200
- "learning_rate": 1.2e-05,
201
- "loss": 0.917,
202
- "step": 1000
203
- },
204
- {
205
- "epoch": 4.0,
206
- "eval_accuracy": 0.6875,
207
- "eval_disk_space_total": 78.1898422241211,
208
- "eval_disk_space_used": 25.45730209350586,
209
- "eval_f1": 0.6796355379748251,
210
- "eval_gpu_ram_allocated": 0.3995933532714844,
211
- "eval_gpu_ram_cached": 12.9296875,
212
- "eval_gpu_ram_total": 39.56402587890625,
213
- "eval_gpu_utilization": 29,
214
- "eval_loss": 1.0703401565551758,
215
- "eval_precision": 0.6840559389245768,
216
- "eval_recall": 0.6875,
217
- "eval_runtime": 1.5204,
218
- "eval_samples_per_second": 1315.473,
219
- "eval_steps_per_second": 41.437,
220
- "eval_system_ram_total": 83.48074722290039,
221
- "eval_system_ram_used": 3.8976211547851562,
222
- "step": 1000
223
- },
224
- {
225
- "epoch": 4.5,
226
- "learning_rate": 1.1008e-05,
227
- "loss": 0.8512,
228
- "step": 1125
229
- },
230
- {
231
- "epoch": 4.5,
232
- "eval_accuracy": 0.6915,
233
- "eval_disk_space_total": 78.1898422241211,
234
- "eval_disk_space_used": 25.830577850341797,
235
- "eval_f1": 0.6913447845710189,
236
- "eval_gpu_ram_allocated": 0.3996849060058594,
237
- "eval_gpu_ram_cached": 12.9296875,
238
- "eval_gpu_ram_total": 39.56402587890625,
239
- "eval_gpu_utilization": 28,
240
- "eval_loss": 1.0628596544265747,
241
- "eval_precision": 0.6944500140220231,
242
- "eval_recall": 0.6915,
243
- "eval_runtime": 1.5986,
244
- "eval_samples_per_second": 1251.121,
245
- "eval_steps_per_second": 39.41,
246
- "eval_system_ram_total": 83.48074722290039,
247
- "eval_system_ram_used": 4.0599517822265625,
248
- "step": 1125
249
- },
250
- {
251
- "epoch": 5.0,
252
- "learning_rate": 1.0008e-05,
253
- "loss": 0.8121,
254
- "step": 1250
255
- },
256
- {
257
- "epoch": 5.0,
258
- "eval_accuracy": 0.691,
259
- "eval_disk_space_total": 78.1898422241211,
260
- "eval_disk_space_used": 25.830596923828125,
261
- "eval_f1": 0.6838005278906992,
262
- "eval_gpu_ram_allocated": 0.39963626861572266,
263
- "eval_gpu_ram_cached": 12.9296875,
264
- "eval_gpu_ram_total": 39.56402587890625,
265
- "eval_gpu_utilization": 31,
266
- "eval_loss": 1.0575964450836182,
267
- "eval_precision": 0.6905089592227732,
268
- "eval_recall": 0.691,
269
- "eval_runtime": 1.5391,
270
- "eval_samples_per_second": 1299.447,
271
- "eval_steps_per_second": 40.933,
272
- "eval_system_ram_total": 83.48074722290039,
273
- "eval_system_ram_used": 4.043186187744141,
274
- "step": 1250
275
- },
276
- {
277
- "epoch": 5.5,
278
- "learning_rate": 9.008e-06,
279
- "loss": 0.7733,
280
- "step": 1375
281
- },
282
- {
283
- "epoch": 5.5,
284
- "eval_accuracy": 0.6805,
285
- "eval_disk_space_total": 78.1898422241211,
286
- "eval_disk_space_used": 25.83068084716797,
287
- "eval_f1": 0.6773653982197514,
288
- "eval_gpu_ram_allocated": 0.3996090888977051,
289
- "eval_gpu_ram_cached": 12.9296875,
290
- "eval_gpu_ram_total": 39.56402587890625,
291
- "eval_gpu_utilization": 28,
292
- "eval_loss": 1.0597690343856812,
293
- "eval_precision": 0.683800229871734,
294
- "eval_recall": 0.6805,
295
- "eval_runtime": 1.5511,
296
- "eval_samples_per_second": 1289.373,
297
- "eval_steps_per_second": 40.615,
298
- "eval_system_ram_total": 83.48074722290039,
299
- "eval_system_ram_used": 3.837909698486328,
300
- "step": 1375
301
- },
302
- {
303
- "epoch": 6.0,
304
- "learning_rate": 8.008e-06,
305
- "loss": 0.7431,
306
- "step": 1500
307
- },
308
- {
309
- "epoch": 6.0,
310
- "eval_accuracy": 0.702,
311
- "eval_disk_space_total": 78.1898422241211,
312
- "eval_disk_space_used": 25.830699920654297,
313
- "eval_f1": 0.6973584149072398,
314
- "eval_gpu_ram_allocated": 0.39962053298950195,
315
- "eval_gpu_ram_cached": 12.9296875,
316
- "eval_gpu_ram_total": 39.56402587890625,
317
- "eval_gpu_utilization": 31,
318
- "eval_loss": 1.0375711917877197,
319
- "eval_precision": 0.6975777506719404,
320
- "eval_recall": 0.702,
321
- "eval_runtime": 1.5383,
322
- "eval_samples_per_second": 1300.155,
323
- "eval_steps_per_second": 40.955,
324
- "eval_system_ram_total": 83.48074722290039,
325
- "eval_system_ram_used": 3.8545989990234375,
326
- "step": 1500
327
- },
328
- {
329
- "epoch": 6.5,
330
- "learning_rate": 7.0080000000000005e-06,
331
- "loss": 0.7065,
332
- "step": 1625
333
- },
334
- {
335
- "epoch": 6.5,
336
- "eval_accuracy": 0.6995,
337
- "eval_disk_space_total": 78.1898422241211,
338
- "eval_disk_space_used": 26.203968048095703,
339
- "eval_f1": 0.6990180197515704,
340
- "eval_gpu_ram_allocated": 0.39959049224853516,
341
- "eval_gpu_ram_cached": 12.9296875,
342
- "eval_gpu_ram_total": 39.56402587890625,
343
- "eval_gpu_utilization": 28,
344
- "eval_loss": 1.0457407236099243,
345
- "eval_precision": 0.701399008937391,
346
- "eval_recall": 0.6995,
347
- "eval_runtime": 1.5796,
348
- "eval_samples_per_second": 1266.127,
349
- "eval_steps_per_second": 39.883,
350
- "eval_system_ram_total": 83.48074722290039,
351
- "eval_system_ram_used": 4.033943176269531,
352
- "step": 1625
353
- },
354
- {
355
- "epoch": 7.0,
356
- "learning_rate": 6.008000000000001e-06,
357
- "loss": 0.671,
358
- "step": 1750
359
- },
360
- {
361
- "epoch": 7.0,
362
- "eval_accuracy": 0.698,
363
- "eval_disk_space_total": 78.1898422241211,
364
- "eval_disk_space_used": 26.203968048095703,
365
- "eval_f1": 0.6956310421863513,
366
- "eval_gpu_ram_allocated": 0.39962339401245117,
367
- "eval_gpu_ram_cached": 12.9296875,
368
- "eval_gpu_ram_total": 39.56402587890625,
369
- "eval_gpu_utilization": 28,
370
- "eval_loss": 1.039590835571289,
371
- "eval_precision": 0.696566876815876,
372
- "eval_recall": 0.698,
373
- "eval_runtime": 1.5301,
374
- "eval_samples_per_second": 1307.136,
375
- "eval_steps_per_second": 41.175,
376
- "eval_system_ram_total": 83.48074722290039,
377
- "eval_system_ram_used": 4.038356781005859,
378
- "step": 1750
379
- },
380
- {
381
- "epoch": 7.5,
382
- "learning_rate": 5.008000000000001e-06,
383
- "loss": 0.6438,
384
- "step": 1875
385
- },
386
- {
387
- "epoch": 7.5,
388
- "eval_accuracy": 0.6925,
389
- "eval_disk_space_total": 78.1898422241211,
390
- "eval_disk_space_used": 26.203964233398438,
391
- "eval_f1": 0.6886960392924729,
392
- "eval_gpu_ram_allocated": 0.3995976448059082,
393
- "eval_gpu_ram_cached": 12.9296875,
394
- "eval_gpu_ram_total": 39.56402587890625,
395
- "eval_gpu_utilization": 28,
396
- "eval_loss": 1.0473765134811401,
397
- "eval_precision": 0.6906747949914751,
398
- "eval_recall": 0.6925,
399
- "eval_runtime": 1.5569,
400
- "eval_samples_per_second": 1284.611,
401
- "eval_steps_per_second": 40.465,
402
- "eval_system_ram_total": 83.48074722290039,
403
- "eval_system_ram_used": 3.827362060546875,
404
- "step": 1875
405
- },
406
- {
407
- "epoch": 8.0,
408
- "learning_rate": 4.008e-06,
409
- "loss": 0.6326,
410
- "step": 2000
411
- },
412
- {
413
- "epoch": 8.0,
414
- "eval_accuracy": 0.698,
415
- "eval_disk_space_total": 78.1898422241211,
416
- "eval_disk_space_used": 26.204063415527344,
417
- "eval_f1": 0.6972467602684949,
418
- "eval_gpu_ram_allocated": 0.39958906173706055,
419
- "eval_gpu_ram_cached": 12.9296875,
420
- "eval_gpu_ram_total": 39.56402587890625,
421
- "eval_gpu_utilization": 34,
422
- "eval_loss": 1.03837251663208,
423
- "eval_precision": 0.6982790583069545,
424
- "eval_recall": 0.698,
425
- "eval_runtime": 1.5106,
426
- "eval_samples_per_second": 1323.952,
427
- "eval_steps_per_second": 41.704,
428
- "eval_system_ram_total": 83.48074722290039,
429
- "eval_system_ram_used": 3.8401947021484375,
430
- "step": 2000
431
- }
432
- ],
433
- "max_steps": 2500,
434
- "num_train_epochs": 10,
435
- "total_flos": 1010109883418496.0,
436
- "trial_name": null,
437
- "trial_params": null
438
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoint-2000/training_args.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:b163d01ba6550b4d0ea94aab97f417a764349c69c3237b0edc7b5507f1235fe6
3
- size 4091
 
 
 
 
checkpoint-2000/vocab.txt DELETED
The diff for this file is too large to render. See raw diff
 
runs/Jul23_00-54-01_c587bebf8fcc/events.out.tfevents.1690073651.c587bebf8fcc.2239.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bbecb5c809c6be6c8afb303e013916d04358d96b487dee4dec559b0dcf5d3a75
3
- size 26897
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:923bfa4184be2ac7c1ae1dfa982802a88f61003483e02ccb0e3223406b74d6d2
3
+ size 27251
checkpoint-2000/scheduler.pt → runs/Jul23_00-54-01_c587bebf8fcc/events.out.tfevents.1690073907.c587bebf8fcc.2239.1 RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0ad0c62478b179935d131a5f36054eef5c951ef7612bbd788e7a63be9d94d8ef
3
- size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4718c55f24759e71c5aa9bbe1950c8cce6ea2f7597149730814404da616703cd
3
+ size 1033