fsicoli committed on
Commit
217edc5
1 Parent(s): fda56ca

Model save

Browse files
README.md CHANGED
@@ -53,11 +53,11 @@ More information needed
53
 
54
  The following hyperparameters were used during training:
55
  - learning_rate: 1e-05
56
- - train_batch_size: 1
57
- - eval_batch_size: 1
58
  - seed: 42
59
  - gradient_accumulation_steps: 32
60
- - total_train_batch_size: 32
61
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
62
  - lr_scheduler_type: linear
63
  - lr_scheduler_warmup_steps: 1000
 
53
 
54
  The following hyperparameters were used during training:
55
  - learning_rate: 1e-05
56
+ - train_batch_size: 8
57
+ - eval_batch_size: 8
58
  - seed: 42
59
  - gradient_accumulation_steps: 32
60
+ - total_train_batch_size: 256
61
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
62
  - lr_scheduler_type: linear
63
  - lr_scheduler_warmup_steps: 1000
all_results.json CHANGED
@@ -7,9 +7,9 @@
7
  "eval_steps_per_second": 0.516,
8
  "eval_wer": 0.10174567584881486,
9
  "total_flos": 1.5025096510930944e+20,
10
- "train_loss": 0.029662437230219198,
11
- "train_runtime": 33102.9931,
12
  "train_samples": 22116,
13
- "train_samples_per_second": 1.336,
14
- "train_steps_per_second": 0.042
15
  }
 
7
  "eval_steps_per_second": 0.516,
8
  "eval_wer": 0.10174567584881486,
9
  "total_flos": 1.5025096510930944e+20,
10
+ "train_loss": 0.0,
11
+ "train_runtime": 0.2812,
12
  "train_samples": 22116,
13
+ "train_samples_per_second": 157281.733,
14
+ "train_steps_per_second": 4914.165
15
  }
runs/Aug20_11-15-37_DITEC2014063010/events.out.tfevents.1724163511.DITEC2014063010.19184.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c12437b077e2382e32242751fe8592b161637632ce0c6b4ae80a1a29bdefcf7d
3
+ size 6099
train_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "epoch": 1.999819135467535,
3
  "total_flos": 1.5025096510930944e+20,
4
- "train_loss": 0.029662437230219198,
5
- "train_runtime": 33102.9931,
6
  "train_samples": 22116,
7
- "train_samples_per_second": 1.336,
8
- "train_steps_per_second": 0.042
9
  }
 
1
  {
2
  "epoch": 1.999819135467535,
3
  "total_flos": 1.5025096510930944e+20,
4
+ "train_loss": 0.0,
5
+ "train_runtime": 0.2812,
6
  "train_samples": 22116,
7
+ "train_samples_per_second": 157281.733,
8
+ "train_steps_per_second": 4914.165
9
  }
trainer_state.json CHANGED
@@ -402,23 +402,14 @@
402
  "loss": 0.0844,
403
  "step": 1375
404
  },
405
- {
406
- "epoch": 1.999819135467535,
407
- "eval_loss": 0.14780554175376892,
408
- "eval_runtime": 18259.5061,
409
- "eval_samples_per_second": 0.52,
410
- "eval_steps_per_second": 0.52,
411
- "eval_wer": 0.10174567584881486,
412
- "step": 1382
413
- },
414
  {
415
  "epoch": 1.999819135467535,
416
  "step": 1382,
417
  "total_flos": 1.5025096510930944e+20,
418
- "train_loss": 0.029662437230219198,
419
- "train_runtime": 33102.9931,
420
- "train_samples_per_second": 1.336,
421
- "train_steps_per_second": 0.042
422
  }
423
  ],
424
  "logging_steps": 25,
 
402
  "loss": 0.0844,
403
  "step": 1375
404
  },
 
 
 
 
 
 
 
 
 
405
  {
406
  "epoch": 1.999819135467535,
407
  "step": 1382,
408
  "total_flos": 1.5025096510930944e+20,
409
+ "train_loss": 0.0,
410
+ "train_runtime": 0.2812,
411
+ "train_samples_per_second": 157281.733,
412
+ "train_steps_per_second": 4914.165
413
  }
414
  ],
415
  "logging_steps": 25,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:116e25ebda8a70d357a01b41e14270f82bdd6e179b329884f001f9aabbeebd0f
3
  size 5368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f49e1c774ad26e8ca9801f06aeb95b535c1d5764f78640973f4d9d39e6c0f33f
3
  size 5368