peterbeamish committed on
Commit
9ff1453
1 Parent(s): 0273197

End of training

Browse files
Files changed (3) hide show
  1. README.md +7 -7
  2. trainer_state.json +24 -24
  3. training_args.bin +1 -1
README.md CHANGED
@@ -18,10 +18,10 @@ should probably proofread and complete it, then remove this comment. -->
18
  This model is a fine-tuned version of [google/flan-t5-small](https://huggingface.co/google/flan-t5-small) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
  - Loss: 1.3339
21
- - Rouge1: 0.3861
22
- - Rouge2: 0.2867
23
- - Rougel: 0.3878
24
- - Rougelsum: 0.3898
25
  - Gen Len: 13.16
26
 
27
  ## Model description
@@ -53,9 +53,9 @@ The following hyperparameters were used during training:
53
 
54
  | Training Loss | Epoch | Step | Validation Loss | Rouge1 | Rouge2 | Rougel | Rougelsum | Gen Len |
55
  |:-------------:|:-----:|:----:|:---------------:|:------:|:------:|:------:|:---------:|:-------:|
56
- | 1.9101 | 2.0 | 100 | 1.4032 | 0.3914 | 0.2858 | 0.3924 | 0.3934 | 12.7 |
57
- | 1.4264 | 4.0 | 200 | 1.3399 | 0.3805 | 0.287 | 0.382 | 0.3841 | 12.68 |
58
- | 1.3121 | 6.0 | 300 | 1.3339 | 0.3861 | 0.2867 | 0.3878 | 0.3898 | 13.16 |
59
 
60
 
61
  ### Framework versions
 
18
  This model is a fine-tuned version of [google/flan-t5-small](https://huggingface.co/google/flan-t5-small) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
  - Loss: 1.3339
21
+ - Rouge1: 0.3878
22
+ - Rouge2: 0.2902
23
+ - Rougel: 0.3871
24
+ - Rougelsum: 0.3871
25
  - Gen Len: 13.16
26
 
27
  ## Model description
 
53
 
54
  | Training Loss | Epoch | Step | Validation Loss | Rouge1 | Rouge2 | Rougel | Rougelsum | Gen Len |
55
  |:-------------:|:-----:|:----:|:---------------:|:------:|:------:|:------:|:---------:|:-------:|
56
+ | 1.9101 | 2.0 | 100 | 1.4032 | 0.3928 | 0.2897 | 0.3915 | 0.3911 | 12.7 |
57
+ | 1.4264 | 4.0 | 200 | 1.3399 | 0.3826 | 0.2908 | 0.3808 | 0.3809 | 12.68 |
58
+ | 1.3121 | 6.0 | 300 | 1.3339 | 0.3878 | 0.2902 | 0.3871 | 0.3871 | 13.16 |
59
 
60
 
61
  ### Framework versions
trainer_state.json CHANGED
@@ -18,13 +18,13 @@
18
  "epoch": 2.0,
19
  "eval_gen_len": 12.7,
20
  "eval_loss": 1.4032484292984009,
21
- "eval_rouge1": 0.3914,
22
- "eval_rouge2": 0.2858,
23
- "eval_rougeL": 0.3924,
24
- "eval_rougeLsum": 0.3934,
25
- "eval_runtime": 14.4875,
26
- "eval_samples_per_second": 6.903,
27
- "eval_steps_per_second": 3.451,
28
  "step": 100
29
  },
30
  {
@@ -37,13 +37,13 @@
37
  "epoch": 4.0,
38
  "eval_gen_len": 12.68,
39
  "eval_loss": 1.3398905992507935,
40
- "eval_rouge1": 0.3805,
41
- "eval_rouge2": 0.287,
42
- "eval_rougeL": 0.382,
43
- "eval_rougeLsum": 0.3841,
44
- "eval_runtime": 14.5729,
45
- "eval_samples_per_second": 6.862,
46
- "eval_steps_per_second": 3.431,
47
  "step": 200
48
  },
49
  {
@@ -56,13 +56,13 @@
56
  "epoch": 6.0,
57
  "eval_gen_len": 13.16,
58
  "eval_loss": 1.3339253664016724,
59
- "eval_rouge1": 0.3861,
60
- "eval_rouge2": 0.2867,
61
- "eval_rougeL": 0.3878,
62
- "eval_rougeLsum": 0.3898,
63
- "eval_runtime": 15.3545,
64
- "eval_samples_per_second": 6.513,
65
- "eval_steps_per_second": 3.256,
66
  "step": 300
67
  },
68
  {
@@ -70,9 +70,9 @@
70
  "step": 300,
71
  "total_flos": 111534302822400.0,
72
  "train_loss": 1.5495406595865886,
73
- "train_runtime": 74.9004,
74
- "train_samples_per_second": 8.011,
75
- "train_steps_per_second": 4.005
76
  }
77
  ],
78
  "logging_steps": 100,
 
18
  "epoch": 2.0,
19
  "eval_gen_len": 12.7,
20
  "eval_loss": 1.4032484292984009,
21
+ "eval_rouge1": 0.3928,
22
+ "eval_rouge2": 0.2897,
23
+ "eval_rougeL": 0.3915,
24
+ "eval_rougeLsum": 0.3911,
25
+ "eval_runtime": 14.5472,
26
+ "eval_samples_per_second": 6.874,
27
+ "eval_steps_per_second": 3.437,
28
  "step": 100
29
  },
30
  {
 
37
  "epoch": 4.0,
38
  "eval_gen_len": 12.68,
39
  "eval_loss": 1.3398905992507935,
40
+ "eval_rouge1": 0.3826,
41
+ "eval_rouge2": 0.2908,
42
+ "eval_rougeL": 0.3808,
43
+ "eval_rougeLsum": 0.3809,
44
+ "eval_runtime": 14.6388,
45
+ "eval_samples_per_second": 6.831,
46
+ "eval_steps_per_second": 3.416,
47
  "step": 200
48
  },
49
  {
 
56
  "epoch": 6.0,
57
  "eval_gen_len": 13.16,
58
  "eval_loss": 1.3339253664016724,
59
+ "eval_rouge1": 0.3878,
60
+ "eval_rouge2": 0.2902,
61
+ "eval_rougeL": 0.3871,
62
+ "eval_rougeLsum": 0.3871,
63
+ "eval_runtime": 15.4855,
64
+ "eval_samples_per_second": 6.458,
65
+ "eval_steps_per_second": 3.229,
66
  "step": 300
67
  },
68
  {
 
70
  "step": 300,
71
  "total_flos": 111534302822400.0,
72
  "train_loss": 1.5495406595865886,
73
+ "train_runtime": 75.3909,
74
+ "train_samples_per_second": 7.959,
75
+ "train_steps_per_second": 3.979
76
  }
77
  ],
78
  "logging_steps": 100,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9da472b08deaef8c8414c7727a31d6ee03fb06b4f3e229ea402bdd50ebbc5835
3
  size 4219
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47e37319b6c5f5fc1cf34c2c247f61d37f8f85bb95fcd70040aa535f8b9d85e4
3
  size 4219