nandavikas16
committed on
Commit
•
5651fce
1
Parent(s):
e277a4f
Model save
Browse files
README.md
CHANGED
@@ -17,11 +17,11 @@ should probably proofread and complete it, then remove this comment. -->
|
|
17 |
|
18 |
This model is a fine-tuned version of [facebook/bart-large-cnn](https://huggingface.co/facebook/bart-large-cnn) on an unknown dataset.
|
19 |
It achieves the following results on the evaluation set:
|
20 |
-
- Loss: 1.
|
21 |
-
- Rouge1:
|
22 |
-
- Rouge2:
|
23 |
-
- Rougel: 36.
|
24 |
-
- Rougelsum:
|
25 |
|
26 |
## Model description
|
27 |
|
@@ -52,31 +52,31 @@ The following hyperparameters were used during training:
|
|
52 |
|
53 |
| Training Loss | Epoch | Step | Validation Loss | Rouge1 | Rouge2 | Rougel | Rougelsum |
|
54 |
|:-------------:|:-----:|:----:|:---------------:|:-------:|:-------:|:-------:|:---------:|
|
55 |
-
| No log | 1.0 |
|
56 |
-
| 0.
|
57 |
-
| 0.
|
58 |
-
| 0.
|
59 |
-
| 0.
|
60 |
-
| 0.
|
61 |
-
| 0.
|
62 |
-
| 0.
|
63 |
-
| 0.
|
64 |
-
| 0.
|
65 |
-
| 0.
|
66 |
-
| 0.
|
67 |
-
| 0.
|
68 |
-
| 0.
|
69 |
-
| 0.
|
70 |
-
| 0.
|
71 |
-
| 0.
|
72 |
-
| 0.
|
73 |
-
| 0.
|
74 |
-
| 0.
|
75 |
|
76 |
|
77 |
### Framework versions
|
78 |
|
79 |
-
- Transformers 4.38.
|
80 |
- Pytorch 2.2.1+cu121
|
81 |
-
- Datasets 2.
|
82 |
- Tokenizers 0.15.2
|
|
|
17 |
|
18 |
This model is a fine-tuned version of [facebook/bart-large-cnn](https://huggingface.co/facebook/bart-large-cnn) on an unknown dataset.
|
19 |
It achieves the following results on the evaluation set:
|
20 |
+
- Loss: 1.1824
|
21 |
+
- Rouge1: 50.8184
|
22 |
+
- Rouge2: 30.1612
|
23 |
+
- Rougel: 36.9904
|
24 |
+
- Rougelsum: 49.4235
|
25 |
|
26 |
## Model description
|
27 |
|
|
|
52 |
|
53 |
| Training Loss | Epoch | Step | Validation Loss | Rouge1 | Rouge2 | Rougel | Rougelsum |
|
54 |
|:-------------:|:-----:|:----:|:---------------:|:-------:|:-------:|:-------:|:---------:|
|
55 |
+
| No log | 1.0 | 34 | 0.7061 | 44.9133 | 26.0507 | 34.7329 | 43.2231 |
|
56 |
+
| 0.8927 | 2.0 | 68 | 0.7190 | 46.3702 | 26.952 | 36.2244 | 44.7608 |
|
57 |
+
| 0.617 | 3.0 | 102 | 0.6815 | 50.5658 | 28.4213 | 36.4503 | 49.3129 |
|
58 |
+
| 0.617 | 4.0 | 136 | 0.7083 | 50.7172 | 28.1621 | 37.0023 | 49.3293 |
|
59 |
+
| 0.5169 | 5.0 | 170 | 0.6819 | 50.0364 | 27.5729 | 35.9607 | 48.0331 |
|
60 |
+
| 0.4614 | 6.0 | 204 | 0.7171 | 51.0974 | 29.0043 | 36.4498 | 49.6124 |
|
61 |
+
| 0.3995 | 7.0 | 238 | 0.7577 | 50.8879 | 29.3509 | 35.9144 | 49.4029 |
|
62 |
+
| 0.3995 | 8.0 | 272 | 0.8192 | 50.332 | 28.9931 | 36.458 | 48.8301 |
|
63 |
+
| 0.3185 | 9.0 | 306 | 0.8635 | 49.4501 | 27.6673 | 35.7586 | 47.891 |
|
64 |
+
| 0.2627 | 10.0 | 340 | 0.9229 | 51.0907 | 30.1515 | 36.5669 | 49.6126 |
|
65 |
+
| 0.2627 | 11.0 | 374 | 0.9910 | 49.6877 | 29.4712 | 36.5784 | 48.6087 |
|
66 |
+
| 0.1952 | 12.0 | 408 | 1.0266 | 51.3167 | 30.619 | 36.5097 | 49.7864 |
|
67 |
+
| 0.1234 | 13.0 | 442 | 1.0313 | 49.6518 | 28.2854 | 35.9773 | 48.4327 |
|
68 |
+
| 0.0859 | 14.0 | 476 | 1.0791 | 50.3139 | 29.9343 | 35.8756 | 49.0233 |
|
69 |
+
| 0.0859 | 15.0 | 510 | 1.1431 | 50.4173 | 29.047 | 36.4338 | 48.8672 |
|
70 |
+
| 0.0591 | 16.0 | 544 | 1.1455 | 51.733 | 30.786 | 37.4082 | 50.4284 |
|
71 |
+
| 0.0448 | 17.0 | 578 | 1.1353 | 49.5046 | 29.3628 | 36.2758 | 48.324 |
|
72 |
+
| 0.0341 | 18.0 | 612 | 1.1619 | 51.7577 | 31.1043 | 37.9571 | 50.6969 |
|
73 |
+
| 0.0341 | 19.0 | 646 | 1.1748 | 51.4652 | 30.6309 | 36.7434 | 49.9184 |
|
74 |
+
| 0.0255 | 20.0 | 680 | 1.1824 | 50.8184 | 30.1612 | 36.9904 | 49.4235 |
|
75 |
|
76 |
|
77 |
### Framework versions
|
78 |
|
79 |
+
- Transformers 4.38.2
|
80 |
- Pytorch 2.2.1+cu121
|
81 |
+
- Datasets 2.18.0
|
82 |
- Tokenizers 0.15.2
|
generation_config.json
CHANGED
@@ -11,6 +11,6 @@
|
|
11 |
"no_repeat_ngram_size": 3,
|
12 |
"num_beams": 4,
|
13 |
"pad_token_id": 1,
|
14 |
-
"transformers_version": "4.38.
|
15 |
"use_cache": false
|
16 |
}
|
|
|
11 |
"no_repeat_ngram_size": 3,
|
12 |
"num_beams": 4,
|
13 |
"pad_token_id": 1,
|
14 |
+
"transformers_version": "4.38.2",
|
15 |
"use_cache": false
|
16 |
}
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1625422896
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:23459b45621db9abdac4e7887133ab6b7949bfcb5fe5292ccdb2805eb3cf47e5
|
3 |
size 1625422896
|
runs/Mar02_17-15-34_n5qclzvvia/events.out.tfevents.1709399740.n5qclzvvia.422.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2df30cb0402c5d89169845931088c5ee05303f996571b5ac83b0229e26f6a319
|
3 |
+
size 18598
|
runs/Mar02_17-15-34_n5qclzvvia/events.out.tfevents.1709404316.n5qclzvvia.422.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2249e4178ebbb769d376e9505ee7e60a0aa20aeb0b89e9656b39dfc24fc2ce56
|
3 |
+
size 514
|