waiman721 committed on
Commit
ecfe389
1 Parent(s): 13250f3

waiman721/fine_tuned_bart-large-cnn_multi_news

Browse files
README.md CHANGED
@@ -1,10 +1,8 @@
1
  ---
2
- license: apache-2.0
3
- base_model: facebook/bart-base
4
  tags:
5
  - generated_from_trainer
6
- metrics:
7
- - rouge
8
  model-index:
9
  - name: results
10
  results: []
@@ -15,14 +13,19 @@ should probably proofread and complete it, then remove this comment. -->
15
 
16
  # results
17
 
18
- This model is a fine-tuned version of [facebook/bart-base](https://huggingface.co/facebook/bart-base) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
- - Loss: 4.3563
21
- - Rouge1: 21.9158
22
- - Rouge2: 7.8595
23
- - Rougel: 16.6472
24
- - Rougelsum: 18.5866
25
- - Gen Len: 20.0
 
 
 
 
 
26
 
27
  ## Model description
28
 
@@ -48,13 +51,9 @@ The following hyperparameters were used during training:
48
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
49
  - lr_scheduler_type: linear
50
  - lr_scheduler_warmup_steps: 500
51
- - num_epochs: 4
52
  - label_smoothing_factor: 0.1
53
 
54
- ### Training results
55
-
56
-
57
-
58
  ### Framework versions
59
 
60
  - Transformers 4.38.2
 
1
  ---
2
+ license: mit
3
+ base_model: facebook/bart-large-cnn
4
  tags:
5
  - generated_from_trainer
 
 
6
  model-index:
7
  - name: results
8
  results: []
 
13
 
14
  # results
15
 
16
+ This model is a fine-tuned version of [facebook/bart-large-cnn](https://huggingface.co/facebook/bart-large-cnn) on an unknown dataset.
17
  It achieves the following results on the evaluation set:
18
+ - eval_loss: 3.5112
19
+ - eval_rouge1: 36.7687
20
+ - eval_rouge2: 12.7988
21
+ - eval_rougeL: 23.4116
22
+ - eval_rougeLsum: 29.7494
23
+ - eval_gen_len: 65.0396
24
+ - eval_runtime: 1370.2695
25
+ - eval_samples_per_second: 1.641
26
+ - eval_steps_per_second: 0.411
27
+ - epoch: 0.09
28
+ - step: 999
29
 
30
  ## Model description
31
 
 
51
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
52
  - lr_scheduler_type: linear
53
  - lr_scheduler_warmup_steps: 500
54
+ - num_epochs: 1
55
  - label_smoothing_factor: 0.1
56
 
 
 
 
 
57
  ### Framework versions
58
 
59
  - Transformers 4.38.2
adapter_config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
- "base_model_name_or_path": "facebook/bart-base",
5
  "bias": "none",
6
  "fan_in_fan_out": false,
7
  "inference_mode": false,
@@ -20,12 +20,12 @@
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
- "fc1",
24
- "out_proj",
25
  "fc2",
 
26
  "q_proj",
27
- "k_proj",
28
- "v_proj"
 
29
  ],
30
  "task_type": "CAUSAL_LM",
31
  "use_dora": false,
 
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
+ "base_model_name_or_path": "facebook/bart-large-cnn",
5
  "bias": "none",
6
  "fan_in_fan_out": false,
7
  "inference_mode": false,
 
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
 
 
23
  "fc2",
24
+ "v_proj",
25
  "q_proj",
26
+ "out_proj",
27
+ "fc1",
28
+ "k_proj"
29
  ],
30
  "task_type": "CAUSAL_LM",
31
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c1f03eb2ee64b8916f5ea413bf8c86370a1c121ae83de06145764f0f9614bf5c
3
- size 51931152
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:adb96cab28617a8199818c9f1b5cce18e1b9c6292e34246ac774cbf743498ed0
3
+ size 138465976
generation_config.json CHANGED
@@ -5,6 +5,9 @@
5
  "eos_token_id": 2,
6
  "forced_bos_token_id": 0,
7
  "forced_eos_token_id": 2,
 
 
 
8
  "no_repeat_ngram_size": 3,
9
  "num_beams": 4,
10
  "pad_token_id": 1,
 
5
  "eos_token_id": 2,
6
  "forced_bos_token_id": 0,
7
  "forced_eos_token_id": 2,
8
+ "length_penalty": 2.0,
9
+ "max_length": 142,
10
+ "min_length": 56,
11
  "no_repeat_ngram_size": 3,
12
  "num_beams": 4,
13
  "pad_token_id": 1,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:355b9322e55c41a0568c56d3a42865467d431e62102f27845604372b50ae0961
3
  size 4984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:242f0197648bbbdcd8d0d3954e84f1b447715477abe7c9a5f5171d30d2bd29b5
3
  size 4984