SumanNazir committed on
Commit
c60f61e
1 Parent(s): 047dfa4

Training in progress, step 548

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "SumanNazir/highlight_summary_model_trained_on_reduced_data",
3
  "_num_labels": 3,
4
  "activation_dropout": 0.0,
5
  "activation_function": "gelu",
@@ -19,7 +19,7 @@
19
  "decoder_layers": 12,
20
  "decoder_start_token_id": 2,
21
  "dropout": 0.1,
22
- "early_stopping": null,
23
  "encoder_attention_heads": 16,
24
  "encoder_ffn_dim": 4096,
25
  "encoder_layerdrop": 0.0,
@@ -42,14 +42,14 @@
42
  "LABEL_1": 1,
43
  "LABEL_2": 2
44
  },
45
- "max_length": null,
46
  "max_position_embeddings": 1024,
47
- "min_length": null,
48
  "model_type": "bart",
49
- "no_repeat_ngram_size": null,
50
  "normalize_before": false,
51
  "normalize_embedding": true,
52
- "num_beams": null,
53
  "num_hidden_layers": 12,
54
  "output_past": true,
55
  "pad_token_id": 1,
@@ -61,7 +61,7 @@
61
  "student_encoder_layers": null,
62
  "task_specific_params": {},
63
  "torch_dtype": "float32",
64
- "transformers_version": "4.45.1",
65
  "use_cache": true,
66
  "vocab_size": 50264
67
  }
 
1
  {
2
+ "_name_or_path": "facebook/bart-large-xsum",
3
  "_num_labels": 3,
4
  "activation_dropout": 0.0,
5
  "activation_function": "gelu",
 
19
  "decoder_layers": 12,
20
  "decoder_start_token_id": 2,
21
  "dropout": 0.1,
22
+ "early_stopping": true,
23
  "encoder_attention_heads": 16,
24
  "encoder_ffn_dim": 4096,
25
  "encoder_layerdrop": 0.0,
 
42
  "LABEL_1": 1,
43
  "LABEL_2": 2
44
  },
45
+ "max_length": 62,
46
  "max_position_embeddings": 1024,
47
+ "min_length": 11,
48
  "model_type": "bart",
49
+ "no_repeat_ngram_size": 3,
50
  "normalize_before": false,
51
  "normalize_embedding": true,
52
+ "num_beams": 6,
53
  "num_hidden_layers": 12,
54
  "output_past": true,
55
  "pad_token_id": 1,
 
61
  "student_encoder_layers": null,
62
  "task_specific_params": {},
63
  "torch_dtype": "float32",
64
+ "transformers_version": "4.44.2",
65
  "use_cache": true,
66
  "vocab_size": 50264
67
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eb2c1409d0b0378fa857e6f38e5c28c0457f2cd3f4f0ad1ecec0aa69046479e2
3
  size 1625422896
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d66c059ea26aa5cd256e556385200e2a5dad918635b21d5534409b1141106f37
3
  size 1625422896
runs/Sep30_19-19-52_13959885f477/events.out.tfevents.1727723993.13959885f477.218.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f97c0ee59cdede55e235dff16075fbff428037e907923b650ec1bb92087cc2f8
3
+ size 6063
runs/Sep30_19-21-23_13959885f477/events.out.tfevents.1727724084.13959885f477.218.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03bf3b4430ffeead23e8546c8acdd91eb69c042c8597324c50f4b074111169b8
3
+ size 6063
runs/Sep30_19-22-06_13959885f477/events.out.tfevents.1727724127.13959885f477.218.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7034599ca5c205444a3941b41076d3af4c2ce0e59b80e840740d1d603fdea655
3
+ size 6063
runs/Sep30_19-26-28_13959885f477/events.out.tfevents.1727724389.13959885f477.218.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4cf299bff97b5911f1ad6faee44682ebacd1639996cad5ca7b66fa9c5446a543
3
+ size 7168
special_tokens_map.json CHANGED
@@ -1,25 +1,7 @@
1
  {
2
- "bos_token": {
3
- "content": "<s>",
4
- "lstrip": false,
5
- "normalized": true,
6
- "rstrip": false,
7
- "single_word": false
8
- },
9
- "cls_token": {
10
- "content": "<s>",
11
- "lstrip": false,
12
- "normalized": true,
13
- "rstrip": false,
14
- "single_word": false
15
- },
16
- "eos_token": {
17
- "content": "</s>",
18
- "lstrip": false,
19
- "normalized": true,
20
- "rstrip": false,
21
- "single_word": false
22
- },
23
  "mask_token": {
24
  "content": "<mask>",
25
  "lstrip": true,
@@ -27,25 +9,7 @@
27
  "rstrip": false,
28
  "single_word": false
29
  },
30
- "pad_token": {
31
- "content": "<pad>",
32
- "lstrip": false,
33
- "normalized": true,
34
- "rstrip": false,
35
- "single_word": false
36
- },
37
- "sep_token": {
38
- "content": "</s>",
39
- "lstrip": false,
40
- "normalized": true,
41
- "rstrip": false,
42
- "single_word": false
43
- },
44
- "unk_token": {
45
- "content": "<unk>",
46
- "lstrip": false,
47
- "normalized": true,
48
- "rstrip": false,
49
- "single_word": false
50
- }
51
  }
 
1
  {
2
+ "bos_token": "<s>",
3
+ "cls_token": "<s>",
4
+ "eos_token": "</s>",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5
  "mask_token": {
6
  "content": "<mask>",
7
  "lstrip": true,
 
9
  "rstrip": false,
10
  "single_word": false
11
  },
12
+ "pad_token": "<pad>",
13
+ "sep_token": "</s>",
14
+ "unk_token": "<unk>"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
15
  }
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json CHANGED
@@ -48,14 +48,10 @@
48
  "eos_token": "</s>",
49
  "errors": "replace",
50
  "mask_token": "<mask>",
51
- "max_length": 128,
52
  "model_max_length": 1024,
53
  "pad_token": "<pad>",
54
  "sep_token": "</s>",
55
- "stride": 0,
56
  "tokenizer_class": "BartTokenizer",
57
  "trim_offsets": true,
58
- "truncation_side": "right",
59
- "truncation_strategy": "longest_first",
60
  "unk_token": "<unk>"
61
  }
 
48
  "eos_token": "</s>",
49
  "errors": "replace",
50
  "mask_token": "<mask>",
 
51
  "model_max_length": 1024,
52
  "pad_token": "<pad>",
53
  "sep_token": "</s>",
 
54
  "tokenizer_class": "BartTokenizer",
55
  "trim_offsets": true,
 
 
56
  "unk_token": "<unk>"
57
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:91d28a5d8ed58d85f6623fb26bf4c5e3cfd45cab54f6826968ddc935cbca09c8
3
- size 5432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6035351f6f9d1fa4425975b1fe2fc2c505ee88cbad734c53c485bbb25c9e4e79
3
+ size 5368