w05230505 committed on
Commit
793ef90
1 Parent(s): 8368c0c

End of training

Browse files
Files changed (5) hide show
  1. README.md +17 -2
  2. all_results.json +17 -0
  3. eval_results.json +11 -0
  4. train_results.json +9 -0
  5. trainer_state.json +96 -0
README.md CHANGED
@@ -1,14 +1,29 @@
1
  ---
2
  library_name: transformers
 
 
3
  license: apache-2.0
4
  base_model: bert-base-uncased
5
  tags:
6
  - generated_from_trainer
 
 
7
  metrics:
8
  - spearmanr
9
  model-index:
10
  - name: bert-base-uncased-finetuned-stsb
11
- results: []
 
 
 
 
 
 
 
 
 
 
 
12
  ---
13
 
14
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -16,7 +31,7 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  # bert-base-uncased-finetuned-stsb
18
 
19
- This model is a fine-tuned version of [bert-base-uncased](https://huggingface.co/bert-base-uncased) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
  - Loss: 0.5010
22
  - Pearson: 0.8856
 
1
  ---
2
  library_name: transformers
3
+ language:
4
+ - en
5
  license: apache-2.0
6
  base_model: bert-base-uncased
7
  tags:
8
  - generated_from_trainer
9
+ datasets:
10
+ - glue
11
  metrics:
12
  - spearmanr
13
  model-index:
14
  - name: bert-base-uncased-finetuned-stsb
15
+ results:
16
+ - task:
17
+ name: Text Classification
18
+ type: text-classification
19
+ dataset:
20
+ name: GLUE STSB
21
+ type: glue
22
+ args: stsb
23
+ metrics:
24
+ - name: Spearmanr
25
+ type: spearmanr
26
+ value: 0.8816479546260654
27
  ---
28
 
29
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
31
 
32
  # bert-base-uncased-finetuned-stsb
33
 
34
+ This model is a fine-tuned version of [bert-base-uncased](https://huggingface.co/bert-base-uncased) on the GLUE STSB dataset.
35
  It achieves the following results on the evaluation set:
36
  - Loss: 0.5010
37
  - Pearson: 0.8856
all_results.json ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 3.0,
3
+ "eval_combined_score": 0.8836428004813802,
4
+ "eval_loss": 0.5009750723838806,
5
+ "eval_pearson": 0.8856376463366951,
6
+ "eval_runtime": 6.5531,
7
+ "eval_samples": 1500,
8
+ "eval_samples_per_second": 228.9,
9
+ "eval_spearmanr": 0.8816479546260654,
10
+ "eval_steps_per_second": 28.689,
11
+ "total_flos": 4537835628033024.0,
12
+ "train_loss": 0.615536986456977,
13
+ "train_runtime": 261.8102,
14
+ "train_samples": 5749,
15
+ "train_samples_per_second": 65.876,
16
+ "train_steps_per_second": 4.125
17
+ }
eval_results.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 3.0,
3
+ "eval_combined_score": 0.8836428004813802,
4
+ "eval_loss": 0.5009750723838806,
5
+ "eval_pearson": 0.8856376463366951,
6
+ "eval_runtime": 6.5531,
7
+ "eval_samples": 1500,
8
+ "eval_samples_per_second": 228.9,
9
+ "eval_spearmanr": 0.8816479546260654,
10
+ "eval_steps_per_second": 28.689
11
+ }
train_results.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 3.0,
3
+ "total_flos": 4537835628033024.0,
4
+ "train_loss": 0.615536986456977,
5
+ "train_runtime": 261.8102,
6
+ "train_samples": 5749,
7
+ "train_samples_per_second": 65.876,
8
+ "train_steps_per_second": 4.125
9
+ }
trainer_state.json ADDED
@@ -0,0 +1,96 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 3.0,
5
+ "eval_steps": 500,
6
+ "global_step": 1080,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 1.0,
13
+ "grad_norm": 36.04340744018555,
14
+ "learning_rate": 1.3333333333333333e-05,
15
+ "loss": 1.1212,
16
+ "step": 360
17
+ },
18
+ {
19
+ "epoch": 1.0,
20
+ "eval_combined_score": 0.8775720604589583,
21
+ "eval_loss": 0.5732272267341614,
22
+ "eval_pearson": 0.8789818053039898,
23
+ "eval_runtime": 6.5665,
24
+ "eval_samples_per_second": 228.431,
25
+ "eval_spearmanr": 0.8761623156139267,
26
+ "eval_steps_per_second": 28.63,
27
+ "step": 360
28
+ },
29
+ {
30
+ "epoch": 2.0,
31
+ "grad_norm": 15.674260139465332,
32
+ "learning_rate": 6.666666666666667e-06,
33
+ "loss": 0.4308,
34
+ "step": 720
35
+ },
36
+ {
37
+ "epoch": 2.0,
38
+ "eval_combined_score": 0.8794983049402647,
39
+ "eval_loss": 0.5606899261474609,
40
+ "eval_pearson": 0.881313245175558,
41
+ "eval_runtime": 6.5051,
42
+ "eval_samples_per_second": 230.59,
43
+ "eval_spearmanr": 0.8776833647049715,
44
+ "eval_steps_per_second": 28.901,
45
+ "step": 720
46
+ },
47
+ {
48
+ "epoch": 3.0,
49
+ "grad_norm": 56.831668853759766,
50
+ "learning_rate": 0.0,
51
+ "loss": 0.2947,
52
+ "step": 1080
53
+ },
54
+ {
55
+ "epoch": 3.0,
56
+ "eval_combined_score": 0.8836428004813802,
57
+ "eval_loss": 0.5009750723838806,
58
+ "eval_pearson": 0.8856376463366951,
59
+ "eval_runtime": 6.5121,
60
+ "eval_samples_per_second": 230.341,
61
+ "eval_spearmanr": 0.8816479546260654,
62
+ "eval_steps_per_second": 28.869,
63
+ "step": 1080
64
+ },
65
+ {
66
+ "epoch": 3.0,
67
+ "step": 1080,
68
+ "total_flos": 4537835628033024.0,
69
+ "train_loss": 0.615536986456977,
70
+ "train_runtime": 261.8102,
71
+ "train_samples_per_second": 65.876,
72
+ "train_steps_per_second": 4.125
73
+ }
74
+ ],
75
+ "logging_steps": 500,
76
+ "max_steps": 1080,
77
+ "num_input_tokens_seen": 0,
78
+ "num_train_epochs": 3,
79
+ "save_steps": 500,
80
+ "stateful_callbacks": {
81
+ "TrainerControl": {
82
+ "args": {
83
+ "should_epoch_stop": false,
84
+ "should_evaluate": false,
85
+ "should_log": false,
86
+ "should_save": true,
87
+ "should_training_stop": true
88
+ },
89
+ "attributes": {}
90
+ }
91
+ },
92
+ "total_flos": 4537835628033024.0,
93
+ "train_batch_size": 16,
94
+ "trial_name": null,
95
+ "trial_params": null
96
+ }