Shu Huang
committed on
Commit
·
20744c3
1
Parent(s):
cf856ed
1000000 steps
Browse files
- all_results.json +15 -0
- config.json +26 -0
- eval_results.json +10 -0
- pytorch_model.bin +3 -0
- runs/Feb15_13-06-05_thetagpu16/1644959202.968566/events.out.tfevents.1644959202.thetagpu16.3475223.1 +3 -0
- runs/Feb15_13-06-05_thetagpu16/events.out.tfevents.1644959202.thetagpu16.3475223.0 +3 -0
- runs/Feb16_03-38-57_thetagpu10/1645004399.7457194/events.out.tfevents.1645004399.thetagpu10.1078855.1 +3 -0
- runs/Feb16_03-38-57_thetagpu10/events.out.tfevents.1645004399.thetagpu10.1078855.0 +3 -0
- runs/Feb16_11-21-45_thetagpu01/1645032183.4491427/events.out.tfevents.1645032183.thetagpu01.894464.1 +3 -0
- runs/Feb16_11-21-45_thetagpu01/events.out.tfevents.1645032183.thetagpu01.894464.0 +3 -0
- runs/Feb17_17-29-07_thetagpu22/1645140625.1277843/events.out.tfevents.1645140625.thetagpu22.688945.1 +3 -0
- runs/Feb17_17-29-07_thetagpu22/events.out.tfevents.1645140625.thetagpu22.688945.0 +3 -0
- runs/Feb18_13-06-02_thetagpu19/1645211235.6252458/events.out.tfevents.1645211235.thetagpu19.1546579.1 +3 -0
- runs/Feb18_13-06-02_thetagpu19/events.out.tfevents.1645211235.thetagpu19.1546579.0 +3 -0
- runs/Feb19_03-36-57_thetagpu09/1645263494.9753404/events.out.tfevents.1645263494.thetagpu09.140427.1 +3 -0
- runs/Feb19_03-36-57_thetagpu09/events.out.tfevents.1645263494.thetagpu09.140427.0 +3 -0
- runs/Feb19_21-48-52_thetagpu16/1645329014.1607616/events.out.tfevents.1645329014.thetagpu16.3307329.1 +3 -0
- runs/Feb19_21-48-52_thetagpu16/events.out.tfevents.1645329014.thetagpu16.3307329.0 +3 -0
- runs/Feb21_21-03-03_thetagpu22/1645499051.7776277/events.out.tfevents.1645499051.thetagpu22.2987543.1 +3 -0
- runs/Feb21_21-03-03_thetagpu22/events.out.tfevents.1645499051.thetagpu22.2987543.0 +3 -0
- runs/Feb23_00-42-24_thetagpu10/1645598615.9464502/events.out.tfevents.1645598615.thetagpu10.3971422.1 +3 -0
- runs/Feb23_00-42-24_thetagpu10/events.out.tfevents.1645598615.thetagpu10.3971422.0 +3 -0
- runs/Feb23_21-04-16_thetagpu03/1645671939.900241/events.out.tfevents.1645671939.thetagpu03.3458548.1 +3 -0
- runs/Feb23_21-04-16_thetagpu03/events.out.tfevents.1645671939.thetagpu03.3458548.0 +3 -0
- runs/Feb25_04-37-03_thetagpu06/1645785500.2812984/events.out.tfevents.1645785500.thetagpu06.1824549.1 +3 -0
- runs/Feb25_04-37-03_thetagpu06/events.out.tfevents.1645785500.thetagpu06.1824549.0 +3 -0
- runs/Feb25_12-30-51_thetagpu14/1645813958.182742/events.out.tfevents.1645813958.thetagpu14.3540880.1 +3 -0
- runs/Feb25_12-30-51_thetagpu14/events.out.tfevents.1645813958.thetagpu14.3540880.0 +3 -0
- runs/Feb25_12-30-51_thetagpu14/events.out.tfevents.1645825337.thetagpu14.3540880.2 +3 -0
- special_tokens_map.json +1 -0
- tokenizer.json +0 -0
- tokenizer_config.json +1 -0
- train_results.json +8 -0
- trainer_state.json +0 -0
- training_args.bin +3 -0
- vocab.txt +0 -0
all_results.json
ADDED
@@ -0,0 +1,15 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"epoch": 45.04,
|
3 |
+
"eval_accuracy": 0.7908352567121055,
|
4 |
+
"eval_loss": 0.8752322793006897,
|
5 |
+
"eval_runtime": 52.2322,
|
6 |
+
"eval_samples": 48910,
|
7 |
+
"eval_samples_per_second": 936.395,
|
8 |
+
"eval_steps_per_second": 14.646,
|
9 |
+
"perplexity": 2.3994325677619006,
|
10 |
+
"train_loss": 0.020673565490722655,
|
11 |
+
"train_runtime": 11326.2724,
|
12 |
+
"train_samples": 5683580,
|
13 |
+
"train_samples_per_second": 22602.317,
|
14 |
+
"train_steps_per_second": 88.29
|
15 |
+
}
|
config.json
ADDED
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "bert-base-uncased",
|
3 |
+
"architectures": [
|
4 |
+
"BertForMaskedLM"
|
5 |
+
],
|
6 |
+
"attention_probs_dropout_prob": 0.1,
|
7 |
+
"classifier_dropout": null,
|
8 |
+
"gradient_checkpointing": false,
|
9 |
+
"hidden_act": "gelu",
|
10 |
+
"hidden_dropout_prob": 0.1,
|
11 |
+
"hidden_size": 768,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 3072,
|
14 |
+
"layer_norm_eps": 1e-12,
|
15 |
+
"max_position_embeddings": 512,
|
16 |
+
"model_type": "bert",
|
17 |
+
"num_attention_heads": 12,
|
18 |
+
"num_hidden_layers": 12,
|
19 |
+
"pad_token_id": 0,
|
20 |
+
"position_embedding_type": "absolute",
|
21 |
+
"torch_dtype": "float32",
|
22 |
+
"transformers_version": "4.17.0.dev0",
|
23 |
+
"type_vocab_size": 2,
|
24 |
+
"use_cache": true,
|
25 |
+
"vocab_size": 30522
|
26 |
+
}
|
eval_results.json
ADDED
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"epoch": 45.04,
|
3 |
+
"eval_accuracy": 0.7908352567121055,
|
4 |
+
"eval_loss": 0.8752322793006897,
|
5 |
+
"eval_runtime": 52.2322,
|
6 |
+
"eval_samples": 48910,
|
7 |
+
"eval_samples_per_second": 936.395,
|
8 |
+
"eval_steps_per_second": 14.646,
|
9 |
+
"perplexity": 2.3994325677619006
|
10 |
+
}
|
pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:234a60db1081ced4920b77ea390eea5ebbcbb2d230babecbb023847c73bf45ff
|
3 |
+
size 438147282
|
runs/Feb15_13-06-05_thetagpu16/1644959202.968566/events.out.tfevents.1644959202.thetagpu16.3475223.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9094a4850862a791140c8f5c9e3e8ffcdeaea1f51616d3eff81f585df17872a6
|
3 |
+
size 4921
|
runs/Feb15_13-06-05_thetagpu16/events.out.tfevents.1644959202.thetagpu16.3475223.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f5167bff58a1a17e8306c356248b1127ceca62729a48baaa5a07f32d33af1692
|
3 |
+
size 32677
|
runs/Feb16_03-38-57_thetagpu10/1645004399.7457194/events.out.tfevents.1645004399.thetagpu10.1078855.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:458f6208b576f6ca6c03b2e88e81c006bb7e57809d9dae1e07e48aebd03aa087
|
3 |
+
size 4921
|
runs/Feb16_03-38-57_thetagpu10/events.out.tfevents.1645004399.thetagpu10.1078855.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82215f833df3b39e85358b91ed7d5d644c27ec08a2ca30e4b5d6f681ee0a90ca
|
3 |
+
size 3471
|
runs/Feb16_11-21-45_thetagpu01/1645032183.4491427/events.out.tfevents.1645032183.thetagpu01.894464.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2efa2b8b30262095e8af521cffa1a69cbb0ad523d10c90ea51e5fdff7280905c
|
3 |
+
size 4921
|
runs/Feb16_11-21-45_thetagpu01/events.out.tfevents.1645032183.thetagpu01.894464.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:09a42a10378e34a7b038f5858b234ab9997b2e7768194a7c889c001e7b0430f0
|
3 |
+
size 42395
|
runs/Feb17_17-29-07_thetagpu22/1645140625.1277843/events.out.tfevents.1645140625.thetagpu22.688945.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e7587fb5780d1d90fa46b2d3d4c9347c5100e1829889ffde742438a1e358a603
|
3 |
+
size 4921
|
runs/Feb17_17-29-07_thetagpu22/events.out.tfevents.1645140625.thetagpu22.688945.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa8cf611f14617ce0f054dabf7d523c1eb32b73cc654710d7697712c2b6c7e9a
|
3 |
+
size 28458
|
runs/Feb18_13-06-02_thetagpu19/1645211235.6252458/events.out.tfevents.1645211235.thetagpu19.1546579.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:01af60a9ab98726b5b8c5ee0885eed1c5620d68ae0afcd1a29dad61133ace817
|
3 |
+
size 4921
|
runs/Feb18_13-06-02_thetagpu19/events.out.tfevents.1645211235.thetagpu19.1546579.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4c39cd4bf63ac197c94c58ed8f1e6f286ae217f55aee3a6e8c10eafb926913b
|
3 |
+
size 42557
|
runs/Feb19_03-36-57_thetagpu09/1645263494.9753404/events.out.tfevents.1645263494.thetagpu09.140427.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:850afb32bf32ba255b139d88a8cadbe9d3d86f9628dd6997b73c022530d9bbb2
|
3 |
+
size 4921
|
runs/Feb19_03-36-57_thetagpu09/events.out.tfevents.1645263494.thetagpu09.140427.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1e4cce1e830c592b026dc20d5ff28b5be6038e00f8fd7f079da86674c896b147
|
3 |
+
size 39037
|
runs/Feb19_21-48-52_thetagpu16/1645329014.1607616/events.out.tfevents.1645329014.thetagpu16.3307329.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0a686b60004bee38fb2d4f55d3dbce6200a71b810dd4ca9040a58590acb7bd90
|
3 |
+
size 4921
|
runs/Feb19_21-48-52_thetagpu16/events.out.tfevents.1645329014.thetagpu16.3307329.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f09d0dd7b46f15c3b54d7ebb00bda8c1a693658238dc3b68e5e4b98840f2265
|
3 |
+
size 42557
|
runs/Feb21_21-03-03_thetagpu22/1645499051.7776277/events.out.tfevents.1645499051.thetagpu22.2987543.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:374b17001790ae2b1379f83e500d4e57e1b98980fc383d3acc40c907671f302c
|
3 |
+
size 4921
|
runs/Feb21_21-03-03_thetagpu22/events.out.tfevents.1645499051.thetagpu22.2987543.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c9524f35c9e3f6bec6b688bbd2fe5aedb4de2ea16fcd7d06a0b2951ca57c83c
|
3 |
+
size 39188
|
runs/Feb23_00-42-24_thetagpu10/1645598615.9464502/events.out.tfevents.1645598615.thetagpu10.3971422.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b1bdbb10284167937b6d61e8e567258fa3b8c27e6463f1d6d301aa87a36344e0
|
3 |
+
size 4921
|
runs/Feb23_00-42-24_thetagpu10/events.out.tfevents.1645598615.thetagpu10.3971422.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:03fd962da98d2e1bd07cdbd846b77518344bede5f662d1344370ba017a4ce726
|
3 |
+
size 43197
|
runs/Feb23_21-04-16_thetagpu03/1645671939.900241/events.out.tfevents.1645671939.thetagpu03.3458548.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a6784e633e67f122e49f2129923996932cecc07a0cc6c6718c2b69d2d6a51eb8
|
3 |
+
size 4921
|
runs/Feb23_21-04-16_thetagpu03/events.out.tfevents.1645671939.thetagpu03.3458548.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4371ce8d0a16b754e37f917967175e132601e4019685088b7f48b6593799c89e
|
3 |
+
size 38557
|
runs/Feb25_04-37-03_thetagpu06/1645785500.2812984/events.out.tfevents.1645785500.thetagpu06.1824549.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:28a72c16c0d8bb4fa40e4491242d7f91680310e85e9504c1c4af19888e269309
|
3 |
+
size 4921
|
runs/Feb25_04-37-03_thetagpu06/events.out.tfevents.1645785500.thetagpu06.1824549.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:add3c888dba5e3c257311b8c969ec55e9209a56374a4a7d44e63057e5f5d6d84
|
3 |
+
size 29908
|
runs/Feb25_12-30-51_thetagpu14/1645813958.182742/events.out.tfevents.1645813958.thetagpu14.3540880.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:37fae465b3d781d9fa9bd96c87d16da40b6345c0cf2220b43d6f00f138735aeb
|
3 |
+
size 4921
|
runs/Feb25_12-30-51_thetagpu14/events.out.tfevents.1645813958.thetagpu14.3540880.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f72ed888f3113ffaeeb4935aa454c458d7b33b9022cf7302909ffd328c652a1b
|
3 |
+
size 10890
|
runs/Feb25_12-30-51_thetagpu14/events.out.tfevents.1645825337.thetagpu14.3540880.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b671dff4c1fede13614a3238c83013dbc0d8ae04266809fff200611968963521
|
3 |
+
size 369
|
special_tokens_map.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]"}
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer_config.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"do_lower_case": true, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "tokenize_chinese_chars": true, "strip_accents": null, "model_max_length": 512, "special_tokens_map_file": null, "name_or_path": "bert-base-uncased", "tokenizer_class": "BertTokenizer"}
|
train_results.json
ADDED
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"epoch": 45.04,
|
3 |
+
"train_loss": 0.020673565490722655,
|
4 |
+
"train_runtime": 11326.2724,
|
5 |
+
"train_samples": 5683580,
|
6 |
+
"train_samples_per_second": 22602.317,
|
7 |
+
"train_steps_per_second": 88.29
|
8 |
+
}
|
trainer_state.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6b281e81ecd6452c20367a7c7e17efff7357d0120916f07b27ff0aa0f14b44d8
|
3 |
+
size 3119
|
vocab.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|