aapot
committed on
Commit
•
48ec1f9
1
Parent(s):
d30d525
Saving weights and logs of step 10000
Browse files
events.out.tfevents.1629925854.t1v-n-1ae8dadb-w-0.258038.0.v2
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d3ba93cc73524ee91a324c9c60c9b1944661982351b153371e82ee189b547e08
|
3 |
+
size 8166703
|
events.out.tfevents.1629954669.t1v-n-1ae8dadb-w-0.348909.0.v2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2754b0718aaa184806c065e66c1e4cd5de84a84f740d764fa0aa7b57e056c74
|
3 |
+
size 1176479
|
events.out.tfevents.1629959691.t1v-n-1ae8dadb-w-0.364831.0.v2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f17a856d2fd8e07f6e5dfeff9ef002b11a709812bd05c57144322ca7fbd2b929
|
3 |
+
size 1470757
|
flax_model.msgpack
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 711588089
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c4b00a73b13270205d21872705ba7bc03f609ecf3c5a6dc99ec19895a8184c9d
|
3 |
size 711588089
|
start_train.sh
CHANGED
@@ -15,8 +15,9 @@ python3 run_mlm_flax.py \
|
|
15 |
--adam_beta1="0.9" \
|
16 |
--adam_beta2="0.98" \
|
17 |
--adam_epsilon="1e-6" \
|
18 |
-
--learning_rate="
|
19 |
-
--
|
|
|
20 |
--overwrite_output_dir \
|
21 |
--num_train_epochs="3" \
|
22 |
--save_strategy="steps" \
|
|
|
15 |
--adam_beta1="0.9" \
|
16 |
--adam_beta2="0.98" \
|
17 |
--adam_epsilon="1e-6" \
|
18 |
+
--learning_rate="2e-4" \
|
19 |
+
# --weight_decay="0.01" \
|
20 |
+
--warmup_steps="1500" \
|
21 |
--overwrite_output_dir \
|
22 |
--num_train_epochs="3" \
|
23 |
--save_strategy="steps" \
|