Remove old experiment logs and model weights, and lower save_steps
Browse files
events.out.tfevents.1625918979.t1v-n-bf8aeee7-w-0.7214.3.v2
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:ef474e83a08aee1c207f08dd5317d5ac90a71305e8c74e12268e8e7fabeef00d
|
3 |
-
size 1471307
|
|
|
|
|
|
|
|
flax_model.msgpack
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:c4b91ba56a9d6472f9f270d739f351db729a31f24ff11fd4bd77ba47504d3ff0
|
3 |
-
size 249750019
|
|
|
|
|
|
|
|
run.sh
CHANGED
@@ -1,6 +1,5 @@
|
|
1 |
#!/usr/bin/env bash
|
2 |
python3 run_mlm_flax.py \
|
3 |
-
--model_name_or_path="flax_model.msgpack" \
|
4 |
--output_dir="./" \
|
5 |
--model_type="roberta" \
|
6 |
--config_name="./" \
|
@@ -13,14 +12,14 @@ python3 run_mlm_flax.py \
|
|
13 |
--per_device_train_batch_size="32" \
|
14 |
--per_device_eval_batch_size="32" \
|
15 |
--learning_rate="3e-5" \
|
16 |
-
--warmup_steps="
|
17 |
--overwrite_output_dir \
|
18 |
--seed="19" \
|
19 |
--num_train_epochs="8" \
|
20 |
--adam_beta1="0.9" \
|
21 |
--adam_beta2="0.98" \
|
22 |
--logging_steps="500" \
|
23 |
-
--save_steps="
|
24 |
--eval_steps="20000" \
|
25 |
--dtype="bfloat16" \
|
26 |
--push_to_hub
|
|
|
1 |
#!/usr/bin/env bash
|
2 |
python3 run_mlm_flax.py \
|
|
|
3 |
--output_dir="./" \
|
4 |
--model_type="roberta" \
|
5 |
--config_name="./" \
|
|
|
12 |
--per_device_train_batch_size="32" \
|
13 |
--per_device_eval_batch_size="32" \
|
14 |
--learning_rate="3e-5" \
|
15 |
+
--warmup_steps="5000" \
|
16 |
--overwrite_output_dir \
|
17 |
--seed="19" \
|
18 |
--num_train_epochs="8" \
|
19 |
--adam_beta1="0.9" \
|
20 |
--adam_beta2="0.98" \
|
21 |
--logging_steps="500" \
|
22 |
+
--save_steps="5000" \
|
23 |
--eval_steps="20000" \
|
24 |
--dtype="bfloat16" \
|
25 |
--push_to_hub
|