Update README.md
Browse files
README.md
CHANGED
@@ -11,7 +11,7 @@ Training configuration
|
|
11 |
gradient_checkpointing: true
|
12 |
learning_rate: 1e-5
|
13 |
max_grad_norm: 5.0
|
14 |
-
num_epochs:
|
15 |
optimizer: adamw_torch
|
16 |
lr_scheduler: cosine
|
17 |
batch_size: 128
|
|
|
11 |
gradient_checkpointing: true
|
12 |
learning_rate: 1e-5
|
13 |
max_grad_norm: 5.0
|
14 |
+
num_epochs: 6 # 4110 steps in total
|
15 |
optimizer: adamw_torch
|
16 |
lr_scheduler: cosine
|
17 |
batch_size: 128
|