model
Browse files
- scripts/model.yaml +2 -2
scripts/model.yaml
CHANGED
@@ -62,11 +62,11 @@ train:
|
|
62 |
lr_warmup_steps: 2000
|
63 |
|
64 |
# Number of epochs to train on (type: Optional[int], default: null)
|
65 |
-
epochs:
|
66 |
|
67 |
# Total number of tokens to train on (type: Optional[int], default: 3000000000000)
|
68 |
# max_tokens: 3000000000000
|
69 |
-
max_tokens:
|
70 |
|
71 |
# Limits the number of optimizer steps to run. (type: Optional[int], default: null)
|
72 |
max_steps:
|
|
|
62 |
lr_warmup_steps: 2000
|
63 |
|
64 |
# Number of epochs to train on (type: Optional[int], default: null)
|
65 |
+
epochs:
|
66 |
|
67 |
# Total number of tokens to train on (type: Optional[int], default: 3000000000000)
|
68 |
# max_tokens: 3000000000000
|
69 |
+
max_tokens: 9782206713 # 1591379 * 2049 * 3
|
70 |
|
71 |
# Limits the number of optimizer steps to run. (type: Optional[int], default: null)
|
72 |
max_steps:
|