model
Browse files
- scripts/model.yaml +1 -1
scripts/model.yaml
CHANGED
@@ -54,7 +54,7 @@ train:
|
|
54 |
global_batch_size: 512
|
55 |
|
56 |
# Number of samples per data-parallel rank (type: int, default: 4)
|
57 |
-
micro_batch_size: 4
|
58 |
|
59 |
# Number of iterations with learning rate warmup active (type: int, default: 2000)
|
60 |
lr_warmup_steps: 2000
|
|
|
54 |
global_batch_size: 512
|
55 |
|
56 |
# Number of samples per data-parallel rank (type: int, default: 4)
|
57 |
+
micro_batch_size: 16 # 4
|
58 |
|
59 |
# Number of iterations with learning rate warmup active (type: int, default: 2000)
|
60 |
lr_warmup_steps: 2000
|