Update README.md
Browse files
README.md
CHANGED
@@ -59,12 +59,12 @@ trainer = SFTTrainer(
|
|
59 |
max_steps=10000,
|
60 |
learning_rate=1e-4,
|
61 |
logging_steps=1,
|
62 |
-
output_dir="
|
63 |
optim="paged_adamw_32bit",report_to="none"
|
64 |
)
|
65 |
)
|
66 |
trainer.train()
|
67 |
-
trainer.model.save_pretrained("
|
68 |
-
trainer.tokenizer.save_pretrained("
|
69 |
|
70 |
```
|
|
|
59 |
max_steps=10000,
|
60 |
learning_rate=1e-4,
|
61 |
logging_steps=1,
|
62 |
+
output_dir="1B_outputs", overwrite_output_dir=True,save_steps=1000,
|
63 |
optim="paged_adamw_32bit",report_to="none"
|
64 |
)
|
65 |
)
|
66 |
trainer.train()
|
67 |
+
trainer.model.save_pretrained("1B-final", dtype=torch.float32)
|
68 |
+
trainer.tokenizer.save_pretrained("1B-final")
|
69 |
|
70 |
```
|