Update README.md
Browse files
README.md
CHANGED
@@ -44,6 +44,7 @@ REILX/neo_sft_phase2_conversations</br>
|
|
44 |
- learning_rate: 5e-06
|
45 |
- train_batch_size: 1
|
46 |
- eval_batch_size: 8
|
|
|
47 |
- seed: 42
|
48 |
- distributed_type: multi-GPU
|
49 |
- num_devices: 8
|
@@ -59,6 +60,7 @@ REILX/neo_sft_phase2_multi</br>
|
|
59 |
- learning_rate: 5e-05
|
60 |
- train_batch_size: 1
|
61 |
- eval_batch_size: 8
|
|
|
62 |
- seed: 42
|
63 |
- distributed_type: multi-GPU
|
64 |
- num_devices: 8
|
@@ -74,6 +76,7 @@ REILX/neo_sft_phase2_single</br>
|
|
74 |
- learning_rate: 5e-05
|
75 |
- train_batch_size: 1
|
76 |
- eval_batch_size: 8
|
|
|
77 |
- seed: 42
|
78 |
- distributed_type: multi-GPU
|
79 |
- num_devices: 8
|
|
|
44 |
- learning_rate: 5e-06
|
45 |
- train_batch_size: 1
|
46 |
- eval_batch_size: 8
|
47 |
+
- cutoff_len: 8192
|
48 |
- seed: 42
|
49 |
- distributed_type: multi-GPU
|
50 |
- num_devices: 8
|
|
|
60 |
- learning_rate: 5e-05
|
61 |
- train_batch_size: 1
|
62 |
- eval_batch_size: 8
|
63 |
+
- cutoff_len: 8192
|
64 |
- seed: 42
|
65 |
- distributed_type: multi-GPU
|
66 |
- num_devices: 8
|
|
|
76 |
- learning_rate: 5e-05
|
77 |
- train_batch_size: 1
|
78 |
- eval_batch_size: 8
|
79 |
+
- cutoff_len: 4096
|
80 |
- seed: 42
|
81 |
- distributed_type: multi-GPU
|
82 |
- num_devices: 8
|