Update README.md
Browse files
README.md
CHANGED
@@ -9,6 +9,11 @@ base_model: jingyeom/freeze_KoSoLAR-10.7B-v0.2_1.4_dedup
|
|
9 |
model-index:
|
10 |
- name: lora_freeze_KoSoLAR-10.7B-v0.2_1.4_dedup_SFT-DPO
|
11 |
results: []
|
|
|
|
|
|
|
|
|
|
|
12 |
---
|
13 |
|
14 |
<!-- This model card has been generated automatically according to the information the Trainer had access to. You
|
|
|
9 |
model-index:
|
10 |
- name: lora_freeze_KoSoLAR-10.7B-v0.2_1.4_dedup_SFT-DPO
|
11 |
results: []
|
12 |
+
datasets:
|
13 |
+
- jondurbin/truthy-dpo-v0.1
|
14 |
+
- Intel/orca_dpo_pairs
|
15 |
+
- HuggingFaceH4/ultrafeedback_binarized
|
16 |
+
- argilla/distilabel-math-preference-dpo
|
17 |
---
|
18 |
|
19 |
<!-- This model card has been generated automatically according to the information the Trainer had access to. You
|