Model save
Browse files- README.md +1 -1
- all_results.json +4 -4
- model-00001-of-00004.safetensors +1 -1
- model-00002-of-00004.safetensors +1 -1
- model-00003-of-00004.safetensors +1 -1
- model-00004-of-00004.safetensors +1 -1
- runs/Feb26_10-47-03_na-clops-debugging-pipeline-s6tg6-049f-0/events.out.tfevents.1740566847.na-clops-debugging-pipeline-s6tg6-049f-0 +2 -2
- train_results.json +4 -4
README.md
CHANGED
@@ -27,7 +27,7 @@ print(output["generated_text"])
|
|
27 |
|
28 |
## Training procedure
|
29 |
|
30 |
-
[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/nlee28/reasoning/runs/
|
31 |
|
32 |
|
33 |
This model was trained with SFT.
|
|
|
27 |
|
28 |
## Training procedure
|
29 |
|
30 |
+
[<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/nlee28/reasoning/runs/o20hygkn)
|
31 |
|
32 |
|
33 |
This model was trained with SFT.
|
all_results.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"total_flos": 1.182462262019883e+18,
|
3 |
-
"train_loss":
|
4 |
-
"train_runtime":
|
5 |
"train_samples": 817,
|
6 |
-
"train_samples_per_second": 0.
|
7 |
-
"train_steps_per_second": 0.
|
8 |
}
|
|
|
1 |
{
|
2 |
"total_flos": 1.182462262019883e+18,
|
3 |
+
"train_loss": 2.9186187465985616,
|
4 |
+
"train_runtime": 4944.9437,
|
5 |
"train_samples": 817,
|
6 |
+
"train_samples_per_second": 0.826,
|
7 |
+
"train_steps_per_second": 0.012
|
8 |
}
|
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:58e01e7d2d951dff37e70aec71be657f8d06b83010b75f9dbba847be08cff729
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d37f1215e894b8fb82e502cfcf908a9d22322d4181f3e259c59dd960932fdf1
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:98d6eba46181c7247e99a0d7449c8cb072fa5b84be4e5b9f5328cbb0e5c8548d
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f3c2acf9182f6e318d518a995a4aa6355f1700834e5a007b23a5012e22a7a7f8
|
3 |
size 1089994880
|
runs/Feb26_10-47-03_na-clops-debugging-pipeline-s6tg6-049f-0/events.out.tfevents.1740566847.na-clops-debugging-pipeline-s6tg6-049f-0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:32ba7ca663df882362ee9b8ed1d8b05983b8dc58a306e68c1b0673d48cb22713
|
3 |
+
size 14003
|
train_results.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"total_flos": 1.182462262019883e+18,
|
3 |
-
"train_loss":
|
4 |
-
"train_runtime":
|
5 |
"train_samples": 817,
|
6 |
-
"train_samples_per_second": 0.
|
7 |
-
"train_steps_per_second": 0.
|
8 |
}
|
|
|
1 |
{
|
2 |
"total_flos": 1.182462262019883e+18,
|
3 |
+
"train_loss": 2.9186187465985616,
|
4 |
+
"train_runtime": 4944.9437,
|
5 |
"train_samples": 817,
|
6 |
+
"train_samples_per_second": 0.826,
|
7 |
+
"train_steps_per_second": 0.012
|
8 |
}
|