Commit
·
4e3188d
1
Parent(s):
db461e9
Upload folder using huggingface_hub
Browse files- README.md +1 -14
- checkpoint-250/optimizer.pt +1 -1
- checkpoint-250/rng_state_0.pth +1 -1
- checkpoint-250/rng_state_1.pth +1 -1
- checkpoint-250/rng_state_2.pth +1 -1
- checkpoint-250/rng_state_3.pth +1 -1
- checkpoint-250/rng_state_4.pth +1 -1
- checkpoint-250/rng_state_5.pth +1 -1
- checkpoint-250/rng_state_6.pth +1 -1
- checkpoint-250/rng_state_7.pth +1 -1
- checkpoint-250/scaler.pt +1 -1
- checkpoint-250/scheduler.pt +1 -1
- checkpoint-250/trainer_state.json +22 -22
- checkpoint-250/training_args.bin +1 -1
- pytorch_model.bin +1 -1
- training_args.bin +1 -1
README.md
CHANGED
@@ -1,16 +1,3 @@
|
|
1 |
---
|
2 |
-
|
3 |
-
- yahma/alpaca-cleaned
|
4 |
-
language:
|
5 |
-
- en
|
6 |
-
license: apache-2.0
|
7 |
-
tags:
|
8 |
-
- pytorch
|
9 |
-
- causal-lm
|
10 |
-
- llama2
|
11 |
-
- fine-tuning
|
12 |
-
- alpaca
|
13 |
-
|
14 |
---
|
15 |
-
|
16 |
-
# Llama-2-7B fine-tuned on LoRA alpaca-cleaned
|
|
|
1 |
---
|
2 |
+
library_name: peft
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
3 |
---
|
|
|
|
checkpoint-250/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 12833221
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ded573f92c39e528107cac185cefc599bebc3bfbb1d852e9aad4a51a7bdb7db7
|
3 |
size 12833221
|
checkpoint-250/rng_state_0.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 21687
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ff556034ef66a33dd1f91f7f1ef90f610ea8987dff216a09ed637103885dfa5
|
3 |
size 21687
|
checkpoint-250/rng_state_1.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 21687
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:de1a2d4f34d9aeef36aed2599ac40c0387f8da8f835084f463ddb571558f0325
|
3 |
size 21687
|
checkpoint-250/rng_state_2.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 21687
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5d6c619900787e84a5702e58ef0bffd64f674f634df49641cda2328ce1fe5706
|
3 |
size 21687
|
checkpoint-250/rng_state_3.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 21687
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2f4674ef7c7d8ec461683b46f5971c8f885f64c1b3fc9a70c7e5436d3560dd31
|
3 |
size 21687
|
checkpoint-250/rng_state_4.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 21687
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7b1ab8e049e32f0534c4a919d53a677c5398b3cbfb027803551a6e1d4b5f7742
|
3 |
size 21687
|
checkpoint-250/rng_state_5.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 21687
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:98b7ecaf90b364d9591ed06b1e8bc5b1645d39186f79de3a85d7cf2f0e2a1c4c
|
3 |
size 21687
|
checkpoint-250/rng_state_6.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 21687
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:650f9ba046ba1a5afa025b52ce144ab73433f97ea82b55c1630d28c3ba12d021
|
3 |
size 21687
|
checkpoint-250/rng_state_7.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 21687
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf1c9914411568e259b1d4038ac031fab5bd50d477b3c73ab8d56d74886d922f
|
3 |
size 21687
|
checkpoint-250/scaler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 557
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:83631d6b9b43704f4441079f38c387b400af9960c249438a99f32f1f1df322fc
|
3 |
size 557
|
checkpoint-250/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 627
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6b34b17be1093848601ee7f49e83fbfc9190b9769b8cbabfb75dfed691603a84
|
3 |
size 627
|
checkpoint-250/trainer_state.json
CHANGED
@@ -10,79 +10,79 @@
|
|
10 |
{
|
11 |
"epoch": 0.01,
|
12 |
"learning_rate": 9.949107209404665e-05,
|
13 |
-
"loss": 1.
|
14 |
"step": 20
|
15 |
},
|
16 |
{
|
17 |
"epoch": 0.01,
|
18 |
"learning_rate": 9.62558321769342e-05,
|
19 |
-
"loss":
|
20 |
"step": 40
|
21 |
},
|
22 |
{
|
23 |
"epoch": 0.02,
|
24 |
"learning_rate": 8.98317278228618e-05,
|
25 |
-
"loss": 0.
|
26 |
"step": 60
|
27 |
},
|
28 |
{
|
29 |
"epoch": 0.02,
|
30 |
-
"learning_rate": 8.
|
31 |
-
"loss": 0.
|
32 |
"step": 80
|
33 |
},
|
34 |
{
|
35 |
"epoch": 0.03,
|
36 |
-
"learning_rate": 7.
|
37 |
-
"loss": 0.
|
38 |
"step": 100
|
39 |
},
|
40 |
{
|
41 |
"epoch": 0.04,
|
42 |
-
"learning_rate": 5.
|
43 |
-
"loss": 0.
|
44 |
"step": 120
|
45 |
},
|
46 |
{
|
47 |
"epoch": 0.04,
|
48 |
-
"learning_rate": 4.
|
49 |
-
"loss": 0.
|
50 |
"step": 140
|
51 |
},
|
52 |
{
|
53 |
"epoch": 0.05,
|
54 |
-
"learning_rate": 3.
|
55 |
-
"loss": 0.
|
56 |
"step": 160
|
57 |
},
|
58 |
{
|
59 |
"epoch": 0.06,
|
60 |
-
"learning_rate": 2.
|
61 |
-
"loss": 0.
|
62 |
"step": 180
|
63 |
},
|
64 |
{
|
65 |
"epoch": 0.06,
|
66 |
-
"learning_rate": 1.
|
67 |
-
"loss": 0.
|
68 |
"step": 200
|
69 |
},
|
70 |
{
|
71 |
"epoch": 0.07,
|
72 |
-
"learning_rate":
|
73 |
-
"loss": 0.
|
74 |
"step": 220
|
75 |
},
|
76 |
{
|
77 |
"epoch": 0.07,
|
78 |
-
"learning_rate":
|
79 |
-
"loss": 0.
|
80 |
"step": 240
|
81 |
}
|
82 |
],
|
83 |
"max_steps": 250,
|
84 |
"num_train_epochs": 1,
|
85 |
-
"total_flos": 3.
|
86 |
"trial_name": null,
|
87 |
"trial_params": null
|
88 |
}
|
|
|
10 |
{
|
11 |
"epoch": 0.01,
|
12 |
"learning_rate": 9.949107209404665e-05,
|
13 |
+
"loss": 1.6279,
|
14 |
"step": 20
|
15 |
},
|
16 |
{
|
17 |
"epoch": 0.01,
|
18 |
"learning_rate": 9.62558321769342e-05,
|
19 |
+
"loss": 0.9748,
|
20 |
"step": 40
|
21 |
},
|
22 |
{
|
23 |
"epoch": 0.02,
|
24 |
"learning_rate": 8.98317278228618e-05,
|
25 |
+
"loss": 0.8434,
|
26 |
"step": 60
|
27 |
},
|
28 |
{
|
29 |
"epoch": 0.02,
|
30 |
+
"learning_rate": 8.274303669726426e-05,
|
31 |
+
"loss": 0.8162,
|
32 |
"step": 80
|
33 |
},
|
34 |
{
|
35 |
"epoch": 0.03,
|
36 |
+
"learning_rate": 7.19444824755478e-05,
|
37 |
+
"loss": 0.7719,
|
38 |
"step": 100
|
39 |
},
|
40 |
{
|
41 |
"epoch": 0.04,
|
42 |
+
"learning_rate": 5.967492612770999e-05,
|
43 |
+
"loss": 0.7687,
|
44 |
"step": 120
|
45 |
},
|
46 |
{
|
47 |
"epoch": 0.04,
|
48 |
+
"learning_rate": 4.675683150061285e-05,
|
49 |
+
"loss": 0.7753,
|
50 |
"step": 140
|
51 |
},
|
52 |
{
|
53 |
"epoch": 0.05,
|
54 |
+
"learning_rate": 3.4056135837619074e-05,
|
55 |
+
"loss": 0.7509,
|
56 |
"step": 160
|
57 |
},
|
58 |
{
|
59 |
"epoch": 0.06,
|
60 |
+
"learning_rate": 2.2424203500786474e-05,
|
61 |
+
"loss": 0.75,
|
62 |
"step": 180
|
63 |
},
|
64 |
{
|
65 |
"epoch": 0.06,
|
66 |
+
"learning_rate": 1.2640756555442684e-05,
|
67 |
+
"loss": 0.7337,
|
68 |
"step": 200
|
69 |
},
|
70 |
{
|
71 |
"epoch": 0.07,
|
72 |
+
"learning_rate": 5.361607745106817e-06,
|
73 |
+
"loss": 0.7484,
|
74 |
"step": 220
|
75 |
},
|
76 |
{
|
77 |
"epoch": 0.07,
|
78 |
+
"learning_rate": 1.0746994666109234e-06,
|
79 |
+
"loss": 0.7386,
|
80 |
"step": 240
|
81 |
}
|
82 |
],
|
83 |
"max_steps": 250,
|
84 |
"num_train_epochs": 1,
|
85 |
+
"total_flos": 3.752851705482445e+16,
|
86 |
"trial_name": null,
|
87 |
"trial_params": null
|
88 |
}
|
checkpoint-250/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3963
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3e39446b5d41d7b95abf21f50c4d1c0231f70f7bb45b7195adab288b3f3adcfd
|
3 |
size 3963
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 25234701
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5192bf8275b5aed54b0b89798b6cb8c0e43c871c4be9ecee36bac033782f1c47
|
3 |
size 25234701
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3963
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3e39446b5d41d7b95abf21f50c4d1c0231f70f7bb45b7195adab288b3f3adcfd
|
3 |
size 3963
|