Upload folder using huggingface_hub
Browse files- checkpoints/torso[0].res_final_0.pt +3 -0
- checkpoints/torso[0].res_final_1024.pt +3 -0
- checkpoints/torso[0].res_final_1536.pt +3 -0
- checkpoints/torso[0].res_final_2048.pt +3 -0
- checkpoints/torso[0].res_final_512.pt +3 -0
- checkpoints/torso[1].attn_0.pt +3 -0
- checkpoints/torso[1].attn_1024.pt +3 -0
- checkpoints/torso[1].attn_1536.pt +3 -0
- checkpoints/torso[1].attn_2048.pt +3 -0
- checkpoints/torso[1].attn_512.pt +3 -0
- checkpoints/torso[1].res_final_0.pt +3 -0
- checkpoints/torso[1].res_final_1024.pt +3 -0
- checkpoints/torso[1].res_final_1536.pt +3 -0
- checkpoints/torso[1].res_final_2048.pt +3 -0
- checkpoints/torso[1].res_final_512.pt +3 -0
- checkpoints/torso[1].res_mlp_0.pt +3 -0
- checkpoints/torso[1].res_mlp_1024.pt +3 -0
- checkpoints/torso[1].res_mlp_1536.pt +3 -0
- checkpoints/torso[1].res_mlp_2048.pt +3 -0
- checkpoints/torso[1].res_mlp_512.pt +3 -0
- trainer_0/config.json +26 -0
- trainer_0/torso[0].res_final.pt +3 -0
- trainer_0/torso[1].attn.pt +3 -0
- trainer_0/torso[1].res_final.pt +3 -0
- trainer_0/torso[1].res_mlp.pt +3 -0
checkpoints/torso[0].res_final_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:97c6e916cbcd13b1865aa13704d9d6b6bc63ea69b284fd56b0b1eb2c23936be2
|
3 |
+
size 37778616
|
checkpoints/torso[0].res_final_1024.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c377f21c50477e617dc255c1e5c3853d2229fb77c3ef4647a1e693d8ce3742b
|
3 |
+
size 37778704
|
checkpoints/torso[0].res_final_1536.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f82f4c5ccdd541a450db83b316c39cca25a7cb8de48e410bece2ea19e84177ad
|
3 |
+
size 37778704
|
checkpoints/torso[0].res_final_2048.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:195afc37ffaed9878344d791d19ca8c7b3cd9172a076609370cb86df8dae54a9
|
3 |
+
size 37778704
|
checkpoints/torso[0].res_final_512.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b88fd0e3e3a7082d963f3fab28a9cdef5975642fc9152627f835f468ce75b568
|
3 |
+
size 37778696
|
checkpoints/torso[1].attn_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f917464c3ce5df53bb10f1ccd084edd49f0ed66ebacea0d15a776cf90815e83c
|
3 |
+
size 37778576
|
checkpoints/torso[1].attn_1024.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9634c61c9826731fa04f081fe361461e1b9e01ca704d388623666a48b4ac4e03
|
3 |
+
size 37778600
|
checkpoints/torso[1].attn_1536.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea118422179444c6d037f1e326ee3d8d56ff3be7601e9d8b06971f7a33d2cbcf
|
3 |
+
size 37778600
|
checkpoints/torso[1].attn_2048.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f1736175ae94a663d536ffeb86ec01000f1beaeec01d29f5c466640fe51da1f1
|
3 |
+
size 37778600
|
checkpoints/torso[1].attn_512.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2d6f157204c0ad7843f32e84a88f0bf610d6d6a0b264a8d012ba73962d2964dc
|
3 |
+
size 37778592
|
checkpoints/torso[1].res_final_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b5e834572edda79e57e9136fca9e4569c34517d91dd21ffc17a3158157fa98e
|
3 |
+
size 37778616
|
checkpoints/torso[1].res_final_1024.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:930a8a6e78b627db435688867bc72c6df57d654274d82c2fc9c720b60c97fe2d
|
3 |
+
size 37778704
|
checkpoints/torso[1].res_final_1536.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:448822d131314d5c91b6439aae8b35452380dda0c87dfc76829fd0d86d513f87
|
3 |
+
size 37778704
|
checkpoints/torso[1].res_final_2048.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e0c81f73d93066657784f2f1fd94bb8bf2c6ca11a60ab1ae26515865d961a1c
|
3 |
+
size 37778704
|
checkpoints/torso[1].res_final_512.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:003cc87c376c48556d55d09f2062da823c4272ea75d475d2216e1a87690149c4
|
3 |
+
size 37778696
|
checkpoints/torso[1].res_mlp_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4cb903e0f743da72bee32af184e6a99805d72ef53124c0944ea5114a91a9c67a
|
3 |
+
size 37778600
|
checkpoints/torso[1].res_mlp_1024.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ed280a81fd4f3e8063bdfdeee9c4ac0cb9402fee6e4e606f5c6860732679503
|
3 |
+
size 37778624
|
checkpoints/torso[1].res_mlp_1536.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:094b07a661efd424cebd7b7d127f8d928729645d078a7926eec9df276c80c314
|
3 |
+
size 37778624
|
checkpoints/torso[1].res_mlp_2048.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca23db2ec9606744565710eb84d8176d891037fd3c1a52cc7b35e3a55a6ffc5e
|
3 |
+
size 37778624
|
checkpoints/torso[1].res_mlp_512.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6acf7df233fcfde04e830a99a11bb2fe4225e9af2b61dee5c2eb26259105d142
|
3 |
+
size 37778616
|
trainer_0/config.json
ADDED
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"trainer": {
|
3 |
+
"trainer_class": "TrainerTopK",
|
4 |
+
"dict_class": "AutoEncoderTopK",
|
5 |
+
"lr": 0.00032659863237109043,
|
6 |
+
"steps": 30000,
|
7 |
+
"seed": null,
|
8 |
+
"activation_dim": 768,
|
9 |
+
"dict_size": 6144,
|
10 |
+
"k": 30,
|
11 |
+
"device": "cuda",
|
12 |
+
"layer": 1,
|
13 |
+
"lm_name": "TinyModel_2L_3E",
|
14 |
+
"wandb_name": "AutoEncoderTopK",
|
15 |
+
"submodule_name": null
|
16 |
+
},
|
17 |
+
"buffer": {
|
18 |
+
"d_submodule": 768,
|
19 |
+
"io": "out",
|
20 |
+
"n_ctxs": 128,
|
21 |
+
"ctx_len": 256,
|
22 |
+
"refresh_batch_size": 512,
|
23 |
+
"out_batch_size": 1024,
|
24 |
+
"device": "cuda"
|
25 |
+
}
|
26 |
+
}
|
trainer_0/torso[0].res_final.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2680d27df283338845c7b35fef6eacf8707ae5a9163e27fb4ca17836f3ec7f18
|
3 |
+
size 37778600
|
trainer_0/torso[1].attn.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:025320bd4cd801b6091a51e80f89ad1763162a9937c878444cae93716543697d
|
3 |
+
size 37778560
|
trainer_0/torso[1].res_final.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0db6562dc37257290d67f9016af9cdb3999bca08809f0287df44a8dbf0f236ae
|
3 |
+
size 37778600
|
trainer_0/torso[1].res_mlp.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4502d4493c69f43720e0b780bfdc0b99c42e551df1a9920ff7c3e0fdcc7d30f6
|
3 |
+
size 37778584
|