Upload folder using huggingface_hub
Browse files- checkpoints/embed_0.pt +3 -0
- checkpoints/embed_1024.pt +3 -0
- checkpoints/embed_1536.pt +3 -0
- checkpoints/embed_2048.pt +3 -0
- checkpoints/embed_512.pt +3 -0
- checkpoints/torso[0].attn_0.pt +3 -0
- checkpoints/torso[0].attn_1024.pt +3 -0
- checkpoints/torso[0].attn_1536.pt +3 -0
- checkpoints/torso[0].attn_2048.pt +3 -0
- checkpoints/torso[0].attn_512.pt +3 -0
- checkpoints/torso[0].res_final_0.pt +3 -0
- checkpoints/torso[0].res_final_1024.pt +3 -0
- checkpoints/torso[0].res_final_1536.pt +3 -0
- checkpoints/torso[0].res_final_2048.pt +3 -0
- checkpoints/torso[0].res_final_512.pt +3 -0
- checkpoints/torso[0].res_mlp_0.pt +3 -0
- checkpoints/torso[0].res_mlp_1024.pt +3 -0
- checkpoints/torso[0].res_mlp_1536.pt +3 -0
- checkpoints/torso[0].res_mlp_2048.pt +3 -0
- checkpoints/torso[0].res_mlp_512.pt +3 -0
- trainer_0/config.json +26 -0
- trainer_0/embed.pt +3 -0
- trainer_0/torso[0].attn.pt +3 -0
- trainer_0/torso[0].res_final.pt +3 -0
- trainer_0/torso[0].res_mlp.pt +3 -0
checkpoints/embed_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:78dbb0e1385cb5a48e0a8fec6416a7de71b9513d183816a2aa0d8a171b2ac6c1
|
3 |
+
size 37778320
|
checkpoints/embed_1024.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f908b17944f9c6ee5b9ce6f0cb03469e1fc0c4992652aad5d6b23172316c9c9e
|
3 |
+
size 37778536
|
checkpoints/embed_1536.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:76bb4f964163cb015911632b3b2e80b934810c37dd2e65c50de31f4f221ac4af
|
3 |
+
size 37778536
|
checkpoints/embed_2048.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c80369a5e46c48f7ded519a5adb171775da998fdb0ca97970442b6b2150276e9
|
3 |
+
size 37778536
|
checkpoints/embed_512.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:accba7b57285c47b4b884c70e6018bd694374f0bfa6a1f6d3ee7d4b0fc1c8c2e
|
3 |
+
size 37778528
|
checkpoints/torso[0].attn_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ffc354c3a5802b66bbccd7d7df0772ed0743cbd1cae5c9d84b80f3e2bdfbdc6f
|
3 |
+
size 37778576
|
checkpoints/torso[0].attn_1024.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:90041301954e56cebd7a4fa3c6f5ca265c92ac81f96ab7187a5828cd7d64088f
|
3 |
+
size 37778600
|
checkpoints/torso[0].attn_1536.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f867e44b4fd8a6fc4c40ac1038f0dc164a6f49828da57694028095068bc93d34
|
3 |
+
size 37778600
|
checkpoints/torso[0].attn_2048.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:44c775c09a643eb221551b643af75480d016b5c7efe178a17a56fdc3ac2a6be6
|
3 |
+
size 37778600
|
checkpoints/torso[0].attn_512.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0de9bc1d577516a1343a9bf886cf3f1cc341a503bdb1a4e3d89313b81ed93440
|
3 |
+
size 37778592
|
checkpoints/torso[0].res_final_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:97c6e916cbcd13b1865aa13704d9d6b6bc63ea69b284fd56b0b1eb2c23936be2
|
3 |
+
size 37778616
|
checkpoints/torso[0].res_final_1024.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c4faa5414f978254e5fc035209cabed3c20cbee940d6608389fe00293af16bf7
|
3 |
+
size 37778704
|
checkpoints/torso[0].res_final_1536.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f4bccb2ba5df23341091b57a3fa86fa8507902ac8242e43a02901fa866a74bb7
|
3 |
+
size 37778704
|
checkpoints/torso[0].res_final_2048.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a774defc7bd4844ce2f18cb62e555257160d58dc62ea316373798cad1bb4030d
|
3 |
+
size 37778704
|
checkpoints/torso[0].res_final_512.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a3fa5c2ae2c3855835b8c2fe15bfdba70937e22ee79d38296082aeccd60ba3bb
|
3 |
+
size 37778696
|
checkpoints/torso[0].res_mlp_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f739e58039152b9ae31520b5c9ed20ab8dcf14095c3150eed62a9fe58d0f5217
|
3 |
+
size 37778600
|
checkpoints/torso[0].res_mlp_1024.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab7cc432d63049235d9ef8c82daac06688cd99227dbcdae08709333a6bd85a91
|
3 |
+
size 37778624
|
checkpoints/torso[0].res_mlp_1536.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d5996499555f8b551875bd1bea8907d3f0d08d08361f238e589987ee794f5425
|
3 |
+
size 37778624
|
checkpoints/torso[0].res_mlp_2048.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e86a64f736337856cbb0ecc67053f8ef0058dd3f3a32f42acaaff99e08791545
|
3 |
+
size 37778624
|
checkpoints/torso[0].res_mlp_512.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:41df90396100ec698afa4280e833a5ee63169e293965b66270ade076cb2ae86f
|
3 |
+
size 37778616
|
trainer_0/config.json
ADDED
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"trainer": {
|
3 |
+
"trainer_class": "TrainerTopK",
|
4 |
+
"dict_class": "AutoEncoderTopK",
|
5 |
+
"lr": 0.00032659863237109043,
|
6 |
+
"steps": 30000,
|
7 |
+
"seed": null,
|
8 |
+
"activation_dim": 768,
|
9 |
+
"dict_size": 6144,
|
10 |
+
"k": 30,
|
11 |
+
"device": "cuda",
|
12 |
+
"layer": 0,
|
13 |
+
"lm_name": "TinyModel_2L_3E",
|
14 |
+
"wandb_name": "AutoEncoderTopK",
|
15 |
+
"submodule_name": null
|
16 |
+
},
|
17 |
+
"buffer": {
|
18 |
+
"d_submodule": 768,
|
19 |
+
"io": "out",
|
20 |
+
"n_ctxs": 128,
|
21 |
+
"ctx_len": 256,
|
22 |
+
"refresh_batch_size": 512,
|
23 |
+
"out_batch_size": 1024,
|
24 |
+
"device": "cuda"
|
25 |
+
}
|
26 |
+
}
|
trainer_0/embed.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a72603d231e312afe4ce41bba1e9dc004b7c2510bc00db1e70427259d5c43be1
|
3 |
+
size 37778240
|
trainer_0/torso[0].attn.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e63f4b4762e5b043742b4628c57d0b3dfaf51a3df6e7e7b86ca5eb4fdd87aa56
|
3 |
+
size 37778560
|
trainer_0/torso[0].res_final.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d1e9a1341334c6fac87c24fea8b50ac8e466dfd5f74077b1a538691ec42a1782
|
3 |
+
size 37778600
|
trainer_0/torso[0].res_mlp.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a702156273de46b053d76c97bd366f25c60650c9fb539028d224560bdacfdab1
|
3 |
+
size 37778584
|