jbrinkma commited on
Commit
24b7ae2
·
verified ·
1 Parent(s): 72f24fe

Upload folder using huggingface_hub

Browse files
checkpoints/torso[0].res_final_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97c6e916cbcd13b1865aa13704d9d6b6bc63ea69b284fd56b0b1eb2c23936be2
3
+ size 37778616
checkpoints/torso[0].res_final_1024.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c377f21c50477e617dc255c1e5c3853d2229fb77c3ef4647a1e693d8ce3742b
3
+ size 37778704
checkpoints/torso[0].res_final_1536.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f82f4c5ccdd541a450db83b316c39cca25a7cb8de48e410bece2ea19e84177ad
3
+ size 37778704
checkpoints/torso[0].res_final_2048.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:195afc37ffaed9878344d791d19ca8c7b3cd9172a076609370cb86df8dae54a9
3
+ size 37778704
checkpoints/torso[0].res_final_512.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b88fd0e3e3a7082d963f3fab28a9cdef5975642fc9152627f835f468ce75b568
3
+ size 37778696
checkpoints/torso[1].attn_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f917464c3ce5df53bb10f1ccd084edd49f0ed66ebacea0d15a776cf90815e83c
3
+ size 37778576
checkpoints/torso[1].attn_1024.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9634c61c9826731fa04f081fe361461e1b9e01ca704d388623666a48b4ac4e03
3
+ size 37778600
checkpoints/torso[1].attn_1536.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea118422179444c6d037f1e326ee3d8d56ff3be7601e9d8b06971f7a33d2cbcf
3
+ size 37778600
checkpoints/torso[1].attn_2048.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1736175ae94a663d536ffeb86ec01000f1beaeec01d29f5c466640fe51da1f1
3
+ size 37778600
checkpoints/torso[1].attn_512.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d6f157204c0ad7843f32e84a88f0bf610d6d6a0b264a8d012ba73962d2964dc
3
+ size 37778592
checkpoints/torso[1].res_final_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b5e834572edda79e57e9136fca9e4569c34517d91dd21ffc17a3158157fa98e
3
+ size 37778616
checkpoints/torso[1].res_final_1024.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:930a8a6e78b627db435688867bc72c6df57d654274d82c2fc9c720b60c97fe2d
3
+ size 37778704
checkpoints/torso[1].res_final_1536.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:448822d131314d5c91b6439aae8b35452380dda0c87dfc76829fd0d86d513f87
3
+ size 37778704
checkpoints/torso[1].res_final_2048.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e0c81f73d93066657784f2f1fd94bb8bf2c6ca11a60ab1ae26515865d961a1c
3
+ size 37778704
checkpoints/torso[1].res_final_512.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:003cc87c376c48556d55d09f2062da823c4272ea75d475d2216e1a87690149c4
3
+ size 37778696
checkpoints/torso[1].res_mlp_0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4cb903e0f743da72bee32af184e6a99805d72ef53124c0944ea5114a91a9c67a
3
+ size 37778600
checkpoints/torso[1].res_mlp_1024.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ed280a81fd4f3e8063bdfdeee9c4ac0cb9402fee6e4e606f5c6860732679503
3
+ size 37778624
checkpoints/torso[1].res_mlp_1536.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:094b07a661efd424cebd7b7d127f8d928729645d078a7926eec9df276c80c314
3
+ size 37778624
checkpoints/torso[1].res_mlp_2048.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca23db2ec9606744565710eb84d8176d891037fd3c1a52cc7b35e3a55a6ffc5e
3
+ size 37778624
checkpoints/torso[1].res_mlp_512.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6acf7df233fcfde04e830a99a11bb2fe4225e9af2b61dee5c2eb26259105d142
3
+ size 37778616
trainer_0/config.json ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "trainer": {
3
+ "trainer_class": "TrainerTopK",
4
+ "dict_class": "AutoEncoderTopK",
5
+ "lr": 0.00032659863237109043,
6
+ "steps": 30000,
7
+ "seed": null,
8
+ "activation_dim": 768,
9
+ "dict_size": 6144,
10
+ "k": 30,
11
+ "device": "cuda",
12
+ "layer": 1,
13
+ "lm_name": "TinyModel_2L_3E",
14
+ "wandb_name": "AutoEncoderTopK",
15
+ "submodule_name": null
16
+ },
17
+ "buffer": {
18
+ "d_submodule": 768,
19
+ "io": "out",
20
+ "n_ctxs": 128,
21
+ "ctx_len": 256,
22
+ "refresh_batch_size": 512,
23
+ "out_batch_size": 1024,
24
+ "device": "cuda"
25
+ }
26
+ }
trainer_0/torso[0].res_final.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2680d27df283338845c7b35fef6eacf8707ae5a9163e27fb4ca17836f3ec7f18
3
+ size 37778600
trainer_0/torso[1].attn.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:025320bd4cd801b6091a51e80f89ad1763162a9937c878444cae93716543697d
3
+ size 37778560
trainer_0/torso[1].res_final.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0db6562dc37257290d67f9016af9cdb3999bca08809f0287df44a8dbf0f236ae
3
+ size 37778600
trainer_0/torso[1].res_mlp.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4502d4493c69f43720e0b780bfdc0b99c42e551df1a9920ff7c3e0fdcc7d30f6
3
+ size 37778584