Upload folder using huggingface_hub
Browse files- config.json +1 -0
- lr_scheduler.pt +3 -0
- model.layers.10/cfg.json +1 -0
- model.layers.10/sae.safetensors +3 -0
- model.layers.14/cfg.json +1 -0
- model.layers.14/sae.safetensors +3 -0
- model.layers.15/cfg.json +1 -0
- model.layers.15/sae.safetensors +3 -0
- optimizer.pt +3 -0
- state.pt +3 -0
config.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"sae": {"expansion_factor": 32, "normalize_decoder": true, "num_latents": 0, "k": 32, "multi_topk": false}, "batch_size": 8, "grad_acc_steps": 1, "micro_acc_steps": 1, "lr": null, "lr_warmup_steps": 1000, "auxk_alpha": 0.0, "dead_feature_threshold": 10000000, "hookpoints": ["model.layers.10", "model.layers.14", "model.layers.15"], "layers": [10, 14, 15], "layer_stride": 1, "distribute_modules": false, "save_every": 1000, "log_to_wandb": true, "run_name": null, "wandb_log_frequency": 1}
|
lr_scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8932ce3add8e9547e06aa17f1456cd5d95b5de3d07b3e09782902a495c23dc7d
|
3 |
+
size 1076
|
model.layers.10/cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"expansion_factor": 32, "normalize_decoder": true, "num_latents": 0, "k": 32, "multi_topk": false, "d_in": 4096}
|
model.layers.10/sae.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f2e6658c7c873b8c1431330c3da930918602635dc03dac0b311be1e1dcd18a3
|
3 |
+
size 4295508312
|
model.layers.14/cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"expansion_factor": 32, "normalize_decoder": true, "num_latents": 0, "k": 32, "multi_topk": false, "d_in": 4096}
|
model.layers.14/sae.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c916681b50b6499b9132b941376b52881357f081e4c5cc1c22d20bc3178624e7
|
3 |
+
size 4295508312
|
model.layers.15/cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"expansion_factor": 32, "normalize_decoder": true, "num_latents": 0, "k": 32, "multi_topk": false, "d_in": 4096}
|
model.layers.15/sae.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0fb735d452659a480087b8093a9c73fd66e4e37a8c7d69357c90ab18c97545b7
|
3 |
+
size 4295508312
|
optimizer.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b40ce389cb1c62609cd06276d1ffac4461cf75d8f9f8c384e7c5645a0411ea1a
|
3 |
+
size 6455863976
|
state.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:de93b21e9e4eab77c559b56f25f31f1bfd1e94650743b0c72473d1de810d5fd1
|
3 |
+
size 3147334
|