Upload 11 files
Browse files
- cfg.json +1 -0
- gpt_neox.layers.0/cfg.json +1 -0
- gpt_neox.layers.0/sae.safetensors +3 -0
- gpt_neox.layers.1/cfg.json +1 -0
- gpt_neox.layers.1/sae.safetensors +3 -0
- gpt_neox.layers.2/cfg.json +1 -0
- gpt_neox.layers.2/sae.safetensors +3 -0
- gpt_neox.layers.4/cfg.json +1 -0
- gpt_neox.layers.4/sae.safetensors +3 -0
- gpt_neox.layers.5/cfg.json +1 -0
- gpt_neox.layers.5/sae.safetensors +3 -0
cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"sae": {"expansion_factor": 64, "normalize_decoder": true, "num_latents": 0, "k": 32, "multi_topk": false}, "batch_size": 4, "grad_acc_steps": 8, "micro_acc_steps": 2, "lr": null, "lr_warmup_steps": 1000, "auxk_alpha": 0.0, "dead_feature_threshold": 10000000, "hookpoints": ["gpt_neox.layers.0", "gpt_neox.layers.1", "gpt_neox.layers.2", "gpt_neox.layers.3", "gpt_neox.layers.4", "gpt_neox.layers.5"], "layers": [0, 1, 2, 3, 4, 5], "layer_stride": 1, "distribute_modules": false, "save_every": 1000, "max_tokens": 1000000000, "log_to_wandb": false, "run_name": "/home/random_sae/experiments/saved_models/pythia-70m-deduped_64_k32/redpajama-data-1t-sample_plain_text_100M_rerandomised", "wandb_log_frequency": 1}
|
gpt_neox.layers.0/cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"expansion_factor": 64, "normalize_decoder": true, "num_latents": 0, "k": 32, "multi_topk": false, "d_in": 512}
|
gpt_neox.layers.0/sae.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aeceb7a016df334e27ee71fb6565289e52685b4e98c461afff8240da17c1cd07
|
3 |
+
size 134351176
|
gpt_neox.layers.1/cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"expansion_factor": 64, "normalize_decoder": true, "num_latents": 0, "k": 32, "multi_topk": false, "d_in": 512}
|
gpt_neox.layers.1/sae.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea2fbc2ff64140b968d9e9f5519c0d037a7a69b062ad8790d58953424c3d5312
|
3 |
+
size 134351176
|
gpt_neox.layers.2/cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"expansion_factor": 64, "normalize_decoder": true, "num_latents": 0, "k": 32, "multi_topk": false, "d_in": 512}
|
gpt_neox.layers.2/sae.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f8abb524f81afc7a9e2ffae1a8c229d5f7a78a71b7616575c5caeb2a43fbc58
|
3 |
+
size 134351176
|
gpt_neox.layers.4/cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"expansion_factor": 64, "normalize_decoder": true, "num_latents": 0, "k": 32, "multi_topk": false, "d_in": 512}
|
gpt_neox.layers.4/sae.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:81aafb814a9a9822eaa2599ca9bf0b43e88311d9a01dad71b6b84736167d472b
|
3 |
+
size 134351176
|
gpt_neox.layers.5/cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"expansion_factor": 64, "normalize_decoder": true, "num_latents": 0, "k": 32, "multi_topk": false, "d_in": 512}
|
gpt_neox.layers.5/sae.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e58365f6b86de229a20b334ffe9f99bf304ae527f10fdc6153fe97bc796e6ce4
|
3 |
+
size 134351176
|