canrager committed on
Commit d4252e9 · 1 Parent(s): 60d3d0c

Upload folder using huggingface_hub

This view is limited to 50 files because it contains too many changes.
Files changed (50):
  1. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11/trainer_0/ae.pt +3 -0
  2. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11/trainer_0/config.json +26 -0
  3. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11/trainer_1/ae.pt +3 -0
  4. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11/trainer_1/config.json +26 -0
  5. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11/trainer_2/ae.pt +3 -0
  6. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11/trainer_2/config.json +26 -0
  7. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11/trainer_3/ae.pt +3 -0
  8. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11/trainer_3/config.json +26 -0
  9. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11/trainer_4/ae.pt +3 -0
  10. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11/trainer_4/config.json +26 -0
  11. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11/trainer_5/ae.pt +3 -0
  12. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11/trainer_5/config.json +26 -0
  13. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_0_step_0/ae.pt +3 -0
  14. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_0_step_0/config.json +26 -0
  15. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_0_step_154/ae.pt +3 -0
  16. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_0_step_154/config.json +26 -0
  17. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_0_step_1544/ae.pt +3 -0
  18. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_0_step_1544/config.json +26 -0
  19. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_0_step_19531/ae.pt +3 -0
  20. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_0_step_19531/config.json +26 -0
  21. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_0_step_29296/ae.pt +3 -0
  22. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_0_step_29296/config.json +26 -0
  23. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_0_step_48/ae.pt +3 -0
  24. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_0_step_48/config.json +26 -0
  25. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_0_step_488/ae.pt +3 -0
  26. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_0_step_488/config.json +26 -0
  27. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_0_step_4882/ae.pt +3 -0
  28. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_0_step_4882/config.json +26 -0
  29. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_0_step_9765/ae.pt +3 -0
  30. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_0_step_9765/config.json +26 -0
  31. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_1_step_0/ae.pt +3 -0
  32. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_1_step_0/config.json +26 -0
  33. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_1_step_154/ae.pt +3 -0
  34. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_1_step_154/config.json +26 -0
  35. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_1_step_1544/ae.pt +3 -0
  36. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_1_step_1544/config.json +26 -0
  37. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_1_step_19531/ae.pt +3 -0
  38. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_1_step_19531/config.json +26 -0
  39. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_1_step_29296/ae.pt +3 -0
  40. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_1_step_29296/config.json +26 -0
  41. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_1_step_48/ae.pt +3 -0
  42. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_1_step_48/config.json +26 -0
  43. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_1_step_488/ae.pt +3 -0
  44. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_1_step_488/config.json +26 -0
  45. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_1_step_4882/ae.pt +3 -0
  46. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_1_step_4882/config.json +26 -0
  47. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_1_step_9765/ae.pt +3 -0
  48. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_1_step_9765/config.json +26 -0
  49. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_2_step_0/ae.pt +3 -0
  50. pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_2_step_0/config.json +26 -0
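Each trainer directory in the listing above pairs a Git LFS pointer for the SAE weights (ae.pt, roughly 268 MB) with the training configuration that produced them (config.json). Below is a minimal sketch of fetching one trainer's files with huggingface_hub; the repo_id is a hypothetical placeholder, since this commit view does not name the repository:

```python
# Sketch only: pull a single trainer's SAE weights and config from the Hub.
# REPO_ID is a hypothetical placeholder; substitute the actual repository id.
from huggingface_hub import snapshot_download

REPO_ID = "canrager/pythia-sae-sweep"  # assumption, not stated on this page
local_dir = snapshot_download(
    repo_id=REPO_ID,
    allow_patterns=[
        "pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11/trainer_0/*"
    ],
)
print(local_dir)  # local folder containing trainer_0/ae.pt and trainer_0/config.json
```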
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11/trainer_0/ae.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:f931bbd2be0cf27730cf6315612899804a86d40faa2a8acb8d6f4a2534fdaddc
+ size 268511016
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11/trainer_0/config.json ADDED
@@ -0,0 +1,26 @@
+ {
+ "trainer": {
+ "trainer_class": "TrainerTopK",
+ "dict_class": "AutoEncoderTopK",
+ "lr": 0.0002,
+ "steps": 48828,
+ "seed": 0,
+ "activation_dim": 2048,
+ "dict_size": 16384,
+ "k": 20,
+ "device": "cuda:0",
+ "layer": 11,
+ "lm_name": "EleutherAI/pythia-1.4b-deduped",
+ "wandb_name": "TopKTrainer-EleutherAI/pythia-1.4b-deduped-resid_post_layer_11",
+ "submodule_name": "resid_post_layer_11"
+ },
+ "buffer": {
+ "d_submodule": 2048,
+ "io": "out",
+ "n_ctxs": 2000,
+ "ctx_len": 128,
+ "refresh_batch_size": 24,
+ "out_batch_size": 4096,
+ "device": "cuda:0"
+ }
+ }
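For reference, the trainer block above describes a TopK sparse autoencoder (a dictionary of 16384 latents over a 2048-dimensional residual stream, with k = 20 active latents) trained for 48828 steps on layer 11 of EleutherAI/pythia-1.4b-deduped, with activations buffered from 2000 contexts of 128 tokens. A minimal sketch of reading such a checkpoint with plain PyTorch follows; it does not use the TrainerTopK / AutoEncoderTopK classes named in the config, and the parameter key names are assumptions about what ae.pt contains:

```python
# Minimal sketch, not the reference implementation: load config.json and ae.pt
# and apply a generic TopK encode (keep the k largest pre-activations, zero the rest).
import json
import torch

with open("trainer_0/config.json") as f:
    cfg = json.load(f)["trainer"]

state = torch.load("trainer_0/ae.pt", map_location="cpu")  # assumed to be a plain state dict

def topk_encode(x, W_enc, b_enc, k):
    """Keep only the k largest pre-activations per row and zero everything else."""
    pre = x @ W_enc + b_enc                      # [batch, dict_size]
    vals, idx = pre.topk(k, dim=-1)
    codes = torch.zeros_like(pre)
    return codes.scatter_(-1, idx, vals.relu())

# "encoder.weight" / "encoder.bias" are assumed key names, not taken from this page.
x = torch.randn(4, cfg["activation_dim"])
codes = topk_encode(x, state["encoder.weight"].T, state["encoder.bias"], cfg["k"])
print(codes.shape, (codes != 0).sum(dim=-1))     # at most k active latents per row
```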
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11/trainer_1/ae.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:77c04025750f094a1207b5c13d9c0513bfb6738d7b56ccf82823b5cece85ec97
+ size 268511016
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11/trainer_1/config.json ADDED
@@ -0,0 +1,26 @@
+ {
+ "trainer": {
+ "trainer_class": "TrainerTopK",
+ "dict_class": "AutoEncoderTopK",
+ "lr": 0.0002,
+ "steps": 48828,
+ "seed": 0,
+ "activation_dim": 2048,
+ "dict_size": 16384,
+ "k": 40,
+ "device": "cuda:0",
+ "layer": 11,
+ "lm_name": "EleutherAI/pythia-1.4b-deduped",
+ "wandb_name": "TopKTrainer-EleutherAI/pythia-1.4b-deduped-resid_post_layer_11",
+ "submodule_name": "resid_post_layer_11"
+ },
+ "buffer": {
+ "d_submodule": 2048,
+ "io": "out",
+ "n_ctxs": 2000,
+ "ctx_len": 128,
+ "refresh_batch_size": 24,
+ "out_batch_size": 4096,
+ "device": "cuda:0"
+ }
+ }
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11/trainer_2/ae.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:777821e6b4ba99d790da876723dc8e934cb1723b8126a848baa763bb716050ec
+ size 268511016
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11/trainer_2/config.json ADDED
@@ -0,0 +1,26 @@
+ {
+ "trainer": {
+ "trainer_class": "TrainerTopK",
+ "dict_class": "AutoEncoderTopK",
+ "lr": 0.0002,
+ "steps": 48828,
+ "seed": 0,
+ "activation_dim": 2048,
+ "dict_size": 16384,
+ "k": 80,
+ "device": "cuda:0",
+ "layer": 11,
+ "lm_name": "EleutherAI/pythia-1.4b-deduped",
+ "wandb_name": "TopKTrainer-EleutherAI/pythia-1.4b-deduped-resid_post_layer_11",
+ "submodule_name": "resid_post_layer_11"
+ },
+ "buffer": {
+ "d_submodule": 2048,
+ "io": "out",
+ "n_ctxs": 2000,
+ "ctx_len": 128,
+ "refresh_batch_size": 24,
+ "out_batch_size": 4096,
+ "device": "cuda:0"
+ }
+ }
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11/trainer_3/ae.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:9165f71a2c18bc3a3c5db1008be308f7dff6bf8c89227924af9cb3065de69064
+ size 268511016
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11/trainer_3/config.json ADDED
@@ -0,0 +1,26 @@
+ {
+ "trainer": {
+ "trainer_class": "TrainerTopK",
+ "dict_class": "AutoEncoderTopK",
+ "lr": 0.0002,
+ "steps": 48828,
+ "seed": 0,
+ "activation_dim": 2048,
+ "dict_size": 16384,
+ "k": 160,
+ "device": "cuda:0",
+ "layer": 11,
+ "lm_name": "EleutherAI/pythia-1.4b-deduped",
+ "wandb_name": "TopKTrainer-EleutherAI/pythia-1.4b-deduped-resid_post_layer_11",
+ "submodule_name": "resid_post_layer_11"
+ },
+ "buffer": {
+ "d_submodule": 2048,
+ "io": "out",
+ "n_ctxs": 2000,
+ "ctx_len": 128,
+ "refresh_batch_size": 24,
+ "out_batch_size": 4096,
+ "device": "cuda:0"
+ }
+ }
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11/trainer_4/ae.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:bd61e41012e58b8d9599f2cc17d064146bf530fae5c81420128b6c6c91dd05af
+ size 268511016
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11/trainer_4/config.json ADDED
@@ -0,0 +1,26 @@
+ {
+ "trainer": {
+ "trainer_class": "TrainerTopK",
+ "dict_class": "AutoEncoderTopK",
+ "lr": 0.0002,
+ "steps": 48828,
+ "seed": 0,
+ "activation_dim": 2048,
+ "dict_size": 16384,
+ "k": 320,
+ "device": "cuda:0",
+ "layer": 11,
+ "lm_name": "EleutherAI/pythia-1.4b-deduped",
+ "wandb_name": "TopKTrainer-EleutherAI/pythia-1.4b-deduped-resid_post_layer_11",
+ "submodule_name": "resid_post_layer_11"
+ },
+ "buffer": {
+ "d_submodule": 2048,
+ "io": "out",
+ "n_ctxs": 2000,
+ "ctx_len": 128,
+ "refresh_batch_size": 24,
+ "out_batch_size": 4096,
+ "device": "cuda:0"
+ }
+ }
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11/trainer_5/ae.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:e946949d76acfd70c4e05de0701fee087ab718e6503dcef0651efc0f732713d1
+ size 268511016
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11/trainer_5/config.json ADDED
@@ -0,0 +1,26 @@
+ {
+ "trainer": {
+ "trainer_class": "TrainerTopK",
+ "dict_class": "AutoEncoderTopK",
+ "lr": 0.0002,
+ "steps": 48828,
+ "seed": 0,
+ "activation_dim": 2048,
+ "dict_size": 16384,
+ "k": 640,
+ "device": "cuda:0",
+ "layer": 11,
+ "lm_name": "EleutherAI/pythia-1.4b-deduped",
+ "wandb_name": "TopKTrainer-EleutherAI/pythia-1.4b-deduped-resid_post_layer_11",
+ "submodule_name": "resid_post_layer_11"
+ },
+ "buffer": {
+ "d_submodule": 2048,
+ "io": "out",
+ "n_ctxs": 2000,
+ "ctx_len": 128,
+ "refresh_batch_size": 24,
+ "out_batch_size": 4096,
+ "device": "cuda:0"
+ }
+ }
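The six trainer configs above are identical apart from the sparsity level: k doubles from 20 (trainer_0) to 640 (trainer_5), so the directories form a sweep over k at fixed dictionary size and learning rate. A small sketch for enumerating the sweep from the config files:

```python
# Sketch: list the k value used by each trainer in the sweep.
import json
import pathlib

root = pathlib.Path("pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11")
for cfg_path in sorted(root.glob("trainer_*/config.json")):
    k = json.loads(cfg_path.read_text())["trainer"]["k"]
    print(cfg_path.parent.name, "k =", k)  # trainer_0 k = 20 ... trainer_5 k = 640
```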
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_0_step_0/ae.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:f6adbecf89ab611c06dd7362aeed0c6223349b95ca84867cd6c4fa1aaee62e51
+ size 268511032
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_0_step_0/config.json ADDED
@@ -0,0 +1,26 @@
+ {
+ "trainer": {
+ "trainer_class": "TrainerTopK",
+ "dict_class": "AutoEncoderTopK",
+ "lr": 0.0002,
+ "steps": "0",
+ "seed": 0,
+ "activation_dim": 2048,
+ "dict_size": 16384,
+ "k": 20,
+ "device": "cuda:0",
+ "layer": 11,
+ "lm_name": "EleutherAI/pythia-1.4b-deduped",
+ "wandb_name": "TopKTrainer-EleutherAI/pythia-1.4b-deduped-resid_post_layer_11",
+ "submodule_name": "resid_post_layer_11"
+ },
+ "buffer": {
+ "d_submodule": 2048,
+ "io": "out",
+ "n_ctxs": 2000,
+ "ctx_len": 128,
+ "refresh_batch_size": 24,
+ "out_batch_size": 4096,
+ "device": "cuda:0"
+ }
+ }
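The *_checkpoints directory appears to hold intermediate snapshots of the same runs: each trainer_{i}_step_{s} folder stores the weights at step s alongside a copy of the config whose "steps" field records that snapshot step (written as a string here, unlike the final configs). Snapshots are saved densely early in training and more sparsely later. A sketch for recovering the saved steps from the folder names:

```python
# Sketch: collect the checkpoint steps saved for trainer_0 from the folder names.
import pathlib

ckpt_root = pathlib.Path(
    "pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints"
)
steps = sorted(int(p.name.rsplit("_", 1)[1]) for p in ckpt_root.glob("trainer_0_step_*"))
print(steps)  # steps visible in this (truncated) commit view: 0, 48, 154, 488, 1544, 4882, 9765, 19531, 29296
```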
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_0_step_154/ae.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:0b67e75ad65e356011f6408fa8110bc0781b2b342a7ded331c7dda307480c614
+ size 268511048
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_0_step_154/config.json ADDED
@@ -0,0 +1,26 @@
+ {
+ "trainer": {
+ "trainer_class": "TrainerTopK",
+ "dict_class": "AutoEncoderTopK",
+ "lr": 0.0002,
+ "steps": "154",
+ "seed": 0,
+ "activation_dim": 2048,
+ "dict_size": 16384,
+ "k": 20,
+ "device": "cuda:0",
+ "layer": 11,
+ "lm_name": "EleutherAI/pythia-1.4b-deduped",
+ "wandb_name": "TopKTrainer-EleutherAI/pythia-1.4b-deduped-resid_post_layer_11",
+ "submodule_name": "resid_post_layer_11"
+ },
+ "buffer": {
+ "d_submodule": 2048,
+ "io": "out",
+ "n_ctxs": 2000,
+ "ctx_len": 128,
+ "refresh_batch_size": 24,
+ "out_batch_size": 4096,
+ "device": "cuda:0"
+ }
+ }
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_0_step_1544/ae.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:1983dc5a21aef1fd81c3bc5f11f083c8e6eaa9702bce34ef9493c647b5884972
+ size 268511120
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_0_step_1544/config.json ADDED
@@ -0,0 +1,26 @@
+ {
+ "trainer": {
+ "trainer_class": "TrainerTopK",
+ "dict_class": "AutoEncoderTopK",
+ "lr": 0.0002,
+ "steps": "1544",
+ "seed": 0,
+ "activation_dim": 2048,
+ "dict_size": 16384,
+ "k": 20,
+ "device": "cuda:0",
+ "layer": 11,
+ "lm_name": "EleutherAI/pythia-1.4b-deduped",
+ "wandb_name": "TopKTrainer-EleutherAI/pythia-1.4b-deduped-resid_post_layer_11",
+ "submodule_name": "resid_post_layer_11"
+ },
+ "buffer": {
+ "d_submodule": 2048,
+ "io": "out",
+ "n_ctxs": 2000,
+ "ctx_len": 128,
+ "refresh_batch_size": 24,
+ "out_batch_size": 4096,
+ "device": "cuda:0"
+ }
+ }
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_0_step_19531/ae.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:2a6755014321c45b857963ffdf611282d3c2725576f5c0e106ad001843fdda12
+ size 268511320
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_0_step_19531/config.json ADDED
@@ -0,0 +1,26 @@
+ {
+ "trainer": {
+ "trainer_class": "TrainerTopK",
+ "dict_class": "AutoEncoderTopK",
+ "lr": 0.0002,
+ "steps": "19531",
+ "seed": 0,
+ "activation_dim": 2048,
+ "dict_size": 16384,
+ "k": 20,
+ "device": "cuda:0",
+ "layer": 11,
+ "lm_name": "EleutherAI/pythia-1.4b-deduped",
+ "wandb_name": "TopKTrainer-EleutherAI/pythia-1.4b-deduped-resid_post_layer_11",
+ "submodule_name": "resid_post_layer_11"
+ },
+ "buffer": {
+ "d_submodule": 2048,
+ "io": "out",
+ "n_ctxs": 2000,
+ "ctx_len": 128,
+ "refresh_batch_size": 24,
+ "out_batch_size": 4096,
+ "device": "cuda:0"
+ }
+ }
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_0_step_29296/ae.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:5845ca9123c5cd425cfb70f950e0d791bb99e986ed461b6d71fb5071f3d63dc3
+ size 268511320
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_0_step_29296/config.json ADDED
@@ -0,0 +1,26 @@
+ {
+ "trainer": {
+ "trainer_class": "TrainerTopK",
+ "dict_class": "AutoEncoderTopK",
+ "lr": 0.0002,
+ "steps": "29296",
+ "seed": 0,
+ "activation_dim": 2048,
+ "dict_size": 16384,
+ "k": 20,
+ "device": "cuda:0",
+ "layer": 11,
+ "lm_name": "EleutherAI/pythia-1.4b-deduped",
+ "wandb_name": "TopKTrainer-EleutherAI/pythia-1.4b-deduped-resid_post_layer_11",
+ "submodule_name": "resid_post_layer_11"
+ },
+ "buffer": {
+ "d_submodule": 2048,
+ "io": "out",
+ "n_ctxs": 2000,
+ "ctx_len": 128,
+ "refresh_batch_size": 24,
+ "out_batch_size": 4096,
+ "device": "cuda:0"
+ }
+ }
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_0_step_48/ae.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:07fe5d2d6477315d213d5eb4c4759a5186541e3be5e087512a23bb4f9cc12617
+ size 268511040
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_0_step_48/config.json ADDED
@@ -0,0 +1,26 @@
+ {
+ "trainer": {
+ "trainer_class": "TrainerTopK",
+ "dict_class": "AutoEncoderTopK",
+ "lr": 0.0002,
+ "steps": "48",
+ "seed": 0,
+ "activation_dim": 2048,
+ "dict_size": 16384,
+ "k": 20,
+ "device": "cuda:0",
+ "layer": 11,
+ "lm_name": "EleutherAI/pythia-1.4b-deduped",
+ "wandb_name": "TopKTrainer-EleutherAI/pythia-1.4b-deduped-resid_post_layer_11",
+ "submodule_name": "resid_post_layer_11"
+ },
+ "buffer": {
+ "d_submodule": 2048,
+ "io": "out",
+ "n_ctxs": 2000,
+ "ctx_len": 128,
+ "refresh_batch_size": 24,
+ "out_batch_size": 4096,
+ "device": "cuda:0"
+ }
+ }
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_0_step_488/ae.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:1bec26256c8c3ba421bb3b42a864678b00b999101543869c1ba642835be4b156
+ size 268511048
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_0_step_488/config.json ADDED
@@ -0,0 +1,26 @@
+ {
+ "trainer": {
+ "trainer_class": "TrainerTopK",
+ "dict_class": "AutoEncoderTopK",
+ "lr": 0.0002,
+ "steps": "488",
+ "seed": 0,
+ "activation_dim": 2048,
+ "dict_size": 16384,
+ "k": 20,
+ "device": "cuda:0",
+ "layer": 11,
+ "lm_name": "EleutherAI/pythia-1.4b-deduped",
+ "wandb_name": "TopKTrainer-EleutherAI/pythia-1.4b-deduped-resid_post_layer_11",
+ "submodule_name": "resid_post_layer_11"
+ },
+ "buffer": {
+ "d_submodule": 2048,
+ "io": "out",
+ "n_ctxs": 2000,
+ "ctx_len": 128,
+ "refresh_batch_size": 24,
+ "out_batch_size": 4096,
+ "device": "cuda:0"
+ }
+ }
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_0_step_4882/ae.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:d4b5711335410894032df7a45fdcc95e0c3288daae6dca00dfa501df123fcf82
+ size 268511120
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_0_step_4882/config.json ADDED
@@ -0,0 +1,26 @@
+ {
+ "trainer": {
+ "trainer_class": "TrainerTopK",
+ "dict_class": "AutoEncoderTopK",
+ "lr": 0.0002,
+ "steps": "4882",
+ "seed": 0,
+ "activation_dim": 2048,
+ "dict_size": 16384,
+ "k": 20,
+ "device": "cuda:0",
+ "layer": 11,
+ "lm_name": "EleutherAI/pythia-1.4b-deduped",
+ "wandb_name": "TopKTrainer-EleutherAI/pythia-1.4b-deduped-resid_post_layer_11",
+ "submodule_name": "resid_post_layer_11"
+ },
+ "buffer": {
+ "d_submodule": 2048,
+ "io": "out",
+ "n_ctxs": 2000,
+ "ctx_len": 128,
+ "refresh_batch_size": 24,
+ "out_batch_size": 4096,
+ "device": "cuda:0"
+ }
+ }
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_0_step_9765/ae.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:45541576a35a7e1167ea8acdb8d1ef865f24163bcffd0ee92c5ddb4a1527bd2f
+ size 268511120
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_0_step_9765/config.json ADDED
@@ -0,0 +1,26 @@
+ {
+ "trainer": {
+ "trainer_class": "TrainerTopK",
+ "dict_class": "AutoEncoderTopK",
+ "lr": 0.0002,
+ "steps": "9765",
+ "seed": 0,
+ "activation_dim": 2048,
+ "dict_size": 16384,
+ "k": 20,
+ "device": "cuda:0",
+ "layer": 11,
+ "lm_name": "EleutherAI/pythia-1.4b-deduped",
+ "wandb_name": "TopKTrainer-EleutherAI/pythia-1.4b-deduped-resid_post_layer_11",
+ "submodule_name": "resid_post_layer_11"
+ },
+ "buffer": {
+ "d_submodule": 2048,
+ "io": "out",
+ "n_ctxs": 2000,
+ "ctx_len": 128,
+ "refresh_batch_size": 24,
+ "out_batch_size": 4096,
+ "device": "cuda:0"
+ }
+ }
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_1_step_0/ae.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:f6adbecf89ab611c06dd7362aeed0c6223349b95ca84867cd6c4fa1aaee62e51
+ size 268511032
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_1_step_0/config.json ADDED
@@ -0,0 +1,26 @@
+ {
+ "trainer": {
+ "trainer_class": "TrainerTopK",
+ "dict_class": "AutoEncoderTopK",
+ "lr": 0.0002,
+ "steps": "0",
+ "seed": 0,
+ "activation_dim": 2048,
+ "dict_size": 16384,
+ "k": 40,
+ "device": "cuda:0",
+ "layer": 11,
+ "lm_name": "EleutherAI/pythia-1.4b-deduped",
+ "wandb_name": "TopKTrainer-EleutherAI/pythia-1.4b-deduped-resid_post_layer_11",
+ "submodule_name": "resid_post_layer_11"
+ },
+ "buffer": {
+ "d_submodule": 2048,
+ "io": "out",
+ "n_ctxs": 2000,
+ "ctx_len": 128,
+ "refresh_batch_size": 24,
+ "out_batch_size": 4096,
+ "device": "cuda:0"
+ }
+ }
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_1_step_154/ae.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:c4caef5ae1673ad808e2d7726be2ea3624c070025e17a6e3a70e988632b003a3
+ size 268511048
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_1_step_154/config.json ADDED
@@ -0,0 +1,26 @@
+ {
+ "trainer": {
+ "trainer_class": "TrainerTopK",
+ "dict_class": "AutoEncoderTopK",
+ "lr": 0.0002,
+ "steps": "154",
+ "seed": 0,
+ "activation_dim": 2048,
+ "dict_size": 16384,
+ "k": 40,
+ "device": "cuda:0",
+ "layer": 11,
+ "lm_name": "EleutherAI/pythia-1.4b-deduped",
+ "wandb_name": "TopKTrainer-EleutherAI/pythia-1.4b-deduped-resid_post_layer_11",
+ "submodule_name": "resid_post_layer_11"
+ },
+ "buffer": {
+ "d_submodule": 2048,
+ "io": "out",
+ "n_ctxs": 2000,
+ "ctx_len": 128,
+ "refresh_batch_size": 24,
+ "out_batch_size": 4096,
+ "device": "cuda:0"
+ }
+ }
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_1_step_1544/ae.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:baa3efb085b9a91077c06f6d7b69397242041feec0ede677f11f424c1fb30686
+ size 268511120
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_1_step_1544/config.json ADDED
@@ -0,0 +1,26 @@
+ {
+ "trainer": {
+ "trainer_class": "TrainerTopK",
+ "dict_class": "AutoEncoderTopK",
+ "lr": 0.0002,
+ "steps": "1544",
+ "seed": 0,
+ "activation_dim": 2048,
+ "dict_size": 16384,
+ "k": 40,
+ "device": "cuda:0",
+ "layer": 11,
+ "lm_name": "EleutherAI/pythia-1.4b-deduped",
+ "wandb_name": "TopKTrainer-EleutherAI/pythia-1.4b-deduped-resid_post_layer_11",
+ "submodule_name": "resid_post_layer_11"
+ },
+ "buffer": {
+ "d_submodule": 2048,
+ "io": "out",
+ "n_ctxs": 2000,
+ "ctx_len": 128,
+ "refresh_batch_size": 24,
+ "out_batch_size": 4096,
+ "device": "cuda:0"
+ }
+ }
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_1_step_19531/ae.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:990c2f403a04c9e4f15972f9f1e3d93eca79f878fd70d0a9f4c7571113040fa9
+ size 268511320
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_1_step_19531/config.json ADDED
@@ -0,0 +1,26 @@
+ {
+ "trainer": {
+ "trainer_class": "TrainerTopK",
+ "dict_class": "AutoEncoderTopK",
+ "lr": 0.0002,
+ "steps": "19531",
+ "seed": 0,
+ "activation_dim": 2048,
+ "dict_size": 16384,
+ "k": 40,
+ "device": "cuda:0",
+ "layer": 11,
+ "lm_name": "EleutherAI/pythia-1.4b-deduped",
+ "wandb_name": "TopKTrainer-EleutherAI/pythia-1.4b-deduped-resid_post_layer_11",
+ "submodule_name": "resid_post_layer_11"
+ },
+ "buffer": {
+ "d_submodule": 2048,
+ "io": "out",
+ "n_ctxs": 2000,
+ "ctx_len": 128,
+ "refresh_batch_size": 24,
+ "out_batch_size": 4096,
+ "device": "cuda:0"
+ }
+ }
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_1_step_29296/ae.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:dcb7920bb0cb1115a3966b3a81ad046e9220eed41e9626792278914c4f8035a7
+ size 268511320
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_1_step_29296/config.json ADDED
@@ -0,0 +1,26 @@
+ {
+ "trainer": {
+ "trainer_class": "TrainerTopK",
+ "dict_class": "AutoEncoderTopK",
+ "lr": 0.0002,
+ "steps": "29296",
+ "seed": 0,
+ "activation_dim": 2048,
+ "dict_size": 16384,
+ "k": 40,
+ "device": "cuda:0",
+ "layer": 11,
+ "lm_name": "EleutherAI/pythia-1.4b-deduped",
+ "wandb_name": "TopKTrainer-EleutherAI/pythia-1.4b-deduped-resid_post_layer_11",
+ "submodule_name": "resid_post_layer_11"
+ },
+ "buffer": {
+ "d_submodule": 2048,
+ "io": "out",
+ "n_ctxs": 2000,
+ "ctx_len": 128,
+ "refresh_batch_size": 24,
+ "out_batch_size": 4096,
+ "device": "cuda:0"
+ }
+ }
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_1_step_48/ae.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:1e0c4fee3f2d78c9a5cb1c1016c3a54dc2dd72f88e3fc2ab09e63157679d8c07
+ size 268511040
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_1_step_48/config.json ADDED
@@ -0,0 +1,26 @@
+ {
+ "trainer": {
+ "trainer_class": "TrainerTopK",
+ "dict_class": "AutoEncoderTopK",
+ "lr": 0.0002,
+ "steps": "48",
+ "seed": 0,
+ "activation_dim": 2048,
+ "dict_size": 16384,
+ "k": 40,
+ "device": "cuda:0",
+ "layer": 11,
+ "lm_name": "EleutherAI/pythia-1.4b-deduped",
+ "wandb_name": "TopKTrainer-EleutherAI/pythia-1.4b-deduped-resid_post_layer_11",
+ "submodule_name": "resid_post_layer_11"
+ },
+ "buffer": {
+ "d_submodule": 2048,
+ "io": "out",
+ "n_ctxs": 2000,
+ "ctx_len": 128,
+ "refresh_batch_size": 24,
+ "out_batch_size": 4096,
+ "device": "cuda:0"
+ }
+ }
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_1_step_488/ae.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:a8dd04b0baf20a9a97f5c63901f6d96b329fb9ca9f22167af7c23296fa087b08
+ size 268511048
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_1_step_488/config.json ADDED
@@ -0,0 +1,26 @@
+ {
+ "trainer": {
+ "trainer_class": "TrainerTopK",
+ "dict_class": "AutoEncoderTopK",
+ "lr": 0.0002,
+ "steps": "488",
+ "seed": 0,
+ "activation_dim": 2048,
+ "dict_size": 16384,
+ "k": 40,
+ "device": "cuda:0",
+ "layer": 11,
+ "lm_name": "EleutherAI/pythia-1.4b-deduped",
+ "wandb_name": "TopKTrainer-EleutherAI/pythia-1.4b-deduped-resid_post_layer_11",
+ "submodule_name": "resid_post_layer_11"
+ },
+ "buffer": {
+ "d_submodule": 2048,
+ "io": "out",
+ "n_ctxs": 2000,
+ "ctx_len": 128,
+ "refresh_batch_size": 24,
+ "out_batch_size": 4096,
+ "device": "cuda:0"
+ }
+ }
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_1_step_4882/ae.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:9861440d2992b23f094bae25bb91a4d04513194387a2ad7ff333557396280ed2
+ size 268511120
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_1_step_4882/config.json ADDED
@@ -0,0 +1,26 @@
+ {
+ "trainer": {
+ "trainer_class": "TrainerTopK",
+ "dict_class": "AutoEncoderTopK",
+ "lr": 0.0002,
+ "steps": "4882",
+ "seed": 0,
+ "activation_dim": 2048,
+ "dict_size": 16384,
+ "k": 40,
+ "device": "cuda:0",
+ "layer": 11,
+ "lm_name": "EleutherAI/pythia-1.4b-deduped",
+ "wandb_name": "TopKTrainer-EleutherAI/pythia-1.4b-deduped-resid_post_layer_11",
+ "submodule_name": "resid_post_layer_11"
+ },
+ "buffer": {
+ "d_submodule": 2048,
+ "io": "out",
+ "n_ctxs": 2000,
+ "ctx_len": 128,
+ "refresh_batch_size": 24,
+ "out_batch_size": 4096,
+ "device": "cuda:0"
+ }
+ }
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_1_step_9765/ae.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:2270228e169e6210fe2544982668f8345b32d7d0dbe2c65127f650929905054c
+ size 268511120
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_1_step_9765/config.json ADDED
@@ -0,0 +1,26 @@
+ {
+ "trainer": {
+ "trainer_class": "TrainerTopK",
+ "dict_class": "AutoEncoderTopK",
+ "lr": 0.0002,
+ "steps": "9765",
+ "seed": 0,
+ "activation_dim": 2048,
+ "dict_size": 16384,
+ "k": 40,
+ "device": "cuda:0",
+ "layer": 11,
+ "lm_name": "EleutherAI/pythia-1.4b-deduped",
+ "wandb_name": "TopKTrainer-EleutherAI/pythia-1.4b-deduped-resid_post_layer_11",
+ "submodule_name": "resid_post_layer_11"
+ },
+ "buffer": {
+ "d_submodule": 2048,
+ "io": "out",
+ "n_ctxs": 2000,
+ "ctx_len": 128,
+ "refresh_batch_size": 24,
+ "out_batch_size": 4096,
+ "device": "cuda:0"
+ }
+ }
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_2_step_0/ae.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:f6adbecf89ab611c06dd7362aeed0c6223349b95ca84867cd6c4fa1aaee62e51
+ size 268511032
pythia1.4b/pythia1.4b_sweep_topk_ctx128_0913/resid_post_layer_11_checkpoints/trainer_2_step_0/config.json ADDED
@@ -0,0 +1,26 @@
+ {
+ "trainer": {
+ "trainer_class": "TrainerTopK",
+ "dict_class": "AutoEncoderTopK",
+ "lr": 0.0002,
+ "steps": "0",
+ "seed": 0,
+ "activation_dim": 2048,
+ "dict_size": 16384,
+ "k": 80,
+ "device": "cuda:0",
+ "layer": 11,
+ "lm_name": "EleutherAI/pythia-1.4b-deduped",
+ "wandb_name": "TopKTrainer-EleutherAI/pythia-1.4b-deduped-resid_post_layer_11",
+ "submodule_name": "resid_post_layer_11"
+ },
+ "buffer": {
+ "d_submodule": 2048,
+ "io": "out",
+ "n_ctxs": 2000,
+ "ctx_len": 128,
+ "refresh_batch_size": 24,
+ "out_batch_size": 4096,
+ "device": "cuda:0"
+ }
+ }