diff --git a/.gitattributes b/.gitattributes
index a6344aac8c09253b3b630fb776ae94478aa0275b..e993dca7b2554ac0d56ad8267b153248b4253315 100644
--- a/.gitattributes
+++ b/.gitattributes
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+benchmark_stats.png filter=lfs diff=lfs merge=lfs -text
diff --git a/benchmark_stats.csv b/benchmark_stats.csv
new file mode 100644
index 0000000000000000000000000000000000000000..d7a7d35fdaee59372e15cfc3711efb67b8ac69a1
--- /dev/null
+++ b/benchmark_stats.csv
@@ -0,0 +1,13 @@
+,version,d_sae,layer,kl_div_with_sae,kl_div_with_ablation,ce_loss_with_sae,ce_loss_without_sae,ce_loss_with_ablation,kl_div_score,ce_loss_score,l2_norm_in,l2_norm_out,l2_ratio,l0,l1,explained_variance,mse,total_tokens_evaluated,filepath
+OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_0/metrics.json,5,32,0,0.0048454091884195805,3.094083309173584,3.6054646968841553,3.599064588546753,6.694648742675781,0.9984339758486613,0.9979325038445924,29.933448791503906,29.601543426513672,0.9893707036972046,32.0,71.21115112304688,0.9667970538139343,21.729291915893555,6144.0,OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_0/metrics.json
+OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_1/metrics.json,5,32,1,0.006601419299840927,0.05105271190404892,3.605595588684082,3.599064588546753,3.6525371074676514,0.8706940522131719,0.8778624933119316,18.973735809326172,17.91716766357422,0.910649299621582,32.0,86.5653305053711,0.8854424357414246,25.637441635131836,6144.0,OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_1/metrics.json
+OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_2/metrics.json,5,32,2,0.00936876516789198,0.05874736234545708,3.601879119873047,3.599064588546753,3.6459126472473145,0.8405244968650671,0.9399221354232932,49.106536865234375,47.64448165893555,0.8887979388237,31.875,85.81163024902344,0.9745470285415649,37.83729553222656,6144.0,OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_2/metrics.json
+OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_3/metrics.json,5,32,3,0.010681239888072014,0.07059153914451599,3.6096014976501465,3.599064588546753,3.658677577972412,0.8486895169376428,0.823244745735597,16.98731803894043,15.157210350036621,0.8746687173843384,31.91145896911621,85.93821716308594,0.7805342078208923,50.548057556152344,6144.0,OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_3/metrics.json
+OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_4/metrics.json,5,32,4,0.012658017687499523,0.06332532316446304,3.611159086227417,3.599064588546753,3.6600804328918457,0.8001112816333331,0.8017810322797447,17.251985549926758,15.012179374694824,0.8525444865226746,31.95556640625,82.4767074584961,0.7294961810112,63.70451354980469,6144.0,OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_4/metrics.json
+OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_5/metrics.json,5,32,5,0.014466611668467522,0.06850520521402359,3.613976240158081,3.599064588546753,3.6693859100341797,0.7888246356861349,0.7879497811486054,18.888967514038086,16.209918975830078,0.8484395742416382,32.0,81.43401336669922,0.7174215316772461,87.28172302246094,6144.0,OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_5/metrics.json
+OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_6/metrics.json,5,32,6,0.016599537804722786,0.07569437474012375,3.6187987327575684,3.599064588546753,3.67651629447937,0.7807031518298047,0.7452071071490137,21.466564178466797,18.40247344970703,0.852634608745575,32.0,78.82976531982422,0.7063077688217163,117.07249450683594,6144.0,OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_6/metrics.json
+OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_7/metrics.json,5,32,7,0.017009764909744263,0.08048636466264725,3.614975929260254,3.599064588546753,3.6727118492126465,0.7886627756013151,0.7839520361024154,25.444438934326172,22.004989624023438,0.8624889254570007,32.0,76.41993713378906,0.7180025577545166,157.79141235351562,6144.0,OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_7/metrics.json
+OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_8/metrics.json,5,32,8,0.01810324750840664,0.08732372522354126,3.6162450313568115,3.599064588546753,3.6803367137908936,0.792688098657451,0.7886059610420089,30.250225067138672,26.306936264038086,0.8676368594169617,32.0,76.72819519042969,0.7239155769348145,219.98291015625,6144.0,OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_8/metrics.json
+OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_9/metrics.json,5,32,9,0.01999707892537117,0.09758877754211426,3.6174559593200684,3.599064588546753,3.6962451934814453,0.7950883346526042,0.8107506041388108,40.192413330078125,35.94580841064453,0.8897998332977295,32.0,72.42656707763672,0.7423521876335144,318.1434326171875,6144.0,OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_9/metrics.json
+OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_10/metrics.json,5,32,10,0.02311515063047409,0.12674781680107117,3.6171722412109375,3.599064588546753,3.708984136581421,0.8176288064452188,0.8352644912761693,81.75682830810547,78.3930892944336,0.9553598165512085,32.0,50.45811462402344,0.7926573753356934,514.5535888671875,6144.0,OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_10/metrics.json
+OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_11/metrics.json,5,32,11,0.028952505439519882,0.17384076118469238,3.62371826171875,3.599064588546753,3.783318281173706,0.8334538732906256,0.8661971284238421,92.90629577636719,87.66377258300781,0.9233807325363159,32.0,73.98703002929688,0.840599000453949,742.95751953125,6144.0,OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_11/metrics.json
diff --git a/benchmark_stats.html b/benchmark_stats.html
new file mode 100644
index 0000000000000000000000000000000000000000..2d16c17e7e3ee01da8e247b83b841ee97f090ebd
--- /dev/null
+++ b/benchmark_stats.html
@@ -0,0 +1,646 @@
+<style type="text/css">
+#T_03f5d_row0_col2, #T_03f5d_row0_col3, #T_03f5d_row0_col6, #T_03f5d_row0_col16, #T_03f5d_row0_col17, #T_03f5d_row1_col4, #T_03f5d_row1_col6, #T_03f5d_row1_col7, #T_03f5d_row1_col17, #T_03f5d_row2_col4, #T_03f5d_row2_col5, #T_03f5d_row2_col6, #T_03f5d_row2_col7, #T_03f5d_row2_col13, #T_03f5d_row2_col17, #T_03f5d_row3_col6, #T_03f5d_row3_col10, #T_03f5d_row3_col11, #T_03f5d_row3_col17, #T_03f5d_row4_col6, #T_03f5d_row4_col10, #T_03f5d_row4_col11, #T_03f5d_row4_col17, #T_03f5d_row5_col6, #T_03f5d_row5_col12, #T_03f5d_row5_col17, #T_03f5d_row6_col6, #T_03f5d_row6_col8, #T_03f5d_row6_col9, #T_03f5d_row6_col15, #T_03f5d_row6_col17, #T_03f5d_row7_col6, #T_03f5d_row7_col17, #T_03f5d_row8_col6, #T_03f5d_row8_col17, #T_03f5d_row9_col6, #T_03f5d_row9_col17, #T_03f5d_row10_col6, #T_03f5d_row10_col14, #T_03f5d_row10_col17, #T_03f5d_row11_col6, #T_03f5d_row11_col17 {
+  background-color: #440154;
+  color: #f1f1f1;
+}
+#T_03f5d_row0_col4, #T_03f5d_row0_col7, #T_03f5d_row0_col8, #T_03f5d_row0_col9, #T_03f5d_row0_col12, #T_03f5d_row0_col13, #T_03f5d_row1_col13, #T_03f5d_row1_col14, #T_03f5d_row2_col15, #T_03f5d_row5_col13, #T_03f5d_row6_col13, #T_03f5d_row7_col13, #T_03f5d_row8_col13, #T_03f5d_row9_col13, #T_03f5d_row10_col13, #T_03f5d_row11_col2, #T_03f5d_row11_col3, #T_03f5d_row11_col5, #T_03f5d_row11_col10, #T_03f5d_row11_col11, #T_03f5d_row11_col13, #T_03f5d_row11_col16 {
+  background-color: #fde725;
+  color: #000000;
+}
+#T_03f5d_row0_col5 {
+  background-color: #443983;
+  color: #f1f1f1;
+}
+#T_03f5d_row0_col10, #T_03f5d_row1_col5, #T_03f5d_row5_col9, #T_03f5d_row8_col9, #T_03f5d_row10_col8 {
+  background-color: #443a83;
+  color: #f1f1f1;
+}
+#T_03f5d_row0_col11 {
+  background-color: #414487;
+  color: #f1f1f1;
+}
+#T_03f5d_row0_col14 {
+  background-color: #1fa287;
+  color: #f1f1f1;
+}
+#T_03f5d_row0_col15 {
+  background-color: #ece51b;
+  color: #000000;
+}
+#T_03f5d_row1_col2, #T_03f5d_row5_col16 {
+  background-color: #482173;
+  color: #f1f1f1;
+}
+#T_03f5d_row1_col3 {
+  background-color: #481b6d;
+  color: #f1f1f1;
+}
+#T_03f5d_row1_col8, #T_03f5d_row9_col16 {
+  background-color: #297b8e;
+  color: #f1f1f1;
+}
+#T_03f5d_row1_col9 {
+  background-color: #1f968b;
+  color: #f1f1f1;
+}
+#T_03f5d_row1_col10, #T_03f5d_row5_col10, #T_03f5d_row10_col4 {
+  background-color: #460a5d;
+  color: #f1f1f1;
+}
+#T_03f5d_row1_col11, #T_03f5d_row3_col16, #T_03f5d_row5_col15, #T_03f5d_row11_col4 {
+  background-color: #471063;
+  color: #f1f1f1;
+}
+#T_03f5d_row1_col12 {
+  background-color: #26828e;
+  color: #f1f1f1;
+}
+#T_03f5d_row1_col15 {
+  background-color: #35b779;
+  color: #f1f1f1;
+}
+#T_03f5d_row1_col16, #T_03f5d_row3_col4, #T_03f5d_row3_col7, #T_03f5d_row4_col4, #T_03f5d_row4_col7, #T_03f5d_row5_col4, #T_03f5d_row5_col7 {
+  background-color: #440256;
+  color: #f1f1f1;
+}
+#T_03f5d_row2_col2 {
+  background-color: #433e85;
+  color: #f1f1f1;
+}
+#T_03f5d_row2_col3, #T_03f5d_row7_col16 {
+  background-color: #424086;
+  color: #f1f1f1;
+}
+#T_03f5d_row2_col8, #T_03f5d_row3_col15, #T_03f5d_row8_col16 {
+  background-color: #38598c;
+  color: #f1f1f1;
+}
+#T_03f5d_row2_col9 {
+  background-color: #69cd5b;
+  color: #000000;
+}
+#T_03f5d_row2_col10, #T_03f5d_row4_col5 {
+  background-color: #277e8e;
+  color: #f1f1f1;
+}
+#T_03f5d_row2_col11 {
+  background-color: #25838e;
+  color: #f1f1f1;
+}
+#T_03f5d_row2_col12, #T_03f5d_row9_col11 {
+  background-color: #365c8d;
+  color: #f1f1f1;
+}
+#T_03f5d_row2_col14 {
+  background-color: #f1e51d;
+  color: #000000;
+}
+#T_03f5d_row2_col16, #T_03f5d_row10_col7 {
+  background-color: #46085c;
+  color: #f1f1f1;
+}
+#T_03f5d_row3_col2 {
+  background-color: #38588c;
+  color: #f1f1f1;
+}
+#T_03f5d_row3_col3 {
+  background-color: #3c4f8a;
+  color: #f1f1f1;
+}
+#T_03f5d_row3_col5 {
+  background-color: #2e6d8e;
+  color: #f1f1f1;
+}
+#T_03f5d_row3_col8, #T_03f5d_row3_col9 {
+  background-color: #33628d;
+  color: #f1f1f1;
+}
+#T_03f5d_row3_col12 {
+  background-color: #423f85;
+  color: #f1f1f1;
+}
+#T_03f5d_row3_col13 {
+  background-color: #365d8d;
+  color: #f1f1f1;
+}
+#T_03f5d_row3_col14 {
+  background-color: #f4e61e;
+  color: #000000;
+}
+#T_03f5d_row4_col2 {
+  background-color: #2d708e;
+  color: #f1f1f1;
+}
+#T_03f5d_row4_col3, #T_03f5d_row10_col15 {
+  background-color: #32658e;
+  color: #f1f1f1;
+}
+#T_03f5d_row4_col8, #T_03f5d_row4_col15 {
+  background-color: #482071;
+  color: #f1f1f1;
+}
+#T_03f5d_row4_col9 {
+  background-color: #3e4a89;
+  color: #f1f1f1;
+}
+#T_03f5d_row4_col12, #T_03f5d_row6_col12 {
+  background-color: #460b5e;
+  color: #f1f1f1;
+}
+#T_03f5d_row4_col13 {
+  background-color: #2eb37c;
+  color: #f1f1f1;
+}
+#T_03f5d_row4_col14 {
+  background-color: #b5de2b;
+  color: #000000;
+}
+#T_03f5d_row4_col16, #T_03f5d_row8_col8 {
+  background-color: #481668;
+  color: #f1f1f1;
+}
+#T_03f5d_row5_col2 {
+  background-color: #25858e;
+  color: #f1f1f1;
+}
+#T_03f5d_row5_col3 {
+  background-color: #2a788e;
+  color: #f1f1f1;
+}
+#T_03f5d_row5_col5 {
+  background-color: #1e9d89;
+  color: #f1f1f1;
+}
+#T_03f5d_row5_col8, #T_03f5d_row7_col8 {
+  background-color: #470e61;
+  color: #f1f1f1;
+}
+#T_03f5d_row5_col11, #T_03f5d_row9_col7 {
+  background-color: #46075a;
+  color: #f1f1f1;
+}
+#T_03f5d_row5_col14 {
+  background-color: #a0da39;
+  color: #000000;
+}
+#T_03f5d_row6_col2 {
+  background-color: #1e9b8a;
+  color: #f1f1f1;
+}
+#T_03f5d_row6_col3 {
+  background-color: #228d8d;
+  color: #f1f1f1;
+}
+#T_03f5d_row6_col4, #T_03f5d_row6_col7, #T_03f5d_row7_col4, #T_03f5d_row7_col7, #T_03f5d_row8_col7 {
+  background-color: #450457;
+  color: #f1f1f1;
+}
+#T_03f5d_row6_col5 {
+  background-color: #6ccd5a;
+  color: #000000;
+}
+#T_03f5d_row6_col10 {
+  background-color: #481769;
+  color: #f1f1f1;
+}
+#T_03f5d_row6_col11, #T_03f5d_row7_col15, #T_03f5d_row11_col7 {
+  background-color: #471164;
+  color: #f1f1f1;
+}
+#T_03f5d_row6_col14 {
+  background-color: #73d056;
+  color: #000000;
+}
+#T_03f5d_row6_col16 {
+  background-color: #472e7c;
+  color: #f1f1f1;
+}
+#T_03f5d_row7_col2 {
+  background-color: #2ab07f;
+  color: #f1f1f1;
+}
+#T_03f5d_row7_col3 {
+  background-color: #20928c;
+  color: #f1f1f1;
+}
+#T_03f5d_row7_col5 {
+  background-color: #22a884;
+  color: #f1f1f1;
+}
+#T_03f5d_row7_col9, #T_03f5d_row8_col11 {
+  background-color: #453581;
+  color: #f1f1f1;
+}
+#T_03f5d_row7_col10 {
+  background-color: #482878;
+  color: #f1f1f1;
+}
+#T_03f5d_row7_col11 {
+  background-color: #482374;
+  color: #f1f1f1;
+}
+#T_03f5d_row7_col12 {
+  background-color: #482475;
+  color: #f1f1f1;
+}
+#T_03f5d_row7_col14 {
+  background-color: #4ec36b;
+  color: #000000;
+}
+#T_03f5d_row8_col2, #T_03f5d_row8_col14 {
+  background-color: #52c569;
+  color: #000000;
+}
+#T_03f5d_row8_col3 {
+  background-color: #1e9c89;
+  color: #f1f1f1;
+}
+#T_03f5d_row8_col4, #T_03f5d_row9_col4 {
+  background-color: #450559;
+  color: #f1f1f1;
+}
+#T_03f5d_row8_col5 {
+  background-color: #32b67a;
+  color: #f1f1f1;
+}
+#T_03f5d_row8_col10 {
+  background-color: #443b84;
+  color: #f1f1f1;
+}
+#T_03f5d_row8_col12, #T_03f5d_row9_col15 {
+  background-color: #472f7d;
+  color: #f1f1f1;
+}
+#T_03f5d_row8_col15, #T_03f5d_row9_col8 {
+  background-color: #48186a;
+  color: #f1f1f1;
+}
+#T_03f5d_row9_col2 {
+  background-color: #86d549;
+  color: #000000;
+}
+#T_03f5d_row9_col3 {
+  background-color: #28ae80;
+  color: #f1f1f1;
+}
+#T_03f5d_row9_col5 {
+  background-color: #4ac16d;
+  color: #000000;
+}
+#T_03f5d_row9_col9 {
+  background-color: #3a548c;
+  color: #f1f1f1;
+}
+#T_03f5d_row9_col10 {
+  background-color: #34618d;
+  color: #f1f1f1;
+}
+#T_03f5d_row9_col12 {
+  background-color: #355e8d;
+  color: #f1f1f1;
+}
+#T_03f5d_row9_col14 {
+  background-color: #24aa83;
+  color: #f1f1f1;
+}
+#T_03f5d_row10_col2 {
+  background-color: #c2df23;
+  color: #000000;
+}
+#T_03f5d_row10_col3, #T_03f5d_row10_col12 {
+  background-color: #63cb5f;
+  color: #000000;
+}
+#T_03f5d_row10_col5 {
+  background-color: #44bf70;
+  color: #f1f1f1;
+}
+#T_03f5d_row10_col9 {
+  background-color: #2e6e8e;
+  color: #f1f1f1;
+}
+#T_03f5d_row10_col10 {
+  background-color: #9dd93b;
+  color: #000000;
+}
+#T_03f5d_row10_col11 {
+  background-color: #aadc32;
+  color: #000000;
+}
+#T_03f5d_row10_col16 {
+  background-color: #3bbb75;
+  color: #f1f1f1;
+}
+#T_03f5d_row11_col8 {
+  background-color: #3c508b;
+  color: #f1f1f1;
+}
+#T_03f5d_row11_col9 {
+  background-color: #228b8d;
+  color: #f1f1f1;
+}
+#T_03f5d_row11_col12 {
+  background-color: #1f988b;
+  color: #f1f1f1;
+}
+#T_03f5d_row11_col14 {
+  background-color: #2fb47c;
+  color: #f1f1f1;
+}
+#T_03f5d_row11_col15 {
+  background-color: #21918c;
+  color: #f1f1f1;
+}
+</style>
+<table id="T_03f5d">
+  <thead>
+    <tr>
+      <th class="blank level0" >&nbsp;</th>
+      <th id="T_03f5d_level0_col0" class="col_heading level0 col0" >version</th>
+      <th id="T_03f5d_level0_col1" class="col_heading level0 col1" >d_sae</th>
+      <th id="T_03f5d_level0_col2" class="col_heading level0 col2" >layer</th>
+      <th id="T_03f5d_level0_col3" class="col_heading level0 col3" >kl_div_with_sae</th>
+      <th id="T_03f5d_level0_col4" class="col_heading level0 col4" >kl_div_with_ablation</th>
+      <th id="T_03f5d_level0_col5" class="col_heading level0 col5" >ce_loss_with_sae</th>
+      <th id="T_03f5d_level0_col6" class="col_heading level0 col6" >ce_loss_without_sae</th>
+      <th id="T_03f5d_level0_col7" class="col_heading level0 col7" >ce_loss_with_ablation</th>
+      <th id="T_03f5d_level0_col8" class="col_heading level0 col8" >kl_div_score</th>
+      <th id="T_03f5d_level0_col9" class="col_heading level0 col9" >ce_loss_score</th>
+      <th id="T_03f5d_level0_col10" class="col_heading level0 col10" >l2_norm_in</th>
+      <th id="T_03f5d_level0_col11" class="col_heading level0 col11" >l2_norm_out</th>
+      <th id="T_03f5d_level0_col12" class="col_heading level0 col12" >l2_ratio</th>
+      <th id="T_03f5d_level0_col13" class="col_heading level0 col13" >l0</th>
+      <th id="T_03f5d_level0_col14" class="col_heading level0 col14" >l1</th>
+      <th id="T_03f5d_level0_col15" class="col_heading level0 col15" >explained_variance</th>
+      <th id="T_03f5d_level0_col16" class="col_heading level0 col16" >mse</th>
+      <th id="T_03f5d_level0_col17" class="col_heading level0 col17" >total_tokens_evaluated</th>
+      <th id="T_03f5d_level0_col18" class="col_heading level0 col18" >filepath</th>
+    </tr>
+  </thead>
+  <tbody>
+    <tr>
+      <th id="T_03f5d_level0_row0" class="row_heading level0 row0" >OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_0/metrics.json</th>
+      <td id="T_03f5d_row0_col0" class="data row0 col0" >5</td>
+      <td id="T_03f5d_row0_col1" class="data row0 col1" >32</td>
+      <td id="T_03f5d_row0_col2" class="data row0 col2" >0</td>
+      <td id="T_03f5d_row0_col3" class="data row0 col3" >0.004845</td>
+      <td id="T_03f5d_row0_col4" class="data row0 col4" >3.094083</td>
+      <td id="T_03f5d_row0_col5" class="data row0 col5" >3.605465</td>
+      <td id="T_03f5d_row0_col6" class="data row0 col6" >3.599065</td>
+      <td id="T_03f5d_row0_col7" class="data row0 col7" >6.694649</td>
+      <td id="T_03f5d_row0_col8" class="data row0 col8" >0.998434</td>
+      <td id="T_03f5d_row0_col9" class="data row0 col9" >0.997933</td>
+      <td id="T_03f5d_row0_col10" class="data row0 col10" >29.933449</td>
+      <td id="T_03f5d_row0_col11" class="data row0 col11" >29.601543</td>
+      <td id="T_03f5d_row0_col12" class="data row0 col12" >0.989371</td>
+      <td id="T_03f5d_row0_col13" class="data row0 col13" >32.000000</td>
+      <td id="T_03f5d_row0_col14" class="data row0 col14" >71.211151</td>
+      <td id="T_03f5d_row0_col15" class="data row0 col15" >0.966797</td>
+      <td id="T_03f5d_row0_col16" class="data row0 col16" >21.729292</td>
+      <td id="T_03f5d_row0_col17" class="data row0 col17" >6144.000000</td>
+      <td id="T_03f5d_row0_col18" class="data row0 col18" >OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_0/metrics.json</td>
+    </tr>
+    <tr>
+      <th id="T_03f5d_level0_row1" class="row_heading level0 row1" >OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_1/metrics.json</th>
+      <td id="T_03f5d_row1_col0" class="data row1 col0" >5</td>
+      <td id="T_03f5d_row1_col1" class="data row1 col1" >32</td>
+      <td id="T_03f5d_row1_col2" class="data row1 col2" >1</td>
+      <td id="T_03f5d_row1_col3" class="data row1 col3" >0.006601</td>
+      <td id="T_03f5d_row1_col4" class="data row1 col4" >0.051053</td>
+      <td id="T_03f5d_row1_col5" class="data row1 col5" >3.605596</td>
+      <td id="T_03f5d_row1_col6" class="data row1 col6" >3.599065</td>
+      <td id="T_03f5d_row1_col7" class="data row1 col7" >3.652537</td>
+      <td id="T_03f5d_row1_col8" class="data row1 col8" >0.870694</td>
+      <td id="T_03f5d_row1_col9" class="data row1 col9" >0.877862</td>
+      <td id="T_03f5d_row1_col10" class="data row1 col10" >18.973736</td>
+      <td id="T_03f5d_row1_col11" class="data row1 col11" >17.917168</td>
+      <td id="T_03f5d_row1_col12" class="data row1 col12" >0.910649</td>
+      <td id="T_03f5d_row1_col13" class="data row1 col13" >32.000000</td>
+      <td id="T_03f5d_row1_col14" class="data row1 col14" >86.565331</td>
+      <td id="T_03f5d_row1_col15" class="data row1 col15" >0.885442</td>
+      <td id="T_03f5d_row1_col16" class="data row1 col16" >25.637442</td>
+      <td id="T_03f5d_row1_col17" class="data row1 col17" >6144.000000</td>
+      <td id="T_03f5d_row1_col18" class="data row1 col18" >OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_1/metrics.json</td>
+    </tr>
+    <tr>
+      <th id="T_03f5d_level0_row2" class="row_heading level0 row2" >OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_2/metrics.json</th>
+      <td id="T_03f5d_row2_col0" class="data row2 col0" >5</td>
+      <td id="T_03f5d_row2_col1" class="data row2 col1" >32</td>
+      <td id="T_03f5d_row2_col2" class="data row2 col2" >2</td>
+      <td id="T_03f5d_row2_col3" class="data row2 col3" >0.009369</td>
+      <td id="T_03f5d_row2_col4" class="data row2 col4" >0.058747</td>
+      <td id="T_03f5d_row2_col5" class="data row2 col5" >3.601879</td>
+      <td id="T_03f5d_row2_col6" class="data row2 col6" >3.599065</td>
+      <td id="T_03f5d_row2_col7" class="data row2 col7" >3.645913</td>
+      <td id="T_03f5d_row2_col8" class="data row2 col8" >0.840524</td>
+      <td id="T_03f5d_row2_col9" class="data row2 col9" >0.939922</td>
+      <td id="T_03f5d_row2_col10" class="data row2 col10" >49.106537</td>
+      <td id="T_03f5d_row2_col11" class="data row2 col11" >47.644482</td>
+      <td id="T_03f5d_row2_col12" class="data row2 col12" >0.888798</td>
+      <td id="T_03f5d_row2_col13" class="data row2 col13" >31.875000</td>
+      <td id="T_03f5d_row2_col14" class="data row2 col14" >85.811630</td>
+      <td id="T_03f5d_row2_col15" class="data row2 col15" >0.974547</td>
+      <td id="T_03f5d_row2_col16" class="data row2 col16" >37.837296</td>
+      <td id="T_03f5d_row2_col17" class="data row2 col17" >6144.000000</td>
+      <td id="T_03f5d_row2_col18" class="data row2 col18" >OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_2/metrics.json</td>
+    </tr>
+    <tr>
+      <th id="T_03f5d_level0_row3" class="row_heading level0 row3" >OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_3/metrics.json</th>
+      <td id="T_03f5d_row3_col0" class="data row3 col0" >5</td>
+      <td id="T_03f5d_row3_col1" class="data row3 col1" >32</td>
+      <td id="T_03f5d_row3_col2" class="data row3 col2" >3</td>
+      <td id="T_03f5d_row3_col3" class="data row3 col3" >0.010681</td>
+      <td id="T_03f5d_row3_col4" class="data row3 col4" >0.070592</td>
+      <td id="T_03f5d_row3_col5" class="data row3 col5" >3.609601</td>
+      <td id="T_03f5d_row3_col6" class="data row3 col6" >3.599065</td>
+      <td id="T_03f5d_row3_col7" class="data row3 col7" >3.658678</td>
+      <td id="T_03f5d_row3_col8" class="data row3 col8" >0.848690</td>
+      <td id="T_03f5d_row3_col9" class="data row3 col9" >0.823245</td>
+      <td id="T_03f5d_row3_col10" class="data row3 col10" >16.987318</td>
+      <td id="T_03f5d_row3_col11" class="data row3 col11" >15.157210</td>
+      <td id="T_03f5d_row3_col12" class="data row3 col12" >0.874669</td>
+      <td id="T_03f5d_row3_col13" class="data row3 col13" >31.911459</td>
+      <td id="T_03f5d_row3_col14" class="data row3 col14" >85.938217</td>
+      <td id="T_03f5d_row3_col15" class="data row3 col15" >0.780534</td>
+      <td id="T_03f5d_row3_col16" class="data row3 col16" >50.548058</td>
+      <td id="T_03f5d_row3_col17" class="data row3 col17" >6144.000000</td>
+      <td id="T_03f5d_row3_col18" class="data row3 col18" >OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_3/metrics.json</td>
+    </tr>
+    <tr>
+      <th id="T_03f5d_level0_row4" class="row_heading level0 row4" >OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_4/metrics.json</th>
+      <td id="T_03f5d_row4_col0" class="data row4 col0" >5</td>
+      <td id="T_03f5d_row4_col1" class="data row4 col1" >32</td>
+      <td id="T_03f5d_row4_col2" class="data row4 col2" >4</td>
+      <td id="T_03f5d_row4_col3" class="data row4 col3" >0.012658</td>
+      <td id="T_03f5d_row4_col4" class="data row4 col4" >0.063325</td>
+      <td id="T_03f5d_row4_col5" class="data row4 col5" >3.611159</td>
+      <td id="T_03f5d_row4_col6" class="data row4 col6" >3.599065</td>
+      <td id="T_03f5d_row4_col7" class="data row4 col7" >3.660080</td>
+      <td id="T_03f5d_row4_col8" class="data row4 col8" >0.800111</td>
+      <td id="T_03f5d_row4_col9" class="data row4 col9" >0.801781</td>
+      <td id="T_03f5d_row4_col10" class="data row4 col10" >17.251986</td>
+      <td id="T_03f5d_row4_col11" class="data row4 col11" >15.012179</td>
+      <td id="T_03f5d_row4_col12" class="data row4 col12" >0.852544</td>
+      <td id="T_03f5d_row4_col13" class="data row4 col13" >31.955566</td>
+      <td id="T_03f5d_row4_col14" class="data row4 col14" >82.476707</td>
+      <td id="T_03f5d_row4_col15" class="data row4 col15" >0.729496</td>
+      <td id="T_03f5d_row4_col16" class="data row4 col16" >63.704514</td>
+      <td id="T_03f5d_row4_col17" class="data row4 col17" >6144.000000</td>
+      <td id="T_03f5d_row4_col18" class="data row4 col18" >OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_4/metrics.json</td>
+    </tr>
+    <tr>
+      <th id="T_03f5d_level0_row5" class="row_heading level0 row5" >OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_5/metrics.json</th>
+      <td id="T_03f5d_row5_col0" class="data row5 col0" >5</td>
+      <td id="T_03f5d_row5_col1" class="data row5 col1" >32</td>
+      <td id="T_03f5d_row5_col2" class="data row5 col2" >5</td>
+      <td id="T_03f5d_row5_col3" class="data row5 col3" >0.014467</td>
+      <td id="T_03f5d_row5_col4" class="data row5 col4" >0.068505</td>
+      <td id="T_03f5d_row5_col5" class="data row5 col5" >3.613976</td>
+      <td id="T_03f5d_row5_col6" class="data row5 col6" >3.599065</td>
+      <td id="T_03f5d_row5_col7" class="data row5 col7" >3.669386</td>
+      <td id="T_03f5d_row5_col8" class="data row5 col8" >0.788825</td>
+      <td id="T_03f5d_row5_col9" class="data row5 col9" >0.787950</td>
+      <td id="T_03f5d_row5_col10" class="data row5 col10" >18.888968</td>
+      <td id="T_03f5d_row5_col11" class="data row5 col11" >16.209919</td>
+      <td id="T_03f5d_row5_col12" class="data row5 col12" >0.848440</td>
+      <td id="T_03f5d_row5_col13" class="data row5 col13" >32.000000</td>
+      <td id="T_03f5d_row5_col14" class="data row5 col14" >81.434013</td>
+      <td id="T_03f5d_row5_col15" class="data row5 col15" >0.717422</td>
+      <td id="T_03f5d_row5_col16" class="data row5 col16" >87.281723</td>
+      <td id="T_03f5d_row5_col17" class="data row5 col17" >6144.000000</td>
+      <td id="T_03f5d_row5_col18" class="data row5 col18" >OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_5/metrics.json</td>
+    </tr>
+    <tr>
+      <th id="T_03f5d_level0_row6" class="row_heading level0 row6" >OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_6/metrics.json</th>
+      <td id="T_03f5d_row6_col0" class="data row6 col0" >5</td>
+      <td id="T_03f5d_row6_col1" class="data row6 col1" >32</td>
+      <td id="T_03f5d_row6_col2" class="data row6 col2" >6</td>
+      <td id="T_03f5d_row6_col3" class="data row6 col3" >0.016600</td>
+      <td id="T_03f5d_row6_col4" class="data row6 col4" >0.075694</td>
+      <td id="T_03f5d_row6_col5" class="data row6 col5" >3.618799</td>
+      <td id="T_03f5d_row6_col6" class="data row6 col6" >3.599065</td>
+      <td id="T_03f5d_row6_col7" class="data row6 col7" >3.676516</td>
+      <td id="T_03f5d_row6_col8" class="data row6 col8" >0.780703</td>
+      <td id="T_03f5d_row6_col9" class="data row6 col9" >0.745207</td>
+      <td id="T_03f5d_row6_col10" class="data row6 col10" >21.466564</td>
+      <td id="T_03f5d_row6_col11" class="data row6 col11" >18.402473</td>
+      <td id="T_03f5d_row6_col12" class="data row6 col12" >0.852635</td>
+      <td id="T_03f5d_row6_col13" class="data row6 col13" >32.000000</td>
+      <td id="T_03f5d_row6_col14" class="data row6 col14" >78.829765</td>
+      <td id="T_03f5d_row6_col15" class="data row6 col15" >0.706308</td>
+      <td id="T_03f5d_row6_col16" class="data row6 col16" >117.072495</td>
+      <td id="T_03f5d_row6_col17" class="data row6 col17" >6144.000000</td>
+      <td id="T_03f5d_row6_col18" class="data row6 col18" >OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_6/metrics.json</td>
+    </tr>
+    <tr>
+      <th id="T_03f5d_level0_row7" class="row_heading level0 row7" >OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_7/metrics.json</th>
+      <td id="T_03f5d_row7_col0" class="data row7 col0" >5</td>
+      <td id="T_03f5d_row7_col1" class="data row7 col1" >32</td>
+      <td id="T_03f5d_row7_col2" class="data row7 col2" >7</td>
+      <td id="T_03f5d_row7_col3" class="data row7 col3" >0.017010</td>
+      <td id="T_03f5d_row7_col4" class="data row7 col4" >0.080486</td>
+      <td id="T_03f5d_row7_col5" class="data row7 col5" >3.614976</td>
+      <td id="T_03f5d_row7_col6" class="data row7 col6" >3.599065</td>
+      <td id="T_03f5d_row7_col7" class="data row7 col7" >3.672712</td>
+      <td id="T_03f5d_row7_col8" class="data row7 col8" >0.788663</td>
+      <td id="T_03f5d_row7_col9" class="data row7 col9" >0.783952</td>
+      <td id="T_03f5d_row7_col10" class="data row7 col10" >25.444439</td>
+      <td id="T_03f5d_row7_col11" class="data row7 col11" >22.004990</td>
+      <td id="T_03f5d_row7_col12" class="data row7 col12" >0.862489</td>
+      <td id="T_03f5d_row7_col13" class="data row7 col13" >32.000000</td>
+      <td id="T_03f5d_row7_col14" class="data row7 col14" >76.419937</td>
+      <td id="T_03f5d_row7_col15" class="data row7 col15" >0.718003</td>
+      <td id="T_03f5d_row7_col16" class="data row7 col16" >157.791412</td>
+      <td id="T_03f5d_row7_col17" class="data row7 col17" >6144.000000</td>
+      <td id="T_03f5d_row7_col18" class="data row7 col18" >OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_7/metrics.json</td>
+    </tr>
+    <tr>
+      <th id="T_03f5d_level0_row8" class="row_heading level0 row8" >OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_8/metrics.json</th>
+      <td id="T_03f5d_row8_col0" class="data row8 col0" >5</td>
+      <td id="T_03f5d_row8_col1" class="data row8 col1" >32</td>
+      <td id="T_03f5d_row8_col2" class="data row8 col2" >8</td>
+      <td id="T_03f5d_row8_col3" class="data row8 col3" >0.018103</td>
+      <td id="T_03f5d_row8_col4" class="data row8 col4" >0.087324</td>
+      <td id="T_03f5d_row8_col5" class="data row8 col5" >3.616245</td>
+      <td id="T_03f5d_row8_col6" class="data row8 col6" >3.599065</td>
+      <td id="T_03f5d_row8_col7" class="data row8 col7" >3.680337</td>
+      <td id="T_03f5d_row8_col8" class="data row8 col8" >0.792688</td>
+      <td id="T_03f5d_row8_col9" class="data row8 col9" >0.788606</td>
+      <td id="T_03f5d_row8_col10" class="data row8 col10" >30.250225</td>
+      <td id="T_03f5d_row8_col11" class="data row8 col11" >26.306936</td>
+      <td id="T_03f5d_row8_col12" class="data row8 col12" >0.867637</td>
+      <td id="T_03f5d_row8_col13" class="data row8 col13" >32.000000</td>
+      <td id="T_03f5d_row8_col14" class="data row8 col14" >76.728195</td>
+      <td id="T_03f5d_row8_col15" class="data row8 col15" >0.723916</td>
+      <td id="T_03f5d_row8_col16" class="data row8 col16" >219.982910</td>
+      <td id="T_03f5d_row8_col17" class="data row8 col17" >6144.000000</td>
+      <td id="T_03f5d_row8_col18" class="data row8 col18" >OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_8/metrics.json</td>
+    </tr>
+    <tr>
+      <th id="T_03f5d_level0_row9" class="row_heading level0 row9" >OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_9/metrics.json</th>
+      <td id="T_03f5d_row9_col0" class="data row9 col0" >5</td>
+      <td id="T_03f5d_row9_col1" class="data row9 col1" >32</td>
+      <td id="T_03f5d_row9_col2" class="data row9 col2" >9</td>
+      <td id="T_03f5d_row9_col3" class="data row9 col3" >0.019997</td>
+      <td id="T_03f5d_row9_col4" class="data row9 col4" >0.097589</td>
+      <td id="T_03f5d_row9_col5" class="data row9 col5" >3.617456</td>
+      <td id="T_03f5d_row9_col6" class="data row9 col6" >3.599065</td>
+      <td id="T_03f5d_row9_col7" class="data row9 col7" >3.696245</td>
+      <td id="T_03f5d_row9_col8" class="data row9 col8" >0.795088</td>
+      <td id="T_03f5d_row9_col9" class="data row9 col9" >0.810751</td>
+      <td id="T_03f5d_row9_col10" class="data row9 col10" >40.192413</td>
+      <td id="T_03f5d_row9_col11" class="data row9 col11" >35.945808</td>
+      <td id="T_03f5d_row9_col12" class="data row9 col12" >0.889800</td>
+      <td id="T_03f5d_row9_col13" class="data row9 col13" >32.000000</td>
+      <td id="T_03f5d_row9_col14" class="data row9 col14" >72.426567</td>
+      <td id="T_03f5d_row9_col15" class="data row9 col15" >0.742352</td>
+      <td id="T_03f5d_row9_col16" class="data row9 col16" >318.143433</td>
+      <td id="T_03f5d_row9_col17" class="data row9 col17" >6144.000000</td>
+      <td id="T_03f5d_row9_col18" class="data row9 col18" >OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_9/metrics.json</td>
+    </tr>
+    <tr>
+      <th id="T_03f5d_level0_row10" class="row_heading level0 row10" >OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_10/metrics.json</th>
+      <td id="T_03f5d_row10_col0" class="data row10 col0" >5</td>
+      <td id="T_03f5d_row10_col1" class="data row10 col1" >32</td>
+      <td id="T_03f5d_row10_col2" class="data row10 col2" >10</td>
+      <td id="T_03f5d_row10_col3" class="data row10 col3" >0.023115</td>
+      <td id="T_03f5d_row10_col4" class="data row10 col4" >0.126748</td>
+      <td id="T_03f5d_row10_col5" class="data row10 col5" >3.617172</td>
+      <td id="T_03f5d_row10_col6" class="data row10 col6" >3.599065</td>
+      <td id="T_03f5d_row10_col7" class="data row10 col7" >3.708984</td>
+      <td id="T_03f5d_row10_col8" class="data row10 col8" >0.817629</td>
+      <td id="T_03f5d_row10_col9" class="data row10 col9" >0.835264</td>
+      <td id="T_03f5d_row10_col10" class="data row10 col10" >81.756828</td>
+      <td id="T_03f5d_row10_col11" class="data row10 col11" >78.393089</td>
+      <td id="T_03f5d_row10_col12" class="data row10 col12" >0.955360</td>
+      <td id="T_03f5d_row10_col13" class="data row10 col13" >32.000000</td>
+      <td id="T_03f5d_row10_col14" class="data row10 col14" >50.458115</td>
+      <td id="T_03f5d_row10_col15" class="data row10 col15" >0.792657</td>
+      <td id="T_03f5d_row10_col16" class="data row10 col16" >514.553589</td>
+      <td id="T_03f5d_row10_col17" class="data row10 col17" >6144.000000</td>
+      <td id="T_03f5d_row10_col18" class="data row10 col18" >OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_10/metrics.json</td>
+    </tr>
+    <tr>
+      <th id="T_03f5d_level0_row11" class="row_heading level0 row11" >OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_11/metrics.json</th>
+      <td id="T_03f5d_row11_col0" class="data row11 col0" >5</td>
+      <td id="T_03f5d_row11_col1" class="data row11 col1" >32</td>
+      <td id="T_03f5d_row11_col2" class="data row11 col2" >11</td>
+      <td id="T_03f5d_row11_col3" class="data row11 col3" >0.028953</td>
+      <td id="T_03f5d_row11_col4" class="data row11 col4" >0.173841</td>
+      <td id="T_03f5d_row11_col5" class="data row11 col5" >3.623718</td>
+      <td id="T_03f5d_row11_col6" class="data row11 col6" >3.599065</td>
+      <td id="T_03f5d_row11_col7" class="data row11 col7" >3.783318</td>
+      <td id="T_03f5d_row11_col8" class="data row11 col8" >0.833454</td>
+      <td id="T_03f5d_row11_col9" class="data row11 col9" >0.866197</td>
+      <td id="T_03f5d_row11_col10" class="data row11 col10" >92.906296</td>
+      <td id="T_03f5d_row11_col11" class="data row11 col11" >87.663773</td>
+      <td id="T_03f5d_row11_col12" class="data row11 col12" >0.923381</td>
+      <td id="T_03f5d_row11_col13" class="data row11 col13" >32.000000</td>
+      <td id="T_03f5d_row11_col14" class="data row11 col14" >73.987030</td>
+      <td id="T_03f5d_row11_col15" class="data row11 col15" >0.840599</td>
+      <td id="T_03f5d_row11_col16" class="data row11 col16" >742.957520</td>
+      <td id="T_03f5d_row11_col17" class="data row11 col17" >6144.000000</td>
+      <td id="T_03f5d_row11_col18" class="data row11 col18" >OAI_GPT2Small_v5_32k_resid_delta_mlp/v5_32k_layer_11/metrics.json</td>
+    </tr>
+  </tbody>
+</table>
diff --git a/benchmark_stats.png b/benchmark_stats.png
new file mode 100644
index 0000000000000000000000000000000000000000..73a131c1df718fd5296b8542291d1638b5d1d087
--- /dev/null
+++ b/benchmark_stats.png
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4c06d084693334119a81889b712cccee3f900115be574d2420e6304a50e9b2dc
+size 4548552
diff --git a/v5_32k_layer_0/cfg.json b/v5_32k_layer_0/cfg.json
new file mode 100644
index 0000000000000000000000000000000000000000..381b394dd00b185f70e688a0302fb005e2a701fe
--- /dev/null
+++ b/v5_32k_layer_0/cfg.json
@@ -0,0 +1 @@
+{"architecture": "standard", "d_in": 768, "d_sae": 32768, "dtype": "torch.float32", "device": "cuda", "model_name": "gpt2-small", "hook_name": "blocks.0.hook_mlp_out", "hook_layer": 0, "hook_head_index": null, "activation_fn_str": "topk", "activation_fn_kwargs": {"k": 32}, "apply_b_dec_to_input": true, "finetuning_scaling_factor": false, "sae_lens_training_version": null, "prepend_bos": false, "dataset_path": "Skylion007/openwebtext", "dataset_trust_remote_code": true, "context_size": 64, "normalize_activations": "layer_norm"}
\ No newline at end of file
diff --git a/v5_32k_layer_0/metrics.json b/v5_32k_layer_0/metrics.json
new file mode 100644
index 0000000000000000000000000000000000000000..92f6694bfa8d9640887fabb0ac315b320ea2759d
--- /dev/null
+++ b/v5_32k_layer_0/metrics.json
@@ -0,0 +1 @@
+{"metrics/kl_div_with_sae": 0.0048454091884195805, "metrics/kl_div_with_ablation": 3.094083309173584, "metrics/ce_loss_with_sae": 3.6054646968841553, "metrics/ce_loss_without_sae": 3.599064588546753, "metrics/ce_loss_with_ablation": 6.694648742675781, "metrics/kl_div_score": 0.9984339758486613, "metrics/ce_loss_score": 0.9979325038445924, "metrics/l2_norm_in": 29.933448791503906, "metrics/l2_norm_out": 29.601543426513672, "metrics/l2_ratio": 0.9893707036972046, "metrics/l0": 32.0, "metrics/l1": 71.21115112304688, "metrics/explained_variance": 0.9667970538139343, "metrics/mse": 21.729291915893555, "metrics/total_tokens_evaluated": 6144}
\ No newline at end of file
diff --git a/v5_32k_layer_0/sae_weights.safetensors b/v5_32k_layer_0/sae_weights.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..79d31456524867db78ade6149d5c9745b7621478
--- /dev/null
+++ b/v5_32k_layer_0/sae_weights.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ab7f7cbb78776f97da06167e5297aa3d045a8fc83eda19e91076e4b98ce2934f
+size 201461056
diff --git a/v5_32k_layer_0/sparsity.safetensors b/v5_32k_layer_0/sparsity.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..39584b16c76f37d41202a86426da961dce018f58
--- /dev/null
+++ b/v5_32k_layer_0/sparsity.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ead023e8744163c7b1fd85e383df10bf880155bea44ad396ac7182c5a2890d81
+size 131152
diff --git a/v5_32k_layer_1/cfg.json b/v5_32k_layer_1/cfg.json
new file mode 100644
index 0000000000000000000000000000000000000000..7c8336853af871822a6f78383992846821298141
--- /dev/null
+++ b/v5_32k_layer_1/cfg.json
@@ -0,0 +1 @@
+{"architecture": "standard", "d_in": 768, "d_sae": 32768, "dtype": "torch.float32", "device": "cuda", "model_name": "gpt2-small", "hook_name": "blocks.1.hook_mlp_out", "hook_layer": 1, "hook_head_index": null, "activation_fn_str": "topk", "activation_fn_kwargs": {"k": 32}, "apply_b_dec_to_input": true, "finetuning_scaling_factor": false, "sae_lens_training_version": null, "prepend_bos": false, "dataset_path": "Skylion007/openwebtext", "dataset_trust_remote_code": true, "context_size": 64, "normalize_activations": "layer_norm"}
\ No newline at end of file
diff --git a/v5_32k_layer_1/metrics.json b/v5_32k_layer_1/metrics.json
new file mode 100644
index 0000000000000000000000000000000000000000..4f5df8ef4260f4ac927ab6219c1bb92c3feb8e8c
--- /dev/null
+++ b/v5_32k_layer_1/metrics.json
@@ -0,0 +1 @@
+{"metrics/kl_div_with_sae": 0.006601419299840927, "metrics/kl_div_with_ablation": 0.05105271190404892, "metrics/ce_loss_with_sae": 3.605595588684082, "metrics/ce_loss_without_sae": 3.599064588546753, "metrics/ce_loss_with_ablation": 3.6525371074676514, "metrics/kl_div_score": 0.8706940522131719, "metrics/ce_loss_score": 0.8778624933119316, "metrics/l2_norm_in": 18.973735809326172, "metrics/l2_norm_out": 17.91716766357422, "metrics/l2_ratio": 0.910649299621582, "metrics/l0": 32.0, "metrics/l1": 86.5653305053711, "metrics/explained_variance": 0.8854424357414246, "metrics/mse": 25.637441635131836, "metrics/total_tokens_evaluated": 6144}
\ No newline at end of file
diff --git a/v5_32k_layer_1/sae_weights.safetensors b/v5_32k_layer_1/sae_weights.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..8d800d7d9cfc29d47d26d3e9b18689e6f4a4da1b
--- /dev/null
+++ b/v5_32k_layer_1/sae_weights.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9fe30891436eb0a90f46ebc5850c61ccba4022a2acaca044335f7c740f746dba
+size 201461056
diff --git a/v5_32k_layer_1/sparsity.safetensors b/v5_32k_layer_1/sparsity.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..e4c346e25c019d18d3b4f221245e47505f283adf
--- /dev/null
+++ b/v5_32k_layer_1/sparsity.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:302f9ced1609a7507d856f4d3e8c31bae60f1db043c13595c527427f6c7e7f02
+size 131152
diff --git a/v5_32k_layer_10/cfg.json b/v5_32k_layer_10/cfg.json
new file mode 100644
index 0000000000000000000000000000000000000000..8f9006c0717a8b4bdba41f245920ce9a2a6a37c4
--- /dev/null
+++ b/v5_32k_layer_10/cfg.json
@@ -0,0 +1 @@
+{"architecture": "standard", "d_in": 768, "d_sae": 32768, "dtype": "torch.float32", "device": "cuda", "model_name": "gpt2-small", "hook_name": "blocks.10.hook_mlp_out", "hook_layer": 10, "hook_head_index": null, "activation_fn_str": "topk", "activation_fn_kwargs": {"k": 32}, "apply_b_dec_to_input": true, "finetuning_scaling_factor": false, "sae_lens_training_version": null, "prepend_bos": false, "dataset_path": "Skylion007/openwebtext", "dataset_trust_remote_code": true, "context_size": 64, "normalize_activations": "layer_norm"}
\ No newline at end of file
diff --git a/v5_32k_layer_10/metrics.json b/v5_32k_layer_10/metrics.json
new file mode 100644
index 0000000000000000000000000000000000000000..046e21a4a82fcde83b051121ec69ed15db693a0a
--- /dev/null
+++ b/v5_32k_layer_10/metrics.json
@@ -0,0 +1 @@
+{"metrics/kl_div_with_sae": 0.02311515063047409, "metrics/kl_div_with_ablation": 0.12674781680107117, "metrics/ce_loss_with_sae": 3.6171722412109375, "metrics/ce_loss_without_sae": 3.599064588546753, "metrics/ce_loss_with_ablation": 3.708984136581421, "metrics/kl_div_score": 0.8176288064452188, "metrics/ce_loss_score": 0.8352644912761693, "metrics/l2_norm_in": 81.75682830810547, "metrics/l2_norm_out": 78.3930892944336, "metrics/l2_ratio": 0.9553598165512085, "metrics/l0": 32.0, "metrics/l1": 50.45811462402344, "metrics/explained_variance": 0.7926573753356934, "metrics/mse": 514.5535888671875, "metrics/total_tokens_evaluated": 6144}
\ No newline at end of file
diff --git a/v5_32k_layer_10/sae_weights.safetensors b/v5_32k_layer_10/sae_weights.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..f57b424b0811aae6bae86769432b1baa3e727906
--- /dev/null
+++ b/v5_32k_layer_10/sae_weights.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c676f5187854407e5c6f79d7db14fafe6bf3a662a9883e7fa442effa194d6d04
+size 201461056
diff --git a/v5_32k_layer_10/sparsity.safetensors b/v5_32k_layer_10/sparsity.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..7ff10f5d6fd70f6b8872ef625583f1b775be86b3
--- /dev/null
+++ b/v5_32k_layer_10/sparsity.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7164ca2c04e1c69c8662b4b0a105ee61196163ffbb1ab4eea3e1875644c25895
+size 131152
diff --git a/v5_32k_layer_11/cfg.json b/v5_32k_layer_11/cfg.json
new file mode 100644
index 0000000000000000000000000000000000000000..78d7d7f4004f43b2ed9c7ae638645d96747f526b
--- /dev/null
+++ b/v5_32k_layer_11/cfg.json
@@ -0,0 +1 @@
+{"architecture": "standard", "d_in": 768, "d_sae": 32768, "dtype": "torch.float32", "device": "cuda", "model_name": "gpt2-small", "hook_name": "blocks.11.hook_mlp_out", "hook_layer": 11, "hook_head_index": null, "activation_fn_str": "topk", "activation_fn_kwargs": {"k": 32}, "apply_b_dec_to_input": true, "finetuning_scaling_factor": false, "sae_lens_training_version": null, "prepend_bos": false, "dataset_path": "Skylion007/openwebtext", "dataset_trust_remote_code": true, "context_size": 64, "normalize_activations": "layer_norm"}
\ No newline at end of file
diff --git a/v5_32k_layer_11/metrics.json b/v5_32k_layer_11/metrics.json
new file mode 100644
index 0000000000000000000000000000000000000000..26085daec2e9cf053950140a4abc22c79045e8fe
--- /dev/null
+++ b/v5_32k_layer_11/metrics.json
@@ -0,0 +1 @@
+{"metrics/kl_div_with_sae": 0.028952505439519882, "metrics/kl_div_with_ablation": 0.17384076118469238, "metrics/ce_loss_with_sae": 3.62371826171875, "metrics/ce_loss_without_sae": 3.599064588546753, "metrics/ce_loss_with_ablation": 3.783318281173706, "metrics/kl_div_score": 0.8334538732906256, "metrics/ce_loss_score": 0.8661971284238421, "metrics/l2_norm_in": 92.90629577636719, "metrics/l2_norm_out": 87.66377258300781, "metrics/l2_ratio": 0.9233807325363159, "metrics/l0": 32.0, "metrics/l1": 73.98703002929688, "metrics/explained_variance": 0.840599000453949, "metrics/mse": 742.95751953125, "metrics/total_tokens_evaluated": 6144}
\ No newline at end of file
diff --git a/v5_32k_layer_11/sae_weights.safetensors b/v5_32k_layer_11/sae_weights.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..ff2c31787bd092e92a5d9c5f65abbc5b9ad23768
--- /dev/null
+++ b/v5_32k_layer_11/sae_weights.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:72876f75e313f3785999392dddef0afe7b2dc44f6a0671b007dd1dcd176ee8c5
+size 201461056
diff --git a/v5_32k_layer_11/sparsity.safetensors b/v5_32k_layer_11/sparsity.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..8393b81eb029636d966a82fe9ed8fa1a46735019
--- /dev/null
+++ b/v5_32k_layer_11/sparsity.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:26db3acaed898f49efb23762df7d70847bc97c5da288926681567dc89f8107a9
+size 131152
diff --git a/v5_32k_layer_2/cfg.json b/v5_32k_layer_2/cfg.json
new file mode 100644
index 0000000000000000000000000000000000000000..f86334a54c38510b269e530fdc62935d556e8635
--- /dev/null
+++ b/v5_32k_layer_2/cfg.json
@@ -0,0 +1 @@
+{"architecture": "standard", "d_in": 768, "d_sae": 32768, "dtype": "torch.float32", "device": "cuda", "model_name": "gpt2-small", "hook_name": "blocks.2.hook_mlp_out", "hook_layer": 2, "hook_head_index": null, "activation_fn_str": "topk", "activation_fn_kwargs": {"k": 32}, "apply_b_dec_to_input": true, "finetuning_scaling_factor": false, "sae_lens_training_version": null, "prepend_bos": false, "dataset_path": "Skylion007/openwebtext", "dataset_trust_remote_code": true, "context_size": 64, "normalize_activations": "layer_norm"}
\ No newline at end of file
diff --git a/v5_32k_layer_2/metrics.json b/v5_32k_layer_2/metrics.json
new file mode 100644
index 0000000000000000000000000000000000000000..c8d5210ec8d29dd1b8a559e4de83b4277224e71e
--- /dev/null
+++ b/v5_32k_layer_2/metrics.json
@@ -0,0 +1 @@
+{"metrics/kl_div_with_sae": 0.00936876516789198, "metrics/kl_div_with_ablation": 0.05874736234545708, "metrics/ce_loss_with_sae": 3.601879119873047, "metrics/ce_loss_without_sae": 3.599064588546753, "metrics/ce_loss_with_ablation": 3.6459126472473145, "metrics/kl_div_score": 0.8405244968650671, "metrics/ce_loss_score": 0.9399221354232932, "metrics/l2_norm_in": 49.106536865234375, "metrics/l2_norm_out": 47.64448165893555, "metrics/l2_ratio": 0.8887979388237, "metrics/l0": 31.875, "metrics/l1": 85.81163024902344, "metrics/explained_variance": 0.9745470285415649, "metrics/mse": 37.83729553222656, "metrics/total_tokens_evaluated": 6144}
\ No newline at end of file
diff --git a/v5_32k_layer_2/sae_weights.safetensors b/v5_32k_layer_2/sae_weights.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..25d0aa4a65ed1710bf0f7447b40d00c18d3c7f4a
--- /dev/null
+++ b/v5_32k_layer_2/sae_weights.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:80a546f38807810c98365c13fdf6ba7c883b2f177fec3d79963dd869992f3d9f
+size 201461056
diff --git a/v5_32k_layer_2/sparsity.safetensors b/v5_32k_layer_2/sparsity.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..0222d7530ce7aeb7ec88b3b40c396b4a7fd1e6ec
--- /dev/null
+++ b/v5_32k_layer_2/sparsity.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7f0e1dcea111995b08893a3af42c3de1444f9ac0b12dc28c7df6d88125e51ee8
+size 131152
diff --git a/v5_32k_layer_3/cfg.json b/v5_32k_layer_3/cfg.json
new file mode 100644
index 0000000000000000000000000000000000000000..40125db1b3e4cb725fb1adf6d71b420babc9899d
--- /dev/null
+++ b/v5_32k_layer_3/cfg.json
@@ -0,0 +1 @@
+{"architecture": "standard", "d_in": 768, "d_sae": 32768, "dtype": "torch.float32", "device": "cuda", "model_name": "gpt2-small", "hook_name": "blocks.3.hook_mlp_out", "hook_layer": 3, "hook_head_index": null, "activation_fn_str": "topk", "activation_fn_kwargs": {"k": 32}, "apply_b_dec_to_input": true, "finetuning_scaling_factor": false, "sae_lens_training_version": null, "prepend_bos": false, "dataset_path": "Skylion007/openwebtext", "dataset_trust_remote_code": true, "context_size": 64, "normalize_activations": "layer_norm"}
\ No newline at end of file
diff --git a/v5_32k_layer_3/metrics.json b/v5_32k_layer_3/metrics.json
new file mode 100644
index 0000000000000000000000000000000000000000..8466ca82093a5f945bbf3f2456077bec008fe54d
--- /dev/null
+++ b/v5_32k_layer_3/metrics.json
@@ -0,0 +1 @@
+{"metrics/kl_div_with_sae": 0.010681239888072014, "metrics/kl_div_with_ablation": 0.07059153914451599, "metrics/ce_loss_with_sae": 3.6096014976501465, "metrics/ce_loss_without_sae": 3.599064588546753, "metrics/ce_loss_with_ablation": 3.658677577972412, "metrics/kl_div_score": 0.8486895169376428, "metrics/ce_loss_score": 0.823244745735597, "metrics/l2_norm_in": 16.98731803894043, "metrics/l2_norm_out": 15.157210350036621, "metrics/l2_ratio": 0.8746687173843384, "metrics/l0": 31.91145896911621, "metrics/l1": 85.93821716308594, "metrics/explained_variance": 0.7805342078208923, "metrics/mse": 50.548057556152344, "metrics/total_tokens_evaluated": 6144}
\ No newline at end of file
diff --git a/v5_32k_layer_3/sae_weights.safetensors b/v5_32k_layer_3/sae_weights.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..45cbfe8bfb2785aee2c462d322164eb2627348a9
--- /dev/null
+++ b/v5_32k_layer_3/sae_weights.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:eb781b7a737037ffe78ab1bdca78ba1af47bb297c189ebd9902c60a3fd5f333f
+size 201461056
diff --git a/v5_32k_layer_3/sparsity.safetensors b/v5_32k_layer_3/sparsity.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..dd296034ac5b9f7d58e427b9e592c0747228c1a3
--- /dev/null
+++ b/v5_32k_layer_3/sparsity.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:26543a937a617417c20fe430ff78e4e031b1b941d59cc80b4db96b4ef7c784a5
+size 131152
diff --git a/v5_32k_layer_4/cfg.json b/v5_32k_layer_4/cfg.json
new file mode 100644
index 0000000000000000000000000000000000000000..95cd0ff595aaef2a1d2c882b2b99bd7cd2734063
--- /dev/null
+++ b/v5_32k_layer_4/cfg.json
@@ -0,0 +1 @@
+{"architecture": "standard", "d_in": 768, "d_sae": 32768, "dtype": "torch.float32", "device": "cuda", "model_name": "gpt2-small", "hook_name": "blocks.4.hook_mlp_out", "hook_layer": 4, "hook_head_index": null, "activation_fn_str": "topk", "activation_fn_kwargs": {"k": 32}, "apply_b_dec_to_input": true, "finetuning_scaling_factor": false, "sae_lens_training_version": null, "prepend_bos": false, "dataset_path": "Skylion007/openwebtext", "dataset_trust_remote_code": true, "context_size": 64, "normalize_activations": "layer_norm"}
\ No newline at end of file
diff --git a/v5_32k_layer_4/metrics.json b/v5_32k_layer_4/metrics.json
new file mode 100644
index 0000000000000000000000000000000000000000..b1ed7359b108fd6fa557f632d1bffd79296ca58f
--- /dev/null
+++ b/v5_32k_layer_4/metrics.json
@@ -0,0 +1 @@
+{"metrics/kl_div_with_sae": 0.012658017687499523, "metrics/kl_div_with_ablation": 0.06332532316446304, "metrics/ce_loss_with_sae": 3.611159086227417, "metrics/ce_loss_without_sae": 3.599064588546753, "metrics/ce_loss_with_ablation": 3.6600804328918457, "metrics/kl_div_score": 0.8001112816333331, "metrics/ce_loss_score": 0.8017810322797447, "metrics/l2_norm_in": 17.251985549926758, "metrics/l2_norm_out": 15.012179374694824, "metrics/l2_ratio": 0.8525444865226746, "metrics/l0": 31.95556640625, "metrics/l1": 82.4767074584961, "metrics/explained_variance": 0.7294961810112, "metrics/mse": 63.70451354980469, "metrics/total_tokens_evaluated": 6144}
\ No newline at end of file
diff --git a/v5_32k_layer_4/sae_weights.safetensors b/v5_32k_layer_4/sae_weights.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..347c977e325f0dce2228fc224417a662a80a0234
--- /dev/null
+++ b/v5_32k_layer_4/sae_weights.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:17f173d1919c9c9f53f3a956c96aebe863b0cc90f964c74b13d0056553a09ab3
+size 201461056
diff --git a/v5_32k_layer_4/sparsity.safetensors b/v5_32k_layer_4/sparsity.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..37a19d1a5f035d957e89ed08fec67cf09417717a
--- /dev/null
+++ b/v5_32k_layer_4/sparsity.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cc4ef7f40430139c30bc32dbce3fbb64304191924edf791b404eb896583dec26
+size 131152
diff --git a/v5_32k_layer_5/cfg.json b/v5_32k_layer_5/cfg.json
new file mode 100644
index 0000000000000000000000000000000000000000..f173c114874f719174f0e5f87c5a31ed20ed2739
--- /dev/null
+++ b/v5_32k_layer_5/cfg.json
@@ -0,0 +1 @@
+{"architecture": "standard", "d_in": 768, "d_sae": 32768, "dtype": "torch.float32", "device": "cuda", "model_name": "gpt2-small", "hook_name": "blocks.5.hook_mlp_out", "hook_layer": 5, "hook_head_index": null, "activation_fn_str": "topk", "activation_fn_kwargs": {"k": 32}, "apply_b_dec_to_input": true, "finetuning_scaling_factor": false, "sae_lens_training_version": null, "prepend_bos": false, "dataset_path": "Skylion007/openwebtext", "dataset_trust_remote_code": true, "context_size": 64, "normalize_activations": "layer_norm"}
\ No newline at end of file
diff --git a/v5_32k_layer_5/metrics.json b/v5_32k_layer_5/metrics.json
new file mode 100644
index 0000000000000000000000000000000000000000..02569cc62dfaec794c48669951a6251ecea9d689
--- /dev/null
+++ b/v5_32k_layer_5/metrics.json
@@ -0,0 +1 @@
+{"metrics/kl_div_with_sae": 0.014466611668467522, "metrics/kl_div_with_ablation": 0.06850520521402359, "metrics/ce_loss_with_sae": 3.613976240158081, "metrics/ce_loss_without_sae": 3.599064588546753, "metrics/ce_loss_with_ablation": 3.6693859100341797, "metrics/kl_div_score": 0.7888246356861349, "metrics/ce_loss_score": 0.7879497811486054, "metrics/l2_norm_in": 18.888967514038086, "metrics/l2_norm_out": 16.209918975830078, "metrics/l2_ratio": 0.8484395742416382, "metrics/l0": 32.0, "metrics/l1": 81.43401336669922, "metrics/explained_variance": 0.7174215316772461, "metrics/mse": 87.28172302246094, "metrics/total_tokens_evaluated": 6144}
\ No newline at end of file
diff --git a/v5_32k_layer_5/sae_weights.safetensors b/v5_32k_layer_5/sae_weights.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..5d237d99f80b052399c2435a485ce330b3a8f8bd
--- /dev/null
+++ b/v5_32k_layer_5/sae_weights.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8a5dbd05b4cb8acc8150fa92853ab5c42373121b1bc35bc108ffac1c6cc73ad4
+size 201461056
diff --git a/v5_32k_layer_5/sparsity.safetensors b/v5_32k_layer_5/sparsity.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..b62869cdd95d24da5c9a73efad0201e661f1bbb7
--- /dev/null
+++ b/v5_32k_layer_5/sparsity.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d092024c813ffab3ab07a3d24630235d7d4348f5b4d68b3d737ad926b4d50022
+size 131152
diff --git a/v5_32k_layer_6/cfg.json b/v5_32k_layer_6/cfg.json
new file mode 100644
index 0000000000000000000000000000000000000000..dfba00bfdc745fb90290ec4f5ec515675e0ad5f8
--- /dev/null
+++ b/v5_32k_layer_6/cfg.json
@@ -0,0 +1 @@
+{"architecture": "standard", "d_in": 768, "d_sae": 32768, "dtype": "torch.float32", "device": "cuda", "model_name": "gpt2-small", "hook_name": "blocks.6.hook_mlp_out", "hook_layer": 6, "hook_head_index": null, "activation_fn_str": "topk", "activation_fn_kwargs": {"k": 32}, "apply_b_dec_to_input": true, "finetuning_scaling_factor": false, "sae_lens_training_version": null, "prepend_bos": false, "dataset_path": "Skylion007/openwebtext", "dataset_trust_remote_code": true, "context_size": 64, "normalize_activations": "layer_norm"}
\ No newline at end of file
diff --git a/v5_32k_layer_6/metrics.json b/v5_32k_layer_6/metrics.json
new file mode 100644
index 0000000000000000000000000000000000000000..b837e4501dc6c46692293f8d449a0d4ad89b6e3f
--- /dev/null
+++ b/v5_32k_layer_6/metrics.json
@@ -0,0 +1 @@
+{"metrics/kl_div_with_sae": 0.016599537804722786, "metrics/kl_div_with_ablation": 0.07569437474012375, "metrics/ce_loss_with_sae": 3.6187987327575684, "metrics/ce_loss_without_sae": 3.599064588546753, "metrics/ce_loss_with_ablation": 3.67651629447937, "metrics/kl_div_score": 0.7807031518298047, "metrics/ce_loss_score": 0.7452071071490137, "metrics/l2_norm_in": 21.466564178466797, "metrics/l2_norm_out": 18.40247344970703, "metrics/l2_ratio": 0.852634608745575, "metrics/l0": 32.0, "metrics/l1": 78.82976531982422, "metrics/explained_variance": 0.7063077688217163, "metrics/mse": 117.07249450683594, "metrics/total_tokens_evaluated": 6144}
\ No newline at end of file
diff --git a/v5_32k_layer_6/sae_weights.safetensors b/v5_32k_layer_6/sae_weights.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..9a3345273f4d8201f132f74b14d738263f8d2ee0
--- /dev/null
+++ b/v5_32k_layer_6/sae_weights.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3105f1072fa405f49c442269f43c553fbdc3e6526b6bc0445eaa6c5cd683838b
+size 201461056
diff --git a/v5_32k_layer_6/sparsity.safetensors b/v5_32k_layer_6/sparsity.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..34a246b5100b22b1698b7b7b5da085c9d001d1d7
--- /dev/null
+++ b/v5_32k_layer_6/sparsity.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:71eaa2c4d06116f1c4001fc6c162b791a70bcc72f5abccfe6abb5aa870dfe8d9
+size 131152
diff --git a/v5_32k_layer_7/cfg.json b/v5_32k_layer_7/cfg.json
new file mode 100644
index 0000000000000000000000000000000000000000..404ffa80285d93eef7a758456c02797464775091
--- /dev/null
+++ b/v5_32k_layer_7/cfg.json
@@ -0,0 +1 @@
+{"architecture": "standard", "d_in": 768, "d_sae": 32768, "dtype": "torch.float32", "device": "cuda", "model_name": "gpt2-small", "hook_name": "blocks.7.hook_mlp_out", "hook_layer": 7, "hook_head_index": null, "activation_fn_str": "topk", "activation_fn_kwargs": {"k": 32}, "apply_b_dec_to_input": true, "finetuning_scaling_factor": false, "sae_lens_training_version": null, "prepend_bos": false, "dataset_path": "Skylion007/openwebtext", "dataset_trust_remote_code": true, "context_size": 64, "normalize_activations": "layer_norm"}
\ No newline at end of file
diff --git a/v5_32k_layer_7/metrics.json b/v5_32k_layer_7/metrics.json
new file mode 100644
index 0000000000000000000000000000000000000000..45abcf6f579c73f580e331b5efac217c3fce7718
--- /dev/null
+++ b/v5_32k_layer_7/metrics.json
@@ -0,0 +1 @@
+{"metrics/kl_div_with_sae": 0.017009764909744263, "metrics/kl_div_with_ablation": 0.08048636466264725, "metrics/ce_loss_with_sae": 3.614975929260254, "metrics/ce_loss_without_sae": 3.599064588546753, "metrics/ce_loss_with_ablation": 3.6727118492126465, "metrics/kl_div_score": 0.7886627756013151, "metrics/ce_loss_score": 0.7839520361024154, "metrics/l2_norm_in": 25.444438934326172, "metrics/l2_norm_out": 22.004989624023438, "metrics/l2_ratio": 0.8624889254570007, "metrics/l0": 32.0, "metrics/l1": 76.41993713378906, "metrics/explained_variance": 0.7180025577545166, "metrics/mse": 157.79141235351562, "metrics/total_tokens_evaluated": 6144}
\ No newline at end of file
diff --git a/v5_32k_layer_7/sae_weights.safetensors b/v5_32k_layer_7/sae_weights.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..f2748c77df1111458872d306d93e64aad006dad9
--- /dev/null
+++ b/v5_32k_layer_7/sae_weights.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:062c7f24dd951d7780e3000d052e82f091564685418cd3c07c61717f23616ee3
+size 201461056
diff --git a/v5_32k_layer_7/sparsity.safetensors b/v5_32k_layer_7/sparsity.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..0e2c93b14b99a9a67f311a4f8de39dddd0faf6ba
--- /dev/null
+++ b/v5_32k_layer_7/sparsity.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:64ac63219db967150e3ba33adb0fdbae4328f4c0b3259fc34f6c8617fba230d9
+size 131152
diff --git a/v5_32k_layer_8/cfg.json b/v5_32k_layer_8/cfg.json
new file mode 100644
index 0000000000000000000000000000000000000000..195acde32ef0a52f6994166bb226452a434f691d
--- /dev/null
+++ b/v5_32k_layer_8/cfg.json
@@ -0,0 +1 @@
+{"architecture": "standard", "d_in": 768, "d_sae": 32768, "dtype": "torch.float32", "device": "cuda", "model_name": "gpt2-small", "hook_name": "blocks.8.hook_mlp_out", "hook_layer": 8, "hook_head_index": null, "activation_fn_str": "topk", "activation_fn_kwargs": {"k": 32}, "apply_b_dec_to_input": true, "finetuning_scaling_factor": false, "sae_lens_training_version": null, "prepend_bos": false, "dataset_path": "Skylion007/openwebtext", "dataset_trust_remote_code": true, "context_size": 64, "normalize_activations": "layer_norm"}
\ No newline at end of file
diff --git a/v5_32k_layer_8/metrics.json b/v5_32k_layer_8/metrics.json
new file mode 100644
index 0000000000000000000000000000000000000000..26cec739223c991ad772f439fcf89e76a8009c0e
--- /dev/null
+++ b/v5_32k_layer_8/metrics.json
@@ -0,0 +1 @@
+{"metrics/kl_div_with_sae": 0.01810324750840664, "metrics/kl_div_with_ablation": 0.08732372522354126, "metrics/ce_loss_with_sae": 3.6162450313568115, "metrics/ce_loss_without_sae": 3.599064588546753, "metrics/ce_loss_with_ablation": 3.6803367137908936, "metrics/kl_div_score": 0.792688098657451, "metrics/ce_loss_score": 0.7886059610420089, "metrics/l2_norm_in": 30.250225067138672, "metrics/l2_norm_out": 26.306936264038086, "metrics/l2_ratio": 0.8676368594169617, "metrics/l0": 32.0, "metrics/l1": 76.72819519042969, "metrics/explained_variance": 0.7239155769348145, "metrics/mse": 219.98291015625, "metrics/total_tokens_evaluated": 6144}
\ No newline at end of file
diff --git a/v5_32k_layer_8/sae_weights.safetensors b/v5_32k_layer_8/sae_weights.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..c5ef7a3743e48e088c61d36766863cbcfd9fba01
--- /dev/null
+++ b/v5_32k_layer_8/sae_weights.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:33f7d0d26aabda775fb2fe1fb8ae9e416e0a4cc92e12e491750d595294d320f1
+size 201461056
diff --git a/v5_32k_layer_8/sparsity.safetensors b/v5_32k_layer_8/sparsity.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..79669e4ae2b8ef8cb0222f21228993c316dd18cf
--- /dev/null
+++ b/v5_32k_layer_8/sparsity.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cdd2f0c4c36e44ec05d021122bb7d7435ef8cfefe737018b58f5150987c84fea
+size 131152
diff --git a/v5_32k_layer_9/cfg.json b/v5_32k_layer_9/cfg.json
new file mode 100644
index 0000000000000000000000000000000000000000..bafeddd0c44e9b4432e2d8d4939ccc9726e279a9
--- /dev/null
+++ b/v5_32k_layer_9/cfg.json
@@ -0,0 +1 @@
+{"architecture": "standard", "d_in": 768, "d_sae": 32768, "dtype": "torch.float32", "device": "cuda", "model_name": "gpt2-small", "hook_name": "blocks.9.hook_mlp_out", "hook_layer": 9, "hook_head_index": null, "activation_fn_str": "topk", "activation_fn_kwargs": {"k": 32}, "apply_b_dec_to_input": true, "finetuning_scaling_factor": false, "sae_lens_training_version": null, "prepend_bos": false, "dataset_path": "Skylion007/openwebtext", "dataset_trust_remote_code": true, "context_size": 64, "normalize_activations": "layer_norm"}
\ No newline at end of file
diff --git a/v5_32k_layer_9/metrics.json b/v5_32k_layer_9/metrics.json
new file mode 100644
index 0000000000000000000000000000000000000000..dd800f011003ca1e5c049dfc1955b54ef5e51367
--- /dev/null
+++ b/v5_32k_layer_9/metrics.json
@@ -0,0 +1 @@
+{"metrics/kl_div_with_sae": 0.01999707892537117, "metrics/kl_div_with_ablation": 0.09758877754211426, "metrics/ce_loss_with_sae": 3.6174559593200684, "metrics/ce_loss_without_sae": 3.599064588546753, "metrics/ce_loss_with_ablation": 3.6962451934814453, "metrics/kl_div_score": 0.7950883346526042, "metrics/ce_loss_score": 0.8107506041388108, "metrics/l2_norm_in": 40.192413330078125, "metrics/l2_norm_out": 35.94580841064453, "metrics/l2_ratio": 0.8897998332977295, "metrics/l0": 32.0, "metrics/l1": 72.42656707763672, "metrics/explained_variance": 0.7423521876335144, "metrics/mse": 318.1434326171875, "metrics/total_tokens_evaluated": 6144}
\ No newline at end of file
diff --git a/v5_32k_layer_9/sae_weights.safetensors b/v5_32k_layer_9/sae_weights.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..0fa46e33280ca301c9d76279220f41719a366318
--- /dev/null
+++ b/v5_32k_layer_9/sae_weights.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7e471a86fd93d6c293aa4c9b10cd43abac13cc50ee33ed636628bfc7e36124ab
+size 201461056
diff --git a/v5_32k_layer_9/sparsity.safetensors b/v5_32k_layer_9/sparsity.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..b72edf4e1f057c0ec2296ebfb7316987452662c7
--- /dev/null
+++ b/v5_32k_layer_9/sparsity.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f257554da48ef7ede841b79335fe5147d9fefd79359a1dca7a5212750f1a56a6
+size 131152