Commit
·
9eca29b
1
Parent(s):
68aa047
Added encoder for ssm_output
Browse files- 72.pt +3 -0
- 72_cfg.json +1 -0
72.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:510cefc19cdb560cd8a3497c10e2ae5f5fe5f3a1db339d35a07b4a6f4156347e
|
3 |
+
size 9448168
|
72_cfg.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"num_tokens": 100000, "batch_size": 32, "act_name": "hook_norm", "dict_size": 1536, "l1_coeff": 0.0003, "beta1": 0.9, "beta2": 0.999, "dict_mult": 32, "seq_len": 128, "remove_rare_dir": false, "device": "cuda:0", "enc_dtype": "fp32", "seed": 16, "act_size": 768, "model_batch_size": 32, "num_epochs": 5, "lr": 0.001, "l1_weight": 1e-05, "l2_weight": 1e-05, "log_every": 50, "eval_every": 100, "recons_every": 500, "save_every": 500, "reset_freq_threshold": 3.162277660168379e-06, "wandb_project": "mamba_autoencoder", "wandb_name": null, "encoder_hidden_sizes": [512, 256], "decoder_hidden_sizes": [256, 512], "latent_dim": 64}
|