diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/config.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1a0da4709fbc711e9a777f1fb794c024e90d8099 --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/config.json @@ -0,0 +1 @@ +{"sae": {"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false}, "batch_size": 16, "grad_acc_steps": 1, "micro_acc_steps": 1, "lr": null, "lr_warmup_steps": 1000, "auxk_alpha": 0.0, "dead_feature_threshold": 10000000, "hookpoints": ["transformer.h.0.attn", "transformer.h.0.mlp", "transformer.h.1.attn", "transformer.h.1.mlp"], "init_seeds": [0], "layers": [], "layer_stride": 1, "transcode": false, "distribute_modules": false, "save_every": 100000, "log_to_wandb": true, "run_name": "saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128", "wandb_log_frequency": 1} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/lr_scheduler.pt b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/lr_scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5441e5cff18f2f6f82f927744aebdaaf855c229 --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/lr_scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afafb111606b64199b463308d054f28acf71d5cca5174e9fd9fce0b0ab0a717c +size 1076 diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/model_config.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/model_config.json new file mode 100644 index 0000000000000000000000000000000000000000..3211e66fdb51668312f422ba73e95615779a92db --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/model_config.json @@ -0,0 +1 @@ +{"model_name": "withmartian/sql_interp_bm1_cs1_experiment_1.10", "dataset_name": "withmartian/cs1_dataset_synonyms", "model_abbrev": "saes_sql_interp_bm1_cs1_experiment_1.10_syn=True"} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/optimizer.pt b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..7695e09ed62b17ec90bc8744270edb20a6eedfe3 --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84ac1e2a4b8279d0b3058c6ca4e4196dba16fd257331c187b67ede2fec3fff5b +size 255767204 diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/state.pt b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/state.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac77326d8ab626246e4bfeec80899465d5c8aa2f --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/state.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a612e8ae5676765040241e0d09a5e743af130e8d444b32987c09e9bf68d244b6 +size 493312 diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/transformer.h.0.attn/cfg.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/transformer.h.0.attn/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..7a5c49940485d2a23606145a39728bf54a47b7ae --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/transformer.h.0.attn/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false, "d_in": 1024} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/transformer.h.0.attn/metrics.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/transformer.h.0.attn/metrics.json new file mode 100644 index 0000000000000000000000000000000000000000..fa3bb2d876857b6f6628db48a3cb08a89da7feee --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/transformer.h.0.attn/metrics.json @@ -0,0 +1 @@ +{"dead_pct": 0.18085938692092896, "fvu": 0.002518476452678442} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/transformer.h.0.attn/sae.safetensors b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/transformer.h.0.attn/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f08956340a39f102d02291d359d6f5c24f129eed --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/transformer.h.0.attn/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa3539bc8788ca8235e06606a9bfecfc247fc329863b899cdfa1130e50ce026f +size 125894984 diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/transformer.h.0.mlp/cfg.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/transformer.h.0.mlp/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..7a5c49940485d2a23606145a39728bf54a47b7ae --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/transformer.h.0.mlp/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false, "d_in": 1024} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/transformer.h.0.mlp/metrics.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/transformer.h.0.mlp/metrics.json new file mode 100644 index 0000000000000000000000000000000000000000..e5e4699acf83ae60d29cc28c8a7de67484dda11b --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/transformer.h.0.mlp/metrics.json @@ -0,0 +1 @@ +{"fvu": 0.019294889643788338, "dead_pct": 0.0} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/transformer.h.0.mlp/sae.safetensors b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/transformer.h.0.mlp/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ab3b7cf68a4beb0291d92db43ae71c562b98da64 --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/transformer.h.0.mlp/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d91b236093cd5c4a8247ed11cede8fb71fe2414783345045688935a710f53e3e +size 125894984 diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/transformer.h.1.attn/cfg.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/transformer.h.1.attn/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..7a5c49940485d2a23606145a39728bf54a47b7ae --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/transformer.h.1.attn/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false, "d_in": 1024} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/transformer.h.1.attn/metrics.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/transformer.h.1.attn/metrics.json new file mode 100644 index 0000000000000000000000000000000000000000..4d6c66fa35447dbb16518ecc05330b4b7f4caa19 --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/transformer.h.1.attn/metrics.json @@ -0,0 +1 @@ +{"dead_pct": 0.22486980259418488, "fvu": 0.020067255944013596} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/transformer.h.1.attn/sae.safetensors b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/transformer.h.1.attn/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e30ae5a1fb04c2783d39e3d79a8b4ab7356d1c08 --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/transformer.h.1.attn/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:266bead4788280baf24dbb0c88d6df9d77da99a2ac1831b010bdf6793c55de5d +size 125894984 diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/transformer.h.1.mlp/cfg.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/transformer.h.1.mlp/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..7a5c49940485d2a23606145a39728bf54a47b7ae --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/transformer.h.1.mlp/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 128, "multi_topk": false, "skip_connection": false, "d_in": 1024} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/transformer.h.1.mlp/metrics.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/transformer.h.1.mlp/metrics.json new file mode 100644 index 0000000000000000000000000000000000000000..8fdb5b779a24ad748798bfdac2803bb4d2088bfb --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/transformer.h.1.mlp/metrics.json @@ -0,0 +1 @@ +{"fvu": 0.0174215380102396, "dead_pct": 0.01484375074505806} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/transformer.h.1.mlp/sae.safetensors b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/transformer.h.1.mlp/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e6d3e4d22e56a20bf26108782e472cf6e4fc118c --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=128/transformer.h.1.mlp/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf7f5911846fdff382b39127c0b731012966fb6261af6d8e128c9cf6799b2455 +size 125894984 diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/config.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/config.json new file mode 100644 index 0000000000000000000000000000000000000000..a973506ae2d35e9076b5a3363e351e68b0e5c603 --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/config.json @@ -0,0 +1 @@ +{"sae": {"expansion_factor": 4, "normalize_decoder": true, "num_latents": 0, "k": 16, "multi_topk": false, "skip_connection": false}, "batch_size": 16, "grad_acc_steps": 1, "micro_acc_steps": 1, "lr": null, "lr_warmup_steps": 1000, "auxk_alpha": 0.0, "dead_feature_threshold": 10000000, "hookpoints": ["transformer.h.0.attn", "transformer.h.0.mlp", "transformer.h.1.attn", "transformer.h.1.mlp"], "init_seeds": [0], "layers": [], "layer_stride": 1, "transcode": false, "distribute_modules": false, "save_every": 100000, "log_to_wandb": true, "run_name": "saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16", "wandb_log_frequency": 1} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/lr_scheduler.pt b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/lr_scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6aa50a7aa478f20cb4ee6fdd0886d4b66d239d0 --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/lr_scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a19ec7a7d99a9517726d577d84860d99635fa1571577af8b6d7ba1c019ae8379 +size 1076 diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/model_config.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/model_config.json new file mode 100644 index 0000000000000000000000000000000000000000..3211e66fdb51668312f422ba73e95615779a92db --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/model_config.json @@ -0,0 +1 @@ +{"model_name": "withmartian/sql_interp_bm1_cs1_experiment_1.10", "dataset_name": "withmartian/cs1_dataset_synonyms", "model_abbrev": "saes_sql_interp_bm1_cs1_experiment_1.10_syn=True"} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/optimizer.pt b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..56026f09d42820e6ea5078db7ff80eb41ef9e1aa --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de72be0333f6c32c60298b6dfe17542989da4009b74f4cac9ce4aa480d1f281b +size 68243108 diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/state.pt b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/state.pt new file mode 100644 index 0000000000000000000000000000000000000000..dab754305730c0f3cedfdf1b42db82db1e741b11 --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/state.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b936b2797e1a1d9d822067e4f761d6771c4063ecfc5d241b7a4f387f66d43472 +size 132864 diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/transformer.h.0.attn/cfg.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/transformer.h.0.attn/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..0d8943661e77283935d0527f13a585ab60ac97bd --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/transformer.h.0.attn/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 4, "normalize_decoder": true, "num_latents": 0, "k": 16, "multi_topk": false, "skip_connection": false, "d_in": 1024} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/transformer.h.0.attn/metrics.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/transformer.h.0.attn/metrics.json new file mode 100644 index 0000000000000000000000000000000000000000..29efbc6f38829bc69ecd18aca57ec922c432dfd0 --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/transformer.h.0.attn/metrics.json @@ -0,0 +1 @@ +{"dead_pct": 0.6455078125, "fvu": 0.019297020509839058} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/transformer.h.0.attn/sae.safetensors b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/transformer.h.0.attn/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3dd81fc3465ca724f9e8c62cb030b176dc5ff634 --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/transformer.h.0.attn/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:363144ece15fafd7b196c17966e2e82861105406f3693a8ce89029f39869c2ce +size 33575240 diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/transformer.h.0.mlp/cfg.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/transformer.h.0.mlp/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..0d8943661e77283935d0527f13a585ab60ac97bd --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/transformer.h.0.mlp/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 4, "normalize_decoder": true, "num_latents": 0, "k": 16, "multi_topk": false, "skip_connection": false, "d_in": 1024} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/transformer.h.0.mlp/metrics.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/transformer.h.0.mlp/metrics.json new file mode 100644 index 0000000000000000000000000000000000000000..2b8d2c799a48251b2a10caf4cc70a1216457031c --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/transformer.h.0.mlp/metrics.json @@ -0,0 +1 @@ +{"dead_pct": 0.245361328125, "fvu": 0.03865286707878113} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/transformer.h.0.mlp/sae.safetensors b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/transformer.h.0.mlp/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4be18771b03942c78b5e8a61f82cef0b9bf5d677 --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/transformer.h.0.mlp/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2442484ede1e6d6e4eda07418e02f832ecd8c04e228a666f4bfaa814bc4d513 +size 33575240 diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/transformer.h.1.attn/cfg.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/transformer.h.1.attn/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..0d8943661e77283935d0527f13a585ab60ac97bd --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/transformer.h.1.attn/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 4, "normalize_decoder": true, "num_latents": 0, "k": 16, "multi_topk": false, "skip_connection": false, "d_in": 1024} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/transformer.h.1.attn/metrics.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/transformer.h.1.attn/metrics.json new file mode 100644 index 0000000000000000000000000000000000000000..d5a605a43d993c986700a549e083c1d78344f812 --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/transformer.h.1.attn/metrics.json @@ -0,0 +1 @@ +{"dead_pct": 0.745849609375, "fvu": 0.05162069573998451} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/transformer.h.1.attn/sae.safetensors b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/transformer.h.1.attn/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3873618001543121fa88650d01b8f5fd9e667dee --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/transformer.h.1.attn/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb4f90210b67c975e41c6db0b94b2e9e4e4e3deea5f702c601352bbed36f36db +size 33575240 diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/transformer.h.1.mlp/cfg.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/transformer.h.1.mlp/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..0d8943661e77283935d0527f13a585ab60ac97bd --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/transformer.h.1.mlp/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 4, "normalize_decoder": true, "num_latents": 0, "k": 16, "multi_topk": false, "skip_connection": false, "d_in": 1024} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/transformer.h.1.mlp/metrics.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/transformer.h.1.mlp/metrics.json new file mode 100644 index 0000000000000000000000000000000000000000..363709d0d78d6a2e33b7f221605fc11edfab1b94 --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/transformer.h.1.mlp/metrics.json @@ -0,0 +1 @@ +{"dead_pct": 0.476806640625, "fvu": 0.040764667093753815} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/transformer.h.1.mlp/sae.safetensors b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/transformer.h.1.mlp/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3eb1e2758ff42f385222712003ceb27fe735ad14 --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=16/transformer.h.1.mlp/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53ab0927cdca8b60d9d2761e93b7fb7b32588ce9b0de577d612117b42c165949 +size 33575240 diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/config.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/config.json new file mode 100644 index 0000000000000000000000000000000000000000..b5e846e5dd7121bc1c5b58d09c5508c63267fe5d --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/config.json @@ -0,0 +1 @@ +{"sae": {"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 256, "multi_topk": false, "skip_connection": false}, "batch_size": 16, "grad_acc_steps": 1, "micro_acc_steps": 1, "lr": null, "lr_warmup_steps": 1000, "auxk_alpha": 0.0, "dead_feature_threshold": 10000000, "hookpoints": ["transformer.h.0.attn", "transformer.h.0.mlp", "transformer.h.1.attn", "transformer.h.1.mlp"], "init_seeds": [0], "layers": [], "layer_stride": 1, "transcode": false, "distribute_modules": false, "save_every": 100000, "log_to_wandb": true, "run_name": "saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256", "wandb_log_frequency": 1} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/lr_scheduler.pt b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/lr_scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..063c9b68a9ee368cab3ee017989901fd5a869ce9 --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/lr_scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd74b3fabf7af5e0d248711a1fa05fe261368df7b69f594226dfd4b050dd08b9 +size 1076 diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/model_config.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/model_config.json new file mode 100644 index 0000000000000000000000000000000000000000..3211e66fdb51668312f422ba73e95615779a92db --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/model_config.json @@ -0,0 +1 @@ +{"model_name": "withmartian/sql_interp_bm1_cs1_experiment_1.10", "dataset_name": "withmartian/cs1_dataset_synonyms", "model_abbrev": "saes_sql_interp_bm1_cs1_experiment_1.10_syn=True"} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/optimizer.pt b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..cea70d461150bab8f373445e5a2144ea4c6c5404 --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76be65f441881d9f9282674951baf9935e9dd6f4890b2c6c30c496d327570800 +size 255767204 diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/state.pt b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/state.pt new file mode 100644 index 0000000000000000000000000000000000000000..edceae6afeb451eac68ad6391f61a011a945e7f1 --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/state.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49a00b004d5cec4cd9f4163f4ba7d5a2db8308446a1d8131959f7589dd485fec +size 493312 diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/transformer.h.0.attn/cfg.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/transformer.h.0.attn/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..ce6546ec1f37867d65385e3e774a35e3a73a064f --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/transformer.h.0.attn/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 256, "multi_topk": false, "skip_connection": false, "d_in": 1024} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/transformer.h.0.attn/metrics.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/transformer.h.0.attn/metrics.json new file mode 100644 index 0000000000000000000000000000000000000000..369629fc99e80685f55b1f05b365982078db7768 --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/transformer.h.0.attn/metrics.json @@ -0,0 +1 @@ +{"dead_pct": 0.21692709624767303, "fvu": 0.0020793573930859566} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/transformer.h.0.attn/sae.safetensors b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/transformer.h.0.attn/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bc236b7a3cfbf57f8ecb89822d050795f5c5df94 --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/transformer.h.0.attn/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50c727d8005ec42bcedd7b4dabfff632e4b66048573c4523d75a91c7519ba66c +size 125894984 diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/transformer.h.0.mlp/cfg.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/transformer.h.0.mlp/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..ce6546ec1f37867d65385e3e774a35e3a73a064f --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/transformer.h.0.mlp/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 256, "multi_topk": false, "skip_connection": false, "d_in": 1024} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/transformer.h.0.mlp/metrics.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/transformer.h.0.mlp/metrics.json new file mode 100644 index 0000000000000000000000000000000000000000..09d01dd63c819fa4a6767a50a4355c429029e862 --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/transformer.h.0.mlp/metrics.json @@ -0,0 +1 @@ +{"fvu": 0.013328234665095806, "dead_pct": 6.510417006211355e-05} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/transformer.h.0.mlp/sae.safetensors b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/transformer.h.0.mlp/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7ea81b75af1c36d4e0c39343ad802b422dedc612 --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/transformer.h.0.mlp/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87727975eeae167af6673f4b690af7383d895949b430b7ab0513881fb7b8a52f +size 125894984 diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/transformer.h.1.attn/cfg.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/transformer.h.1.attn/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..ce6546ec1f37867d65385e3e774a35e3a73a064f --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/transformer.h.1.attn/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 256, "multi_topk": false, "skip_connection": false, "d_in": 1024} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/transformer.h.1.attn/metrics.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/transformer.h.1.attn/metrics.json new file mode 100644 index 0000000000000000000000000000000000000000..7195167f4048551e31754b609072b2e34d204a2f --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/transformer.h.1.attn/metrics.json @@ -0,0 +1 @@ +{"dead_pct": 0.46438804268836975, "fvu": 0.008955885656177998} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/transformer.h.1.attn/sae.safetensors b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/transformer.h.1.attn/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9a3e1d19debaa02490ac4357e406e2ddd0bc4277 --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/transformer.h.1.attn/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46d4315cefb51df71f2e6d7f1d1f2181f7dfec65a025982f4d4ba82bce5f7b4c +size 125894984 diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/transformer.h.1.mlp/cfg.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/transformer.h.1.mlp/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..ce6546ec1f37867d65385e3e774a35e3a73a064f --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/transformer.h.1.mlp/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 256, "multi_topk": false, "skip_connection": false, "d_in": 1024} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/transformer.h.1.mlp/metrics.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/transformer.h.1.mlp/metrics.json new file mode 100644 index 0000000000000000000000000000000000000000..aed9a8312b85fe59585eaac076a0ddd10c104609 --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/transformer.h.1.mlp/metrics.json @@ -0,0 +1 @@ +{"fvu": 0.011177952401340008, "dead_pct": 0.005924479570239782} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/transformer.h.1.mlp/sae.safetensors b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/transformer.h.1.mlp/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..60388626d151158214b629b139a7bee2eb1ca5f2 --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=256/transformer.h.1.mlp/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7348c3aef4fa55e5f248f54ce1c5248aafeefa3b62792fccb575cec124bcab9 +size 125894984 diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/config.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/config.json new file mode 100644 index 0000000000000000000000000000000000000000..f2f30d5317504513aae8894d7b98c4625b59a01a --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/config.json @@ -0,0 +1 @@ +{"sae": {"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 32, "multi_topk": false, "skip_connection": false}, "batch_size": 16, "grad_acc_steps": 1, "micro_acc_steps": 1, "lr": null, "lr_warmup_steps": 1000, "auxk_alpha": 0.0, "dead_feature_threshold": 10000000, "hookpoints": ["transformer.h.0.attn", "transformer.h.0.mlp", "transformer.h.1.attn", "transformer.h.1.mlp"], "init_seeds": [0], "layers": [], "layer_stride": 1, "transcode": false, "distribute_modules": false, "save_every": 100000, "log_to_wandb": true, "run_name": "saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32", "wandb_log_frequency": 1} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/lr_scheduler.pt b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/lr_scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5441e5cff18f2f6f82f927744aebdaaf855c229 --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/lr_scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afafb111606b64199b463308d054f28acf71d5cca5174e9fd9fce0b0ab0a717c +size 1076 diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/model_config.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/model_config.json new file mode 100644 index 0000000000000000000000000000000000000000..3211e66fdb51668312f422ba73e95615779a92db --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/model_config.json @@ -0,0 +1 @@ +{"model_name": "withmartian/sql_interp_bm1_cs1_experiment_1.10", "dataset_name": "withmartian/cs1_dataset_synonyms", "model_abbrev": "saes_sql_interp_bm1_cs1_experiment_1.10_syn=True"} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/optimizer.pt b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..655c87ec370c61440f0d82545b6f992d9366eff1 --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f212c2a479916a885dac58685037d166c78dfccfe04c77545f57a3d38ae2c457 +size 255767204 diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/state.pt b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/state.pt new file mode 100644 index 0000000000000000000000000000000000000000..8dc255adf9ab28888cef875031d1175f236fb53e --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/state.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cdea23be1a3e4c884d1f48a74c9c9346453b4f0f362215b0600d8fed71b3fe0 +size 493312 diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/transformer.h.0.attn/cfg.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/transformer.h.0.attn/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..d613f5a83c724bbbd58146cb4f50add56e3cea9e --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/transformer.h.0.attn/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 32, "multi_topk": false, "skip_connection": false, "d_in": 1024} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/transformer.h.0.attn/metrics.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/transformer.h.0.attn/metrics.json new file mode 100644 index 0000000000000000000000000000000000000000..b7addf2b6d92eca055cb0e27bf1048cff29a3815 --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/transformer.h.0.attn/metrics.json @@ -0,0 +1 @@ +{"dead_pct": 0.644726574420929, "fvu": 0.007164086680859327} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/transformer.h.0.attn/sae.safetensors b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/transformer.h.0.attn/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ba3c220b77a425699f39b00c7fc93c38c5b1db77 --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/transformer.h.0.attn/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:984bb0941a1f4b3d8faa0bf39048225efd4a07d11c6bbce925d7a61f51664437 +size 125894984 diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/transformer.h.0.mlp/cfg.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/transformer.h.0.mlp/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..d613f5a83c724bbbd58146cb4f50add56e3cea9e --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/transformer.h.0.mlp/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 32, "multi_topk": false, "skip_connection": false, "d_in": 1024} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/transformer.h.0.mlp/metrics.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/transformer.h.0.mlp/metrics.json new file mode 100644 index 0000000000000000000000000000000000000000..c60c8c205369b60ca2d3c106c1e7cb04cec01f97 --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/transformer.h.0.mlp/metrics.json @@ -0,0 +1 @@ +{"fvu": 0.026178715750575066, "dead_pct": 0.13066406548023224} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/transformer.h.0.mlp/sae.safetensors b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/transformer.h.0.mlp/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7e57479ce914dbf1281120361d4ff501c77609aa --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/transformer.h.0.mlp/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b10943942d88875d442d6ec33136b79d1983684862b93e6da98735facc1da36 +size 125894984 diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/transformer.h.1.attn/cfg.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/transformer.h.1.attn/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..d613f5a83c724bbbd58146cb4f50add56e3cea9e --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/transformer.h.1.attn/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 32, "multi_topk": false, "skip_connection": false, "d_in": 1024} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/transformer.h.1.attn/metrics.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/transformer.h.1.attn/metrics.json new file mode 100644 index 0000000000000000000000000000000000000000..5875c018d74f5cbd6312e52427dbabca47fcb41b --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/transformer.h.1.attn/metrics.json @@ -0,0 +1 @@ +{"fvu": 0.04023520275950432, "dead_pct": 0.5947917103767395} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/transformer.h.1.attn/sae.safetensors b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/transformer.h.1.attn/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6589940326e24953410d7a3138c97344e7a0f376 --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/transformer.h.1.attn/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ca242d97961235c891d1ac208ce4173bb0f6493e7682af3ff67f15c1021afb7 +size 125894984 diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/transformer.h.1.mlp/cfg.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/transformer.h.1.mlp/cfg.json new file mode 100644 index 0000000000000000000000000000000000000000..d613f5a83c724bbbd58146cb4f50add56e3cea9e --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/transformer.h.1.mlp/cfg.json @@ -0,0 +1 @@ +{"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 32, "multi_topk": false, "skip_connection": false, "d_in": 1024} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/transformer.h.1.mlp/metrics.json b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/transformer.h.1.mlp/metrics.json new file mode 100644 index 0000000000000000000000000000000000000000..6073c41fa9e9f06e99a47d7cb7adf08879237fda --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/transformer.h.1.mlp/metrics.json @@ -0,0 +1 @@ +{"fvu": 0.030149364843964577, "dead_pct": 0.24830730259418488} \ No newline at end of file diff --git a/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/transformer.h.1.mlp/sae.safetensors b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/transformer.h.1.mlp/sae.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..41e4fa99104eba84e716a0aeb7712fffad5240dd --- /dev/null +++ b/saes_sql_interp_bm1_cs1_experiment_1.10_syn=True/k=32/transformer.h.1.mlp/sae.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdaacc41254935c6614fbb282b2f7f91ed8a01cb1fbc86884cae0878d55e8a85 +size 125894984