abir-hr196 committed (verified)
Commit 00ed9ee · 1 parent: f928c50

Add config-checkpoint.json to saes_sql_interp_bm2_cs1_experiment_4.3_syn=True/k=32

saes_sql_interp_bm2_cs1_experiment_4.3_syn=True/k=32/.ipynb_checkpoints/config-checkpoint.json ADDED
@@ -0,0 +1 @@
+ {"sae": {"expansion_factor": 15, "normalize_decoder": true, "num_latents": 0, "k": 32, "multi_topk": false, "skip_connection": false}, "batch_size": 16, "grad_acc_steps": 1, "micro_acc_steps": 1, "lr": null, "lr_warmup_steps": 1000, "auxk_alpha": 0.0, "dead_feature_threshold": 10000000, "hookpoints": ["model.layers.0.mlp", "model.layers.0.post_attention_layernorm", "model.layers.1.mlp", "model.layers.1.post_attention_layernorm", "model.layers.2.mlp", "model.layers.2.post_attention_layernorm", "model.layers.3.mlp", "model.layers.3.post_attention_layernorm", "model.layers.4.mlp", "model.layers.4.post_attention_layernorm", "model.layers.20.mlp", "model.layers.20.post_attention_layernorm", "model.layers.21.mlp", "model.layers.21.post_attention_layernorm", "model.layers.22.mlp", "model.layers.22.post_attention_layernorm", "model.layers.23.mlp", "model.layers.23.post_attention_layernorm"], "init_seeds": [0], "layers": [], "layer_stride": 1, "transcode": false, "distribute_modules": false, "save_every": 100000, "log_to_wandb": true, "run_name": "saes_sql_interp_bm2_cs1_experiment_4.3_syn=True/k=32", "wandb_log_frequency": 1}