sboughorbel committed on
Commit
fe27587
·
verified ·
1 Parent(s): edd30f0

Upload gemma-2-9b-it-L20-mu4.0e-02-lr1e-04-CrosscoderLoss dictionary model

Browse files
Files changed (1) hide show
  1. trainer_config.json +21 -0
trainer_config.json ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "trainer": {
3
+ "dict_class": "CrossCoder",
4
+ "trainer_class": "CrossCoderTrainer",
5
+ "activation_dim": 3584,
6
+ "dict_size": 114688,
7
+ "lr": 0.0001,
8
+ "l1_penalty": 0.04,
9
+ "warmup_steps": 1000,
10
+ "resample_steps": null,
11
+ "device": "cuda",
12
+ "layer": 20,
13
+ "lm_name": "princeton-nlp/gemma-2-9b-it-SimPO-gemma-2-9b-it",
14
+ "wandb_name": "gemma-2-9b-it-L20-mu4.0e-02-lr1e-04-CrosscoderLoss",
15
+ "submodule_name": null,
16
+ "use_mse_loss": false,
17
+ "code_normalization": "CROSSCODER",
18
+ "code_normalization_alpha_sae": 1.0,
19
+ "code_normalization_alpha_cc": 0.1
20
+ }
21
+ }