jkminder committed on
Commit
e494e49
·
verified ·
1 Parent(s): ca9d101

Upload SAE-difference_cb-gemma-2-2b-L13-k100-lr1e-04-local-shuffling dictionary model

Browse files
Files changed (1) hide show
  1. trainer_config.json +23 -0
trainer_config.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "trainer": {
3
+ "trainer_class": "BatchTopKTrainer",
4
+ "dict_class": "BatchTopKSAE",
5
+ "lr": 0.0001,
6
+ "steps": 97656,
7
+ "auxk_alpha": 0.03125,
8
+ "warmup_steps": 1000,
9
+ "decay_start": null,
10
+ "threshold_beta": 0.999,
11
+ "threshold_start_step": 1000,
12
+ "top_k_aux": 1152,
13
+ "seed": null,
14
+ "activation_dim": 2304,
15
+ "dict_size": 73728,
16
+ "k": 100,
17
+ "device": "cuda",
18
+ "layer": 13,
19
+ "lm_name": "google/gemma-2-2b-it-google/gemma-2-2b",
20
+ "wandb_name": "SAE-difference_cb-gemma-2-2b-L13-k100-lr1e-04-local-shuffling",
21
+ "submodule_name": null
22
+ }
23
+ }