Jacobcd52's workspace
Runs
52
Name
15 visualized
State
Notes
User
Tags
Created
Runtime
Sweep
act_store_device
activation_fn
adam_beta1
adam_beta2
apply_b_dec_to_input
architecture
autocast
autocast_lm
b_dec_init_method
checkpoint_path
compile_llm
compile_sae
context_size
control_dataset_path
control_mixture
d_in
d_sae
dataset_path
dataset_trust_remote_code
dead_feature_threshold
dead_feature_window
decoder_heuristic_init
decoder_orthogonal_init
device
dtype
eval_every_n_wandb_logs
expansion_factor
feature_sampling_window
finetuning_tokens
gsae_filename_no_suffix
gsae_repo
hook_eval
hook_layer
hook_name
init_encoder_as_decoder_transpose
is_control_dataset_tokenized
is_dataset_tokenized
l1_coefficient
l1_warm_up_steps
log_activations_store_to_wandb
log_optimizer_state_to_wandb
log_to_wandb
lp_norm
lr
Finished
-
jacobcd52
21m 27s
-
cuda
relu
0.9
0.999
true
standard
false
false
zeros
phys_gpt2_ssae_l1_coeff=6.0_expansion=2_control_mixture=0.1_tokens=24576000_lr=0.001/dhujj015
false
false
256
NeelNanda/openwebtext-tokenized-9b
0.1
768
1536
jacobcd52/physics-papers
true
0.0001
1000
true
false
cuda
float32
20
2
1000
0
gpt2_resid_8_gated_gsae
jacobcd52/mats-saes
NOT_IN_USE
8
blocks.8.hook_resid_pre
true
true
false
6
150
false
false
true
1
0.001
Finished
-
jacobcd52
21m 5s
-
cuda
relu
0.9
0.999
true
standard
false
false
zeros
phys_gpt2_ssae_l1_coeff=6.0_expansion=1_control_mixture=0.1_tokens=24576000_lr=0.001/hyeq4pde
false
false
256
NeelNanda/openwebtext-tokenized-9b
0.1
768
768
jacobcd52/physics-papers
true
0.0001
1000
true
false
cuda
float32
20
1
1000
0
gpt2_resid_8_gated_gsae
jacobcd52/mats-saes
NOT_IN_USE
8
blocks.8.hook_resid_pre
true
true
false
6
150
false
false
true
1
0.001
Finished
-
jacobcd52
21m 17s
-
cuda
relu
0.9
0.999
true
standard
false
false
zeros
phys_gpt2_ssae_l1_coeff=6.0_expansion=0.5_control_mixture=0.1_tokens=24576000_lr=0.001/6kkro9pl
false
false
256
NeelNanda/openwebtext-tokenized-9b
0.1
768
384
jacobcd52/physics-papers
true
0.0001
1000
true
false
cuda
float32
20
0.5
1000
0
gpt2_resid_8_gated_gsae
jacobcd52/mats-saes
NOT_IN_USE
8
blocks.8.hook_resid_pre
true
true
false
6
150
false
false
true
1
0.001
Finished
-
jacobcd52
25m 5s
-
cuda
relu
0.9
0.999
true
standard
false
false
zeros
phys_gpt2_ssae_l1_coeff=5.0_expansion=2_control_mixture=0.1_tokens=24576000_lr=0.001/r5aqepvm
false
false
256
NeelNanda/openwebtext-tokenized-9b
0.1
768
1536
jacobcd52/physics-papers
true
0.0001
1000
true
false
cuda
float32
20
2
1000
0
gpt2_resid_8_gated_gsae
jacobcd52/mats-saes
NOT_IN_USE
8
blocks.8.hook_resid_pre
true
true
false
5
150
false
false
true
1
0.001
Finished
-
jacobcd52
22m 21s
-
cuda
relu
0.9
0.999
true
standard
false
false
zeros
phys_gpt2_ssae_l1_coeff=5.0_expansion=1_control_mixture=0.1_tokens=24576000_lr=0.001/xk95ayut
false
false
256
NeelNanda/openwebtext-tokenized-9b
0.1
768
768
jacobcd52/physics-papers
true
0.0001
1000
true
false
cuda
float32
20
1
1000
0
gpt2_resid_8_gated_gsae
jacobcd52/mats-saes
NOT_IN_USE
8
blocks.8.hook_resid_pre
true
true
false
5
150
false
false
true
1
0.001
Finished
-
jacobcd52
22m 30s
-
cuda
relu
0.9
0.999
true
standard
false
false
zeros
phys_gpt2_ssae_l1_coeff=5.0_expansion=0.5_control_mixture=0.1_tokens=24576000_lr=0.001/8lxn3eob
false
false
256
NeelNanda/openwebtext-tokenized-9b
0.1
768
384
jacobcd52/physics-papers
true
0.0001
1000
true
false
cuda
float32
20
0.5
1000
0
gpt2_resid_8_gated_gsae
jacobcd52/mats-saes
NOT_IN_USE
8
blocks.8.hook_resid_pre
true
true
false
5
150
false
false
true
1
0.001
Finished
-
jacobcd52
22m 16s
-
cuda
relu
0.9
0.999
true
standard
false
false
zeros
phys_gpt2_ssae_l1_coeff=4.0_expansion=2_control_mixture=0.1_tokens=24576000_lr=0.001/agzc5nqq
false
false
256
NeelNanda/openwebtext-tokenized-9b
0.1
768
1536
jacobcd52/physics-papers
true
0.0001
1000
true
false
cuda
float32
20
2
1000
0
gpt2_resid_8_gated_gsae
jacobcd52/mats-saes
NOT_IN_USE
8
blocks.8.hook_resid_pre
true
true
false
4
150
false
false
true
1
0.001
Finished
-
jacobcd52
21m 56s
-
cuda
relu
0.9
0.999
true
standard
false
false
zeros
phys_gpt2_ssae_l1_coeff=4.0_expansion=1_control_mixture=0.1_tokens=24576000_lr=0.001/6ht1s8pn
false
false
256
NeelNanda/openwebtext-tokenized-9b
0.1
768
768
jacobcd52/physics-papers
true
0.0001
1000
true
false
cuda
float32
20
1
1000
0
gpt2_resid_8_gated_gsae
jacobcd52/mats-saes
NOT_IN_USE
8
blocks.8.hook_resid_pre
true
true
false
4
150
false
false
true
1
0.001
Finished
-
jacobcd52
22m 3s
-
cuda
relu
0.9
0.999
true
standard
false
false
zeros
phys_gpt2_ssae_l1_coeff=4.0_expansion=0.5_control_mixture=0.1_tokens=24576000_lr=0.001/fr9db29u
false
false
256
NeelNanda/openwebtext-tokenized-9b
0.1
768
384
jacobcd52/physics-papers
true
0.0001
1000
true
false
cuda
float32
20
0.5
1000
0
gpt2_resid_8_gated_gsae
jacobcd52/mats-saes
NOT_IN_USE
8
blocks.8.hook_resid_pre
true
true
false
4
150
false
false
true
1
0.001
Finished
-
jacobcd52
22m 47s
-
cuda
relu
0.9
0.999
true
standard
false
false
zeros
phys_gpt2_ssae_l1_coeff=3.0_expansion=2_control_mixture=0.1_tokens=24576000_lr=0.001/j5la8a8o
false
false
256
NeelNanda/openwebtext-tokenized-9b
0.1
768
1536
jacobcd52/physics-papers
true
0.0001
1000
true
false
cuda
float32
20
2
1000
0
gpt2_resid_8_gated_gsae
jacobcd52/mats-saes
NOT_IN_USE
8
blocks.8.hook_resid_pre
true
true
false
3
150
false
false
true
1
0.001
Finished
-
jacobcd52
22m 19s
-
cuda
relu
0.9
0.999
true
standard
false
false
zeros
phys_gpt2_ssae_l1_coeff=3.0_expansion=1_control_mixture=0.1_tokens=24576000_lr=0.001/rjs1sslg
false
false
256
NeelNanda/openwebtext-tokenized-9b
0.1
768
768
jacobcd52/physics-papers
true
0.0001
1000
true
false
cuda
float32
20
1
1000
0
gpt2_resid_8_gated_gsae
jacobcd52/mats-saes
NOT_IN_USE
8
blocks.8.hook_resid_pre
true
true
false
3
150
false
false
true
1
0.001
Finished
-
jacobcd52
22m 33s
-
cuda
relu
0.9
0.999
true
standard
false
false
zeros
phys_gpt2_ssae_l1_coeff=3.0_expansion=0.5_control_mixture=0.1_tokens=24576000_lr=0.001/q6vav0hb
false
false
256
NeelNanda/openwebtext-tokenized-9b
0.1
768
384
jacobcd52/physics-papers
true
0.0001
1000
true
false
cuda
float32
20
0.5
1000
0
gpt2_resid_8_gated_gsae
jacobcd52/mats-saes
NOT_IN_USE
8
blocks.8.hook_resid_pre
true
true
false
3
150
false
false
true
1
0.001
Finished
-
jacobcd52
22m 53s
-
cuda
relu
0.9
0.999
true
standard
false
false
zeros
phys_gpt2_ssae_l1_coeff=2.0_expansion=2_control_mixture=0.1_tokens=24576000_lr=0.001/o99blwyi
false
false
256
NeelNanda/openwebtext-tokenized-9b
0.1
768
1536
jacobcd52/physics-papers
true
0.0001
1000
true
false
cuda
float32
20
2
1000
0
gpt2_resid_8_gated_gsae
jacobcd52/mats-saes
NOT_IN_USE
8
blocks.8.hook_resid_pre
true
true
false
2
150
false
false
true
1
0.001
Finished
-
jacobcd52
22m 39s
-
cuda
relu
0.9
0.999
true
standard
false
false
zeros
phys_gpt2_ssae_l1_coeff=2.0_expansion=1_control_mixture=0.1_tokens=24576000_lr=0.001/af1h2wgs
false
false
256
NeelNanda/openwebtext-tokenized-9b
0.1
768
768
jacobcd52/physics-papers
true
0.0001
1000
true
false
cuda
float32
20
1
1000
0
gpt2_resid_8_gated_gsae
jacobcd52/mats-saes
NOT_IN_USE
8
blocks.8.hook_resid_pre
true
true
false
2
150
false
false
true
1
0.001
Finished
-
jacobcd52
22m 8s
-
cuda
relu
0.9
0.999
true
standard
false
false
zeros
phys_gpt2_ssae_l1_coeff=2.0_expansion=0.5_control_mixture=0.1_tokens=24576000_lr=0.001/pjhjk1ep
false
false
256
NeelNanda/openwebtext-tokenized-9b
0.1
768
384
jacobcd52/physics-papers
true
0.0001
1000
true
false
cuda
float32
20
0.5
1000
0
gpt2_resid_8_gated_gsae
jacobcd52/mats-saes
NOT_IN_USE
8
blocks.8.hook_resid_pre
true
true
false
2
150
false
false
true
1
0.001
Failed
-
jacobcd52
8m 2s
-
cuda
relu
0.9
0.999
true
standard
false
false
zeros
phys_gpt2_ssae_l1_coeff=2.0_expansion=0.5_control_mixture=0.1_tokens=24576000_lr=0.001/m7ta2klh
false
false
256
NeelNanda/openwebtext-tokenized-9b
0.1
768
384
jacobcd52/physics-papers
true
0.0001
1000
true
false
cuda
float32
20
0.5
1000
0
gpt2_resid_8_gated_gsae
jacobcd52/mats-saes
NOT_IN_USE
8
blocks.8.hook_resid_pre
true
true
false
2
150
false
false
true
1
0.001
Failed
-
jacobcd52
4m 17s
-
cuda
relu
0.9
0.999
true
standard
false
false
zeros
phys_gpt2_ssae_l1_coeff=2.0_expansion=0.5_control_mixture=0.1_tokens=24576000_lr=0.001/vtulol22
false
false
256
NeelNanda/openwebtext-tokenized-9b
0.1
768
384
jacobcd52/physics-papers
true
0.0001
1000
true
false
cuda
float32
1
0.5
1000
0
gpt2_resid_8_gated_gsae
jacobcd52/mats-saes
NOT_IN_USE
8
blocks.8.hook_resid_pre
true
true
false
2
150
false
false
true
1
0.001
Failed
-
jacobcd52
3m 7s
-
cuda
relu
0.9
0.999
true
standard
false
false
zeros
phys_gpt2_ssae_l1_coeff=2.0_expansion=0.5_control_mixture=0.1_tokens=24576000_lr=0.001/heowidny
false
false
256
NeelNanda/openwebtext-tokenized-9b
0.1
768
384
jacobcd52/physics-papers
true
0.0001
1000
true
false
cuda
float32
1
0.5
1000
0
gpt2_resid_8_gated_gsae
jacobcd52/mats-saes
NOT_IN_USE
8
blocks.8.hook_resid_pre
true
true
false
2
150
false
false
true
1
0.001
Finished
-
jacobcd52
15m 24s
-
cuda
relu
0.9
0.999
true
standard
false
false
zeros
phys_gpt2_ssae_l1_coeff=4.0_expansion=2_control_mixture=0.1_tokens=16384000_lr=0.001/xrb4jygi
false
false
256
NeelNanda/openwebtext-tokenized-9b
0.1
768
384
jacobcd52/physics-papers
true
0.0001
1000
true
false
cuda
float32
20
2
1000
0
gpt2_resid_8_gated_gsae
jacobcd52/mats-saes
NOT_IN_USE
8
blocks.8.hook_resid_pre
true
true
false
4
100
false
false
true
1
0.001
Failed
-
jacobcd52
12m 8s
-
cuda
relu
0.9
0.999
true
standard
false
false
zeros
phys_gpt2_ssae_l1_coeff=4.0_expansion=2_control_mixture=0.1_tokens=32768000_lr=0.001/sx9ilmsp
false
false
256
NeelNanda/openwebtext-tokenized-9b
0.1
768
1536
jacobcd52/physics-papers
true
0.0001
1000
true
false
cuda
float32
20
2
1000
0
gpt2_resid_8_gated_gsae
jacobcd52/mats-saes
NOT_IN_USE
8
blocks.8.hook_resid_pre
true
true
false
4
200
false
false
true
1
0.001
1-20
of 52