Jbloom's workspace
Runs
21
Name
13 visualized
State
Notes
User
Tags
Created
Runtime
Sweep
b_dec_init_method
cached_activations_path
checkpoint_path
context_size
d_in
d_sae
dataset_path
dead_feature_estimation_method
dead_feature_threshold
dead_feature_window
device
dtype
expansion_factor
feature_reinit_scale
feature_sampling_method
feature_sampling_window
hook_point
hook_point_layer
is_dataset_tokenized
l1_coefficient
log_to_wandb
lr
lr_warm_up_steps
model_name
n_batches_in_buffer
n_checkpoints
resample_batches
run_name
seed
sparsity_loss_type
store_batch_size
tokens_per_buffer
total_training_tokens
train_batch_size
use_cached_activations
use_ghost_grads
wandb_log_frequency
wandb_project
details/current_learning_rate
details/n_training_tokens
losses/ghost_grad_loss
losses/l1_loss
losses/mse_loss
losses/overall_loss
Finished
-
jbloom
2h 34m 9s
-
geometric_median
activations/Skylion007_openwebtext/gpt2-small/blocks.0.hook_resid_pre
checkpoints/y1t51byy
128
768
24576
Skylion007/openwebtext
no_fire
1.0000e-8
5000
cuda
torch.float32
32
0.2
-
1000
blocks.0.hook_resid_pre
0
false
0.00008
true
0.0004
5000
gpt2-small
128
10
1028
24576-L1-8e-05-LR-0.0004-Tokens-3.000e+08
42
-
32
67108864
300000000
4096
false
true
100
mats_sae_training_gpt2_small_resid_pre_5
0.0004
299827200
0.000058032
4.58041
0.000058032
0.0004825
Finished
-
jbloom
3h 6m 3s
-
geometric_median
activations/Skylion007_openwebtext/gpt2-small/blocks.1.hook_resid_pre
checkpoints/mm179kd2
128
768
24576
Skylion007/openwebtext
no_fire
1.0000e-8
5000
cuda
torch.float32
32
0.2
-
1000
blocks.1.hook_resid_pre
1
false
0.00008
true
0.0004
5000
gpt2-small
128
10
1028
24576-L1-8e-05-LR-0.0004-Tokens-3.000e+08
42
-
32
67108864
300000000
4096
false
true
100
mats_sae_training_gpt2_small_resid_pre_5
0.0004
299827200
0.0011548
41.04158
0.0011548
0.005593
Finished
-
jbloom
3h 15m 15s
-
geometric_median
activations/Skylion007_openwebtext/gpt2-small/blocks.2.hook_resid_pre
checkpoints/59dzvtdt
128
768
24576
Skylion007/openwebtext
no_fire
1.0000e-8
5000
cuda
torch.float32
32
0.2
-
1000
blocks.2.hook_resid_pre
2
false
0.00008
true
0.0004
5000
gpt2-small
128
10
1028
24576-L1-8e-05-LR-0.0004-Tokens-3.000e+08
42
-
32
67108864
300000000
4096
false
true
100
mats_sae_training_gpt2_small_resid_pre_5
0.0004
299827200
0.0015013
51.87626
0.0015013
0.0071526
Finished
-
jbloom
2h 59m 2s
-
geometric_median
activations/Skylion007_openwebtext/gpt2-small/blocks.3.hook_resid_pre
checkpoints/0sgl1gqz
128
768
24576
Skylion007/openwebtext
no_fire
1.0000e-8
5000
cuda
torch.float32
32
0.2
-
1000
blocks.3.hook_resid_pre
3
false
0.00008
true
0.0004
5000
gpt2-small
128
10
1028
24576-L1-8e-05-LR-0.0004-Tokens-3.000e+08
42
-
32
67108864
300000000
4096
false
true
100
mats_sae_training_gpt2_small_resid_pre_5
0.0004
299827200
0.0024967
74.96449
0.0024967
0.010991
Finished
-
jbloom
2h 26m 37s
-
geometric_median
activations/Skylion007_openwebtext/gpt2-small/blocks.4.hook_resid_pre
checkpoints/7rzeo1iv
128
768
24576
Skylion007/openwebtext
no_fire
1.0000e-8
5000
cuda
torch.float32
32
0.2
-
1000
blocks.4.hook_resid_pre
4
false
0.00008
true
0.0004
5000
gpt2-small
128
10
1028
24576-L1-8e-05-LR-0.0004-Tokens-3.000e+08
42
-
32
67108864
300000000
4096
false
true
100
mats_sae_training_gpt2_small_resid_pre_5
0.0004
299827200
0.0037705
90.23271
0.0037705
0.01476
Finished
-
jbloom
2h 38m 7s
-
geometric_median
activations/Skylion007_openwebtext/gpt2-small/blocks.5.hook_resid_pre
checkpoints/65ufbyeo
128
768
24576
Skylion007/openwebtext
no_fire
1.0000e-8
5000
cuda
torch.float32
32
0.2
-
1000
blocks.5.hook_resid_pre
5
false
0.00008
true
0.0004
5000
gpt2-small
128
10
1028
24576-L1-8e-05-LR-0.0004-Tokens-3.000e+08
42
-
32
67108864
300000000
4096
false
true
100
mats_sae_training_gpt2_small_resid_pre_5
0.0004
299827200
0.0048513
108.59385
0.0048513
0.01839
Finished
-
jbloom
2h 41m 1s
-
geometric_median
activations/Skylion007_openwebtext/gpt2-small/blocks.6.hook_resid_pre
checkpoints/vjvlfpxa
128
768
24576
Skylion007/openwebtext
no_fire
1.0000e-8
5000
cuda
torch.float32
32
0.2
-
1000
blocks.6.hook_resid_pre
6
false
0.00008
true
0.0004
5000
gpt2-small
128
10
1028
24576-L1-8e-05-LR-0.0004-Tokens-3.000e+08
42
-
32
67108864
300000000
4096
false
true
100
mats_sae_training_gpt2_small_resid_pre_5
0.0004
299827200
0.006327
136.06539
0.006327
0.023539
Finished
-
jbloom
2h 48m 42s
-
geometric_median
activations/Skylion007_openwebtext/gpt2-small/blocks.7.hook_resid_pre
checkpoints/n6gbpj7s
128
768
24576
Skylion007/openwebtext
no_fire
1.0000e-8
5000
cuda
torch.float32
32
0.2
-
1000
blocks.7.hook_resid_pre
7
false
0.00008
true
0.0004
5000
gpt2-small
128
10
1028
24576-L1-8e-05-LR-0.0004-Tokens-3.000e+08
42
-
32
67108864
300000000
4096
false
true
100
mats_sae_training_gpt2_small_resid_pre_5
0.0004
299827200
0.0079579
138.04927
0.0079579
0.02696
Finished
-
jbloom
2h 59m 20s
-
geometric_median
activations/Skylion007_openwebtext/gpt2-small/blocks.8.hook_resid_pre
checkpoints/ut7lhl4q
128
768
24576
Skylion007/openwebtext
no_fire
1.0000e-8
5000
cuda
torch.float32
32
0.2
-
1000
blocks.8.hook_resid_pre
8
false
0.00008
true
0.0004
5000
gpt2-small
128
10
1028
24576-L1-8e-05-LR-0.0004-Tokens-3.000e+08
42
-
32
67108864
300000000
4096
false
true
100
mats_sae_training_gpt2_small_resid_pre_5
0.0004
299827200
0.0098861
167.34963
0.0098861
0.03316
Finished
-
jbloom
3h 12m 36s
-
geometric_median
activations/Skylion007_openwebtext/gpt2-small/blocks.9.hook_resid_pre
checkpoints/wg1xo7vo
128
768
24576
Skylion007/openwebtext
no_fire
1.0000e-8
5000
cuda
torch.float32
32
0.2
-
1000
blocks.9.hook_resid_pre
9
false
0.00008
true
0.0004
5000
gpt2-small
128
10
1028
24576-L1-8e-05-LR-0.0004-Tokens-3.000e+08
42
-
32
67108864
300000000
4096
false
true
100
mats_sae_training_gpt2_small_resid_pre_5
0.0004
299827200
0.012488
198.4199
0.012488
0.040849
Finished
-
jbloom
3h 38m 59s
-
geometric_median
activations/Skylion007_openwebtext/gpt2-small/blocks.10.hook_resid_pre
checkpoints/9vu4ulem
128
768
24576
Skylion007/openwebtext
no_fire
1.0000e-8
5000
cuda
torch.float32
32
0.2
-
1000
blocks.10.hook_resid_pre
10
false
0.00008
true
0.0004
5000
gpt2-small
128
10
1028
24576-L1-8e-05-LR-0.0004-Tokens-3.000e+08
42
-
32
67108864
300000000
4096
false
true
100
mats_sae_training_gpt2_small_resid_pre_5
0.0004
299827200
0
215.111
0.017561
0.03477
Finished
-
jbloom
3h 7m 51s
-
geometric_median
activations/Skylion007_openwebtext/gpt2-small/blocks.11.hook_resid_pre
checkpoints/gf296egd
128
768
24576
Skylion007/openwebtext
no_fire
1.0000e-8
5000
cuda
torch.float32
32
0.2
-
1000
blocks.11.hook_resid_pre
11
false
0.00008
true
0.0004
5000
gpt2-small
128
10
1028
24576-L1-8e-05-LR-0.0004-Tokens-3.000e+08
42
-
32
67108864
300000000
4096
false
true
100
mats_sae_training_gpt2_small_resid_pre_5
0.0004
299827200
0.019196
270.1289
0.019196
0.060002
Finished
-
jbloom
4h 10m 47s
-
geometric_median
activations/Skylion007_openwebtext/gpt2-small/blocks.11.hook_resid_post
checkpoints/ycfyp18l
128
768
24576
Skylion007/openwebtext
no_fire
1.0000e-8
5000
cuda
torch.float32
32
0.2
-
1000
blocks.11.hook_resid_post
11
false
0.00004
true
0.0004
5000
gpt2-small
128
10
1028
24576-L1-4e-05-LR-0.0004-Tokens-3.000e+08
42
-
32
67108864
300000000
4096
false
true
100
mats_sae_training_gpt2_small_resid_pre_5
0.0004
299827200
0
375.40917
0.016677
0.031694
1-13
of 13