Danbraunai-apollo's workspace
Runs
163
Name
163 visualized
State
Notes
User
Tags
Created
Runtime
Sweep
act_frequency_n_tokens
adam_beta1
batch_size
collect_act_frequency_every_n_samples
collect_output_metrics_every_n_samples
cooldown_samples
effective_batch_size
eval_data.column_name
eval_data.dataset_name
eval_data.is_tokenized
eval_data.n_ctx
eval_data.seed
eval_data.split
eval_data.streaming
eval_data.tokenizer_name
eval_every_n_samples
eval_n_samples
log_every_n_grad_steps
loss.sparsity.coeff
lr
lr_schedule
max_grad_norm
min_lr_factor
n_samples
saes.dict_size_to_input_ratio
saes.sae_positions
save_dir
seed
tlens_model_name
train_data.column_name
train_data.dataset_name
train_data.is_tokenized
train_data.n_ctx
train_data.seed
train_data.split
train_data.streaming
train_data.tokenizer_name
wandb_project
wandb_run_name_prefix
warmup_samples
loss.in_to_orig.hook_positions
loss.in_to_orig.total_coeff
Killed
-
danbraunai-apollo
1m 14s
-
500000
-
20
40000
-
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
-
validation
true
gpt2
40000
500
20
3
0.001
cosine
1
0.1
400000
50
["blocks.4.hook_resid_pre"]
/Users/dan/Documents/code/e2e_sae/e2e_sae/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
-
train
true
gpt2
tinystories-1m-2
20000
-
-
Finished
-
danbraunai-apollo
downstream
1h 15m 2s
500000
-
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
50
0.001
cosine
1
0.1
250000
50
blocks.3.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m-2
e2e-recon_
20000
-
100
Finished
-
danbraunai-apollo
downstream
1h 15m 43s
500000
-
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
100
0.001
cosine
1
0.1
250000
50
blocks.3.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m-2
e2e-recon_
20000
-
100
Finished
-
danbraunai-apollo
downstream
1h 15m 9s
500000
-
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
150
0.001
cosine
1
0.1
250000
50
blocks.3.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m-2
e2e-recon_
20000
-
100
Finished
-
danbraunai-apollo
downstream
1h 15m 33s
500000
-
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
50
0.001
cosine
1
0.1
250000
50
blocks.3.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m-2
e2e-recon_
20000
-
500
Finished
-
danbraunai-apollo
downstream
1h 15m 13s
500000
-
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
100
0.001
cosine
1
0.1
250000
50
blocks.3.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m-2
e2e-recon_
20000
-
500
Finished
-
danbraunai-apollo
downstream
1h 15m 37s
500000
-
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
150
0.001
cosine
1
0.1
250000
50
blocks.3.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m-2
e2e-recon_
20000
-
500
Finished
-
danbraunai-apollo
downstream
1h 14m 49s
500000
-
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
50
0.001
cosine
1
0.1
250000
50
blocks.3.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m-2
e2e-recon_
20000
-
1000
Finished
-
danbraunai-apollo
downstream
1h 14m 58s
500000
-
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
150
0.001
cosine
1
0.1
250000
50
blocks.3.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m-2
e2e-recon_
20000
-
2000
Finished
-
danbraunai-apollo
downstream
1h 15m 11s
500000
-
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
150
0.001
cosine
1
0.1
250000
50
blocks.3.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m-2
e2e-recon_
20000
-
1000
Finished
-
danbraunai-apollo
downstream
1h 15m 13s
500000
-
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
100
0.001
cosine
1
0.1
250000
50
blocks.3.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m-2
e2e-recon_
20000
-
2000
Finished
-
danbraunai-apollo
downstream
1h 15m 6s
500000
-
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
100
0.001
cosine
1
0.1
250000
50
blocks.3.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m-2
e2e-recon_
20000
-
1000
Finished
-
danbraunai-apollo
downstream
1h 14m 58s
500000
-
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
50
0.001
cosine
1
0.1
250000
50
blocks.3.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m-2
e2e-recon_
20000
-
2000
Finished
-
danbraunai-apollo
e2e
2h 3m 39s
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
200
0.001
cosine
1
0.1
450000
100
blocks.6.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m-2
20000
-
-
Finished
-
danbraunai-apollo
e2e
2h 4m 19s
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
100
0.001
cosine
1
0.1
450000
100
blocks.6.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m-2
20000
-
-
Finished
-
danbraunai-apollo
e2e
2h 3m 50s
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
80
0.001
cosine
1
0.1
450000
100
blocks.6.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m-2
20000
-
-
Finished
-
danbraunai-apollo
e2e
2h 3m 55s
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
120
0.001
cosine
1
0.1
450000
100
blocks.6.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m-2
20000
-
-
Finished
-
danbraunai-apollo
1h 40m 4s
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
60
0.001
cosine
-
0.1
450000
50
blocks.6.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m-2
nogradnorm_
20000
-
-
Finished
-
danbraunai-apollo
1h 40m 5s
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
100
0.001
cosine
-
0.1
450000
50
blocks.6.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m-2
nogradnorm_
20000
-
-
Finished
-
danbraunai-apollo
1h 40m 34s
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
10
0.001
cosine
-
0.1
450000
50
blocks.6.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m-2
nogradnorm_
20000
-
-
Finished
-
danbraunai-apollo
1h 40m 25s
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
120
0.001
cosine
-
0.1
450000
50
blocks.6.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m-2
nogradnorm_
20000
-
-
Finished
-
danbraunai-apollo
e2e
2h 26m 25s
-
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
3
0.001
cosine
1
0.1
450000
50
["blocks.0.hook_resid_post"]
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m-2
20000
-
-
Finished
-
danbraunai-apollo
e2e
2h 26m 11s
-
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
35
0.001
cosine
1
0.1
450000
50
["blocks.0.hook_resid_post"]
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m-2
20000
-
-
Finished
-
danbraunai-apollo
e2e
2h 14m 24s
-
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
30
0.001
cosine
1
0.1
450000
50
["blocks.3.hook_resid_post"]
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m-2
20000
-
-
Finished
-
danbraunai-apollo
e2e
2h 14m 4s
-
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
40
0.001
cosine
1
0.1
450000
50
["blocks.3.hook_resid_post"]
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m-2
20000
-
-
Finished
-
danbraunai-apollo
e2e
2h 13m 31s
-
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
50
0.001
cosine
1
0.1
450000
50
["blocks.3.hook_resid_post"]
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m-2
20000
-
-
Finished
-
danbraunai-apollo
e2e
2h 1m 38s
-
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
80
0.001
cosine
1
0.1
450000
50
["blocks.6.hook_resid_post"]
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m-2
20000
-
-
Finished
-
danbraunai-apollo
e2e
2h 1m 6s
-
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
100
0.001
cosine
1
0.1
450000
50
["blocks.6.hook_resid_post"]
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m-2
20000
-
-
Finished
-
danbraunai-apollo
e2e
2h 1m 30s
-
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
200
0.001
cosine
1
0.1
450000
50
["blocks.6.hook_resid_post"]
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m-2
20000
-
-
Finished
-
danbraunai-apollo
2h 1m 9s
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
5
0.0001
cosine
1
0.1
450000
50
blocks.6.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
2h 13m 41s
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
5
0.0001
cosine
1
0.1
450000
50
blocks.3.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
2h 26m 23s
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
5
0.0001
cosine
1
0.1
450000
50
blocks.0.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
2h 1m 16s
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
10
0.0001
cosine
1
0.1
450000
50
blocks.6.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
2h 13m 58s
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
10
0.0001
cosine
1
0.1
450000
50
blocks.3.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
43m 23s
500000
0.9
32
10000
0
0
32
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
0.001
0.01
cosine
1
0.1
400000
50
blocks.6.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
2h 26m 36s
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
10
0.0001
cosine
1
0.1
450000
50
blocks.0.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
2h 1m 17s
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
60
0.0001
cosine
1
0.1
450000
50
blocks.6.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
local
35m 59s
500000
0.9
32
10000
0
0
32
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
0.001
0.01
cosine
1
0.1
400000
50
blocks.3.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
local
29m 11s
500000
0.9
32
10000
0
0
32
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
0.001
0.01
cosine
1
0.1
400000
50
blocks.0.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
local
42m 53s
500000
0.9
32
10000
0
0
32
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
0.004
0.01
cosine
1
0.1
400000
50
blocks.6.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
2h 13m 51s
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
150
0.0001
cosine
1
0.1
450000
50
blocks.3.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
2h 26m 29s
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
60
0.0001
cosine
1
0.1
450000
50
blocks.0.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
2h 14m 23s
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
120
0.0001
cosine
1
0.1
450000
50
blocks.3.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
2h 14m 27s
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
60
0.0001
cosine
1
0.1
450000
50
blocks.3.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
2h 1m 50s
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
120
0.0001
cosine
1
0.1
450000
50
blocks.6.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
2h 26m 36s
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
150
0.0001
cosine
1
0.1
450000
50
blocks.0.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
2h 1m 44s
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
150
0.0001
cosine
1
0.1
450000
50
blocks.6.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
2h 26m 23s
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
120
0.0001
cosine
1
0.1
450000
50
blocks.0.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
local
36m 1s
500000
0.9
32
10000
0
0
32
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
0.004
0.01
cosine
1
0.1
400000
50
blocks.3.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
local
29m 2s
500000
0.9
32
10000
0
0
32
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
0.004
0.01
cosine
1
0.1
400000
50
blocks.0.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
local
43m 5s
500000
0.9
32
10000
0
0
32
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
0.007
0.01
cosine
1
0.1
400000
50
blocks.6.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
local
36m 13s
500000
0.9
32
10000
0
0
32
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
0.007
0.01
cosine
1
0.1
400000
50
blocks.3.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
e2e
2h 1m 8s
-
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
1
0.001
cosine
1
0.1
450000
50
blocks.6.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
local
28m 57s
500000
0.9
32
10000
0
0
32
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
0.007
0.01
cosine
1
0.1
400000
50
blocks.0.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
e2e
2h 14m 9s
-
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
1
0.001
cosine
1
0.1
450000
50
blocks.3.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
e2e
2h 26m 18s
-
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
1
0.001
cosine
1
0.1
450000
50
blocks.0.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
local
43m 44s
500000
0.9
32
10000
0
0
32
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
0.01
0.01
cosine
1
0.1
400000
50
blocks.6.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
local
36m 11s
500000
0.9
32
10000
0
0
32
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
0.01
0.01
cosine
1
0.1
400000
50
blocks.3.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
local
28m 29s
500000
0.9
32
10000
0
0
32
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
0.01
0.01
cosine
1
0.1
400000
50
blocks.0.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
e2e
2h 1m 38s
-
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
5
0.001
cosine
1
0.1
450000
50
blocks.6.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
e2e
2h 14m 11s
-
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
5
0.001
cosine
1
0.1
450000
50
blocks.3.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
e2e
2h 26m 43s
-
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
5
0.001
cosine
1
0.1
450000
50
blocks.0.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
local
42m 35s
500000
0.9
32
10000
0
0
32
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
0.02
0.01
cosine
1
0.1
400000
50
blocks.6.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
e2e
2h 1m 9s
-
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
10
0.001
cosine
1
0.1
450000
50
blocks.6.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
local
36m 9s
500000
0.9
32
10000
0
0
32
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
0.02
0.01
cosine
1
0.1
400000
50
blocks.3.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
local
28m 53s
500000
0.9
32
10000
0
0
32
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
0.02
0.01
cosine
1
0.1
400000
50
blocks.0.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
local
43m 11s
500000
0.9
32
10000
0
0
32
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
0.05
0.01
cosine
1
0.1
400000
50
blocks.6.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
e2e
2h 13m 56s
-
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
10
0.001
cosine
1
0.1
450000
50
blocks.3.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
e2e
2h 26m 40s
-
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
10
0.001
cosine
1
0.1
450000
50
blocks.0.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
e2e
2h 1m 15s
-
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
60
0.001
cosine
1
0.1
450000
50
blocks.6.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
e2e
2h 14m 22s
-
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
60
0.001
cosine
1
0.1
450000
50
blocks.3.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
local
35m 53s
500000
0.9
32
10000
0
0
32
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
0.05
0.01
cosine
1
0.1
400000
50
blocks.3.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
local
28m 52s
500000
0.9
32
10000
0
0
32
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
0.05
0.01
cosine
1
0.1
400000
50
blocks.0.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
local
43m 51s
500000
0.9
32
10000
0
0
32
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
0.08
0.01
cosine
1
0.1
400000
50
blocks.6.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
local
38m 10s
500000
0.9
32
10000
0
0
32
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
0.08
0.01
cosine
1
0.1
400000
50
blocks.3.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
e2e
2h 28m 13s
-
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
120
0.001
cosine
1
0.1
450000
50
blocks.0.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
e2e
2h 28m 15s
-
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
60
0.001
cosine
1
0.1
450000
50
blocks.0.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
e2e
2h 15m 17s
-
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
120
0.001
cosine
1
0.1
450000
50
blocks.3.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
e2e
2h 2m 34s
-
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
120
0.001
cosine
1
0.1
450000
50
blocks.6.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
local
29m 39s
500000
0.9
32
10000
0
0
32
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
0.08
0.01
cosine
1
0.1
400000
50
blocks.0.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
e2e
2h 1m 54s
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
150
0.001
cosine
1
0.1
450000
50
blocks.6.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
e2e
2h 21m 54s
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
150
0.001
cosine
1
0.1
450000
50
blocks.0.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
e2e
2h 21m 54s
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
100
0.001
cosine
1
0.1
450000
50
blocks.0.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
e2e
2h 13m 59s
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
150
0.001
cosine
1
0.1
450000
50
blocks.3.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
e2e
2h 14m 14s
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
100
0.001
cosine
1
0.1
450000
50
blocks.3.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
2h 26m 30s
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
50
0.01
cosine
1
0.1
450000
50
blocks.0.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
2h 1m 49s
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
70
0.01
cosine
1
0.1
450000
50
blocks.6.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
2h 2m
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
50
0.01
cosine
1
0.1
450000
50
blocks.6.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
e2e
2h 13m 45s
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
50
0.01
cosine
1
0.1
450000
50
blocks.3.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
e2e
2h 14m 31s
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
70
0.01
cosine
1
0.1
450000
50
blocks.3.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
2h 26m 48s
500000
0.9
20
10000
0
0
20
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
70
0.01
cosine
1
0.1
450000
50
blocks.0.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
42m 37s
500000
0.9
32
10000
0
0
32
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
0.001
0.01
cosine
1
0.1
400000
20
blocks.6.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
35m 41s
500000
0.9
32
10000
0
0
32
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
0.001
0.01
cosine
1
0.1
400000
20
blocks.3.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
28m 5s
500000
0.9
32
10000
0
0
32
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
0.001
0.01
cosine
1
0.1
400000
20
blocks.0.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
42m 13s
500000
0.9
32
10000
0
0
32
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
0.004
0.01
cosine
1
0.1
400000
20
blocks.6.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
35m 27s
500000
0.9
32
10000
0
0
32
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
0.004
0.01
cosine
1
0.1
400000
20
blocks.3.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
27m 57s
500000
0.9
32
10000
0
0
32
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
0.004
0.01
cosine
1
0.1
400000
20
blocks.0.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
42m 8s
500000
0.9
32
10000
0
0
32
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
0.007
0.01
cosine
1
0.1
400000
20
blocks.6.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
41m 50s
500000
0.9
32
10000
0
0
32
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
0.001
0.015
cosine
1
0.1
400000
5
blocks.6.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
Finished
-
danbraunai-apollo
34m 35s
500000
0.9
32
10000
0
0
32
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
validation
true
gpt2
20000
500
20
0.001
0.015
cosine
1
0.1
400000
5
blocks.3.hook_resid_post
/mnt/ssd-interp/dan/sparsify/sparsify/scripts/train_tlens_saes/out
0
roneneldan/TinyStories-1M
input_ids
apollo-research/roneneldan-TinyStories-tokenizer-gpt2
true
512
0
train
true
gpt2
tinystories-1m_play
20000
-
-
1-100
of 163