Levmckinney's group workspace
Group: pythia-70m-deduped
Name
7 visualized
State
Notes
User
Tags
Created
Runtime
Sweep
constant
data
data.max_length
data.name
data.split
data.text_column
dist
dist.cpu_offload
dist.fsdp
loss
model
model.name
model.revision
model.slow_tokenizer
num_steps
opt
opt.lr_scale
opt.momentum
opt.optimizer
opt.weight_decay
opt.zero
output
per_gpu_batch_size
pre_ln
seed
separate_unembeddings
tokens_per_step
wandb
wandb_upload_checkpoints
bias_only
checkpoint_dir
checkpoint_freq
data.shuffle_seed
dist.nccl_timeout
dist.per_gpu_batch_size
model.precision
opt.warmup_steps
data.dataset_shuffle
data.dataset_shuffle_seed
dist.dataloader_shuffle
w_ce
w_kl
data.max_seq_len
bias_norm/0.ffn
Finished
-
levmckinney
20s
-
false
-
128
["tests/test_data/pile_text.jsonl"]
validation
text
-
false
false
LossChoice.CE
-
EleutherAI/pythia-70m-deduped
main
false
250
-
1
0.9
OptimizerOption.SGD
0.001
false
-
1
false
42
false
262144
smoke-test-1
false
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
Finished
-
levmckinney
50s
-
false
-
128
["tests/test_data/pile_text.jsonl"]
validation
text
-
false
false
LossChoice.CE
-
EleutherAI/pythia-70m-deduped
main
false
250
-
1
0.9
OptimizerOption.SGD
0.001
false
-
1
false
42
false
262144
smoke-test-1
false
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
Killed
-
levmckinney
8m 15s
-
false
-
2048
["val.jsonl"]
validation
text
-
false
false
LossChoice.KL
-
EleutherAI/pythia-70m-deduped
main
false
250
-
1
0.9
OptimizerOption.SGD
0.001
false
-
2
false
42
false
262144
pythia-160m-deduped-single-gpu
false
-
-
-
-
-
-
-
-
-
-
-
-
-
-
0.48285
Finished
-
levmckinney
1h 37m 21s
-
false
-
2048
["val.jsonl"]
validation
text
-
false
false
LossChoice.KL
-
EleutherAI/pythia-70m-deduped
main
false
250
-
1
0.9
OptimizerOption.SGD
0.001
false
-
2
false
42
false
262144
pythia-70m-deduped-single-gpu-no-renormalize
false
-
-
-
-
-
-
-
-
-
-
-
-
-
-
2.31037
Failed
-
levmckinney
8s
-
false
-
2048
["val.jsonl"]
validation
text
-
false
false
LossChoice.KL
-
EleutherAI/pythia-70m-deduped
main
false
250
-
1
0.9
OptimizerOption.SGD
0.001
false
-
8
false
42
false
262144
pythia-70m-deduped-single-gpu-no-renormalize
false
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
Killed
-
levmckinney
18s
-
false
Data(name=['val.jsonl'], split='validation', text_column='text', revision=None)
-
-
-
-
Distributed(fsdp=False, cpu_offload=False)
-
-
LossChoice.CE
Model(name='EleutherAI/pythia-70m-deduped', revision='main', slow_tokenizer=False, tokenizer=None, tokenizer_type=None)
-
-
-
2
Optimizer(weight_decay=0.001, lr_scale=1.0, momentum=0.9, zero=False, optimizer=<OptimizerOption.SGD: 'sgd'>, warmup_steps=None)
-
-
-
-
-
-
1
false
42
false
262144
smoke-test-1
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
Finished
-
levmckinney
10m 56s
-
false
Data(name=['val.jsonl'], split='validation', text_column='text', revision=None)
-
-
-
-
Distributed(fsdp=False, cpu_offload=False)
-
-
LossChoice.CE
Model(name='EleutherAI/pythia-70m-deduped', revision='main', slow_tokenizer=False, tokenizer=None, tokenizer_type=None)
-
-
-
2
Optimizer(weight_decay=0.001, lr_scale=1.0, momentum=0.9, zero=False, optimizer=<OptimizerOption.SGD: 'sgd'>, warmup_steps=None)
-
-
-
-
-
-
1
false
42
false
262144
smoke-test-1
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
0.024574
1-7
of 7