Jellywibble's workspace
Runs
28
Name
2 visualized
State
Notes
User
Tags
Created
Runtime
Sweep
_n_gpu
_name_or_path
activation_function
adafactor
adam_beta1
adam_beta2
adam_epsilon
add_cross_attention
architectures
attn_pdrop
bf16
bf16_full_eval
bos_token_id
chunk_size_feed_forward
data_seed
dataloader_drop_last
dataloader_num_workers
dataloader_pin_memory
ddp_bucket_cap_mb
ddp_find_unused_parameters
debug
deepspeed
disable_tqdm
diversity_penalty
do_eval
do_predict
do_sample
do_train
early_stopping
embd_pdrop
encoder_no_repeat_ngram_size
eos_token_id
eval_accumulation_steps
eval_batch_size
eval_delay
eval_steps
evaluation_strategy
fp16
fp16_backend
fp16_full_eval
fp16_opt_level
gradient_accumulation_steps
gradient_checkpointing
greater_is_better
Crashed
jellywibble
8h 24m 1s
-
-
gpt2-medium
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0.1
false
false
50256
0
None
false
12
true
None
None
[]
None
false
0
true
false
false
false
false
0.1
0
50256
None
8
0
183
steps
true
auto
false
O1
1
false
None
Killed
jellywibble
44m 37s
-
-
gpt2-medium
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0.1
false
false
50256
0
None
false
12
true
None
None
[]
None
false
0
true
false
false
false
false
0.1
0
50256
None
8
0
183
steps
true
auto
false
O1
1
false
None
Crashed
jellywibble
26s
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
Failed
jellywibble
22s
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
Finished
jellywibble
1m 26s
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
Finished
jellywibble
9h 2m 13s
-
-
gpt2
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0.1
false
false
50256
0
None
false
12
true
None
None
[]
None
false
0
true
false
false
false
false
0.1
0
50256
None
8
0
3984
steps
true
auto
false
O1
1
false
None
Failed
jellywibble
1m 1s
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
Failed
jellywibble
19s
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
Crashed
jellywibble
21h 32m 50s
-
-
/models/checkpoints/reward_models_v25_start_cp_332032_seed_100_data_170000000/checkpoint-332000
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2ForSequenceClassification"]
0.1
false
false
50256
0
None
false
12
true
None
None
[]
None
false
0
true
false
false
false
false
0.1
0
50256
None
128
0
1660
steps
true
auto
false
O1
1
false
None
Failed
jellywibble
17m 3s
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
Failed
jellywibble
26m 8s
-
-
/models/checkpoints/reward_models_v25_start_cp_332032_seed_100_data_170000000/checkpoint-332000
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2ForSequenceClassification"]
0.1
false
false
50256
0
None
false
12
true
None
None
[]
None
false
0
true
false
false
false
false
0.1
0
50256
None
128
0
1660
steps
true
auto
false
O1
1
false
None
Killed
jellywibble
17s
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
Finished
jellywibble
3d 21h 36m 37s
-
-
/models/checkpoints/reward_models_100_170000000/checkpoint-332032
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2ForSequenceClassification"]
0.1
false
false
50256
0
None
false
12
true
None
None
[]
None
false
0
true
false
false
false
false
0.1
0
50256
None
8
0
1660
steps
true
auto
false
O1
1
false
None
Crashed
jellywibble
4d 13h 35m 37s
-
1
gpt2-xl
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0.1
false
false
50256
0
None
false
12
true
None
None
[]
None
false
0
true
false
false
false
false
0.1
0
50256
None
16
0
26562
steps
true
auto
false
O1
1
false
None
Killed
jellywibble
20m 34s
-
4
gpt2-xl
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0.1
false
false
50256
0
None
false
12
true
None
None
[]
None
false
0
true
false
false
false
false
0.1
0
50256
None
64
0
7
steps
true
auto
false
O1
1
false
None
Killed
jellywibble
45m 42s
-
4
gpt2-xl
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0.1
false
false
50256
0
None
false
12
true
None
None
[]
None
false
0
true
false
false
false
false
0.1
0
50256
None
32
0
7
steps
true
auto
false
O1
1
false
None
Crashed
jellywibble
3d 14h 23m 54s
-
1
gpt2-xl
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0.1
false
false
50256
0
None
false
12
true
None
None
[]
None
false
0
true
false
false
false
false
0.1
0
50256
None
8
0
26562
steps
true
auto
false
O1
1
false
None
Failed
jellywibble
12m 20s
-
1
gpt2-xl
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0.1
false
false
50256
0
None
false
12
true
None
None
[]
None
false
0
true
false
false
false
false
0.1
0
50256
None
8
0
13281
steps
true
auto
false
O1
1
false
None
Killed
jellywibble
3h 50m 46s
-
4
gpt2-xl
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0.1
false
false
50256
0
None
false
12
true
None
None
[]
None
false
0
true
false
false
false
false
0.1
0
50256
None
32
0
132
steps
true
auto
false
O1
1
false
None
Failed
jellywibble
15m 18s
-
4
gpt2-xl
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0.1
false
false
50256
0
None
false
12
true
None
None
[]
None
false
0
true
false
false
false
false
0.1
0
50256
None
32
0
33
steps
true
auto
false
O1
1
false
None
1-20
of 28