Bcs1's workspace
Runs
9
State
Notes
User
Tags
Created
Runtime
Sweep
_name_or_path
activation_function
adafactor
adam_beta1
adam_beta2
adam_epsilon
add_cross_attention
architectures
attn_pdrop
auto_find_batch_size
bf16
bf16_full_eval
bos_token_id
chunk_size_feed_forward
data_seed
dataloader_drop_last
dataloader_num_workers
dataloader_pin_memory
ddp_backend
ddp_broadcast_buffers
ddp_bucket_cap_mb
ddp_find_unused_parameters
ddp_timeout
debug
deepspeed
disable_tqdm
diversity_penalty
do_eval
do_predict
do_sample
do_train
early_stopping
embd_pdrop
encoder_no_repeat_ngram_size
eos_token_id
eval_accumulation_steps
eval_batch_size
eval_delay
eval_steps
evaluation_strategy
fp16
fp16_backend
fp16_full_eval
fp16_opt_level
Finished
-
bcs1
1d 16h 56m 7s
-
output/checkpoint-700/
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0
false
false
false
50256
0
None
false
0
true
None
None
None
None
1800
[]
None
false
0
false
false
false
false
false
0
0
50256
None
8
0
None
no
true
auto
false
O1
Finished
-
bcs1
5h 8m 28s
-
output/checkpoint-500/
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0
false
false
false
50256
0
None
false
0
true
None
None
None
None
1800
[]
None
false
0
false
false
false
false
false
0
0
50256
None
8
0
None
no
true
auto
false
O1
Finished
-
bcs1
10h 25m 51s
-
output/checkpoint-100/
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0
false
false
false
50256
0
None
false
0
true
None
None
None
None
1800
[]
None
false
0
false
false
false
false
false
0
0
50256
None
8
0
None
no
true
auto
false
O1
Finished
-
bcs1
6m 40s
-
output/checkpoint-100/
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0
false
false
false
50256
0
None
false
0
true
None
None
None
None
1800
[]
None
false
0
false
false
false
false
false
0
0
50256
None
8
0
None
no
true
auto
false
O1
Finished
-
bcs1
2h 42m 8s
-
gpt2-medium
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0
false
false
false
50256
0
None
false
0
true
None
None
None
None
1800
[]
None
false
0
false
false
false
false
false
0
0
50256
None
8
0
None
no
true
auto
false
O1
Finished
-
bcs1
5m 7s
-
gpt2-medium
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0
false
false
false
50256
0
None
false
0
true
None
None
None
None
1800
[]
None
false
0
false
false
false
false
false
0
0
50256
None
8
0
None
no
true
auto
false
O1
Finished
-
bcs1
4h 10m 56s
-
gpt2-medium
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0
false
false
false
50256
0
None
false
0
true
None
None
None
None
1800
[]
None
false
0
false
false
false
false
false
0
0
50256
None
8
0
None
no
true
auto
false
O1
Finished
-
bcs1
4h 31m 22s
-
gpt2-medium
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0.1
false
false
false
50256
0
None
false
0
true
None
None
None
None
1800
[]
None
false
0
false
false
false
false
false
0.1
0
50256
None
8
0
None
no
true
auto
false
O1
Finished
-
bcs1
6m 59s
-
gpt2-medium
gelu_new
false
0.9
0.999
1.0000e-8
false
["GPT2LMHeadModel"]
0.1
false
false
false
50256
0
None
false
0
true
None
None
None
None
1800
[]
None
false
0
false
false
false
false
false
0.1
0
50256
None
8
0
None
no
true
auto
false
O1
1-9
of 9