Jiayipan's workspace
Runs
48
Name
2 visualized
State
Notes
User
Tags
Created
Runtime
Sweep
adamw_optimizer.b1
adamw_optimizer.b2
adamw_optimizer.bf16_momentum
adamw_optimizer.clip_gradient
adamw_optimizer.end_lr
adamw_optimizer.init_lr
adamw_optimizer.lr
adamw_optimizer.lr_decay_steps
adamw_optimizer.lr_warmup_steps
adamw_optimizer.multiply_by_parameter_scale
adamw_optimizer.weight_decay
checkpointer.float_dtype
checkpointer.save_optimizer_state
dtype
eval_dataset.type
eval_steps
hostname
huggingface_dataset.always_start_with_bos
huggingface_dataset.batch_size
huggingface_dataset.batch_token_dtype
huggingface_dataset.name
huggingface_dataset.path
huggingface_dataset.seq_length
huggingface_dataset.split
huggingface_dataset.streaming
jax_distributed.initialize_jax_distributed
json_dataset.always_start_with_bos
json_dataset.batch_size
json_dataset.example_index_at_start
json_dataset.path
json_dataset.seq_length
json_dataset.start_seek_loc
json_dataset.throughput_average_window_size
json_dataset.tokenizer_parallel_batch_size
json_dataset.tokenizer_parallel_chunk_size
json_dataset.tokenizer_processes
json_dataset.tokens_count_at_start
llama.attn_pdrop
llama.bos_token_id
llama.embd_pdrop
llama.eos_token_id
llama.fcm_max_ratio
llama.fcm_min_ratio
llama.hidden_size
Killed
-
jiayipan
12s
-
0.9
0.95
false
1
0.00003
0
0.0003
25000
2000
false
0.1
bf16
true
bf16
huggingface
0
t1v-n-603b2c58-w-0
false
8
i4
en
c4
1024
train
false
false
false
8
0
1024
0
200
1024
32
1
0
0
0
0
1
0
0
4096
Finished
-
jiayipan
1h 56m 36s
-
0.9
0.95
false
1
0.00003
0
0.0003
25000
2000
false
0.1
bf16
true
bf16
huggingface
0
t1v-n-603b2c58-w-0
false
8
i4
en
c4
1024
train
false
false
false
8
0
1024
0
200
1024
32
1
0
0
0
0
1
0
0
4096
Failed
-
jiayipan
2m 50s
-
0.9
0.95
false
1
0.00003
0
0.0003
25000
2000
false
0.1
bf16
true
bf16
huggingface
0
t1v-n-603b2c58-w-0
false
8
i4
en
c4
1024
train
false
false
false
8
0
1024
0
200
1024
32
1
0
0
0
0
1
0
0
4096
Killed
-
jiayipan
1m 38s
-
0.9
0.95
false
1
0.00003
0
0.0003
25000
2000
false
0.1
bf16
true
bf16
huggingface
0
t1v-n-603b2c58-w-0
false
8
i4
en
c4
1024
train
false
false
false
8
0
1024
0
200
1024
32
1
0
0
0
0
1
0
0
4096
Crashed
-
jiayipan
3m 42s
-
0.9
0.95
false
1
0.00003
0
0.0003
25000
2000
false
0.1
bf16
true
bf16
huggingface
0
t1v-n-603b2c58-w-0
false
8
i4
en
c4
1024
train
false
false
false
8
0
1024
0
200
1024
32
1
0
0
0
0
1
0
0
4096
Crashed
-
jiayipan
31m 16s
-
0.9
0.95
false
1
0.00003
0
0.0003
25000
2000
false
0.1
bf16
true
bf16
huggingface
0
t1v-n-5e66f83e-w-6
false
8
i4
en
c4
1024
train
false
false
false
8
0
1024
0
200
1024
32
1
0
0
0
0
1
0
0
4096
Crashed
-
jiayipan
15m 13s
-
0.9
0.95
false
1
0.00003
0
0.0003
25000
2000
false
0.1
bf16
true
bf16
huggingface
0
t1v-n-5e66f83e-w-6
false
8
i4
en
c4
1024
train
false
false
false
8
0
1024
0
200
1024
32
1
0
0
0
0
1
0
0
4096
Crashed
-
jiayipan
7m 35s
-
0.9
0.95
false
1
0.00003
0
0.0003
25000
2000
false
0.1
bf16
true
bf16
huggingface
0
t1v-n-5e66f83e-w-6
false
8
i4
en
c4
1024
train
false
false
false
8
0
1024
0
200
1024
32
1
0
0
0
0
1
0
0
4096
Failed
-
jiayipan
1d 4h 40m 39s
-
0.9
0.95
false
1
0.00003
0
0.0003
25000
2000
false
0.1
bf16
true
bf16
huggingface
0
t1v-n-7c300196-w-3
false
8
i4
en
c4
1024
train
false
false
false
8
0
1024
0
200
1024
32
1
0
0
0
0
1
0
0
4096
Failed
-
jiayipan
22m 19s
-
0.9
0.95
false
1
0.00003
0
0.0003
25000
2000
false
0.1
bf16
true
bf16
huggingface
0
t1v-n-7c300196-w-3
false
8
i4
en
c4
1024
train
false
false
false
8
0
1024
0
200
1024
32
1
0
0
0
0
1
0
0
4096
Failed
-
jiayipan
20m 13s
-
0.9
0.95
false
1
0.00003
0
0.0003
25000
2000
false
0.1
bf16
true
bf16
huggingface
0
t1v-n-7c300196-w-3
false
8
i4
en
c4
1024
train
false
false
false
8
0
1024
0
200
1024
32
1
0
0
0
0
1
0
0
4096
Failed
-
jiayipan
20m 58s
-
0.9
0.95
false
1
0.00003
0
0.0003
25000
2000
false
0.1
bf16
true
bf16
huggingface
0
t1v-n-7c300196-w-3
false
8
i4
en
c4
1024
train
false
false
false
8
0
1024
0
200
1024
32
1
0
0
0
0
1
0
0
4096
Failed
-
jiayipan
19h 10m 53s
-
0.9
0.95
false
1
0.00003
0
0.0003
25000
2000
false
0.1
bf16
true
bf16
huggingface
0
t1v-n-7c300196-w-3
false
8
i4
en
c4
1024
train
false
false
false
8
0
1024
0
200
1024
32
1
0
0
0
0
1
0
0
4096
Failed
-
jiayipan
1h 26m 14s
-
0.9
0.95
false
1
0.00003
0
0.0003
250000
2000
false
0.1
bf16
true
fp32
huggingface
0
t1v-n-7c300196-w-3
false
8
i4
en
c4
1024
train
false
false
false
8
0
1024
0
200
1024
32
1
0
0
0
0
1
0
0
4096
Failed
-
jiayipan
1h 49m 9s
-
0.9
0.95
false
1
0.00003
0
0.0003
250000
2000
false
0.1
bf16
true
fp32
huggingface
0
t1v-n-7c300196-w-3
false
8
i4
en
c4
1024
train
false
false
false
8
0
1024
0
200
1024
32
1
0
0
0
0
1
0
0
4096
Failed
-
jiayipan
23m 27s
-
0.9
0.95
false
1
0.00003
0
0.0003
250000
2000
false
0.1
bf16
true
fp32
huggingface
0
t1v-n-7c300196-w-3
false
8
i4
en
c4
1024
train
false
false
false
8
0
1024
0
200
1024
32
1
0
0
0
0
1
0
0
4096
Failed
-
jiayipan
22m 8s
-
0.9
0.95
false
1
0.00003
0
0.0003
250000
2000
false
0.1
bf16
true
fp32
huggingface
0
t1v-n-7c300196-w-3
false
8
i4
en
c4
1024
train
false
false
false
8
0
1024
0
200
1024
32
1
0
0
0
0
1
0
0
4096
Crashed
-
jiayipan
6m 32s
-
0.9
0.95
false
1
0.00003
0
0.0003
250000
2000
false
0.1
bf16
true
fp32
huggingface
0
t1v-n-7c300196-w-3
false
8
i4
en
c4
1024
train
false
false
false
8
0
1024
0
200
1024
32
1
0
0
0
0
1
0
0
4096
Crashed
-
jiayipan
4m 42s
-
0.9
0.95
false
1
0.00003
0
0.0003
250000
2000
false
0.1
bf16
true
fp32
huggingface
0
t1v-n-7c300196-w-3
false
8
i4
en
c4
1024
train
false
false
false
8
0
1024
0
200
1024
32
1
0
0
0
0
1
0
0
4096
Failed
-
jiayipan
2m 25s
-
0.9
0.95
false
1
0.00003
0
0.0003
250000
2000
false
0.1
bf16
true
fp32
huggingface
0
t1v-n-7c300196-w-3
false
8
i4
en
c4
1024
train
false
false
false
8
0
1024
0
200
1024
32
1
0
0
0
0
1
0
0
4096
1-20
of 48