Stephenxie's workspace
Runs
22
Name
22 visualized
State
Notes
User
Tags
Created
Runtime
Sweep
_name_or_path
accelerator_config.even_batches
accelerator_config.non_blocking
accelerator_config.split_batches
accelerator_config.use_seedable_sampler
activation_offloading
adafactor
adam_beta1
adam_beta2
adam_epsilon
add_cross_attention
architectures
assistant_only_loss
attention_bias
attention_dropout
auto_find_batch_size
average_tokens_across_devices
batch_eval_metrics
batch_size
bf16
bf16_full_eval
chunk_size_feed_forward
dataloader_drop_last
dataloader_num_workers
dataloader_persistent_workers
dataloader_pin_memory
dataset_name
dataset_text_field
ddp_timeout
debug
disable_tqdm
diversity_penalty
do_eval
do_predict
do_sample
do_train
early_stopping
enable_wandb
encoder_no_repeat_ngram_size
eos_token
eos_token_id
eval_accumulation_steps
eval_delay
eval_do_concat_batches
Finished
stephenxie
1m 2s
-
NousResearch/Hermes-4-14B
true
false
false
true
false
false
0.9
0.999
1.0000e-8
false
["Qwen3ForCausalLM"]
false
false
0
false
false
false
2
true
true
0
false
0
false
true
data/training-data/replai.json
text
1800
[]
false
0
true
false
false
false
false
true
0
<EOS_TOKEN>
151645
4
0
true
Finished
stephenxie
40s
-
NousResearch/Hermes-4-14B
true
false
false
true
false
false
0.9
0.999
1.0000e-8
false
["Qwen3ForCausalLM"]
false
false
0
false
false
false
2
true
true
0
false
0
false
true
data/training-data/replai.json
text
1800
[]
false
0
true
false
false
false
false
true
0
<EOS_TOKEN>
151645
4
0
true
Finished
stephenxie
43s
-
NousResearch/Hermes-4-14B
true
false
false
true
false
false
0.9
0.999
1.0000e-8
false
["Qwen3ForCausalLM"]
false
false
0
false
false
false
2
true
true
0
false
0
false
true
data/training-data/replai.json
text
1800
[]
false
0
true
false
false
false
false
true
0
<EOS_TOKEN>
151645
4
0
true
Finished
stephenxie
1m 8s
-
NousResearch/Hermes-4-14B
true
false
false
true
false
false
0.9
0.999
1.0000e-8
false
["Qwen3ForCausalLM"]
false
false
0
false
false
false
2
true
true
0
false
0
false
true
data/training-data/replai.json
text
1800
[]
false
0
true
false
false
false
false
true
0
<EOS_TOKEN>
151645
4
0
true
Finished
stephenxie
1m
-
NousResearch/Hermes-4-14B
true
false
false
true
false
false
0.9
0.999
1.0000e-8
false
["Qwen3ForCausalLM"]
false
false
0
false
false
false
2
true
true
0
false
0
false
true
data/training-data/replai.json
text
1800
[]
false
0
true
false
false
false
false
true
0
<EOS_TOKEN>
151645
4
0
true
Finished
stephenxie
10m 39s
-
NousResearch/Hermes-4-14B
true
false
false
true
false
false
0.9
0.999
1.0000e-8
false
["Qwen3ForCausalLM"]
false
false
0
false
false
false
2
true
true
0
false
0
false
true
data/training-data/replai.json
text
1800
[]
false
0
true
false
false
false
false
true
0
<EOS_TOKEN>
151645
4
0
true
Crashed
stephenxie
8m 31s
-
NousResearch/Hermes-4-14B
true
false
false
true
false
false
0.9
0.999
1.0000e-8
false
["Qwen3ForCausalLM"]
false
false
0
false
false
false
2
true
true
0
false
0
false
true
data/training-data/replai.json
text
1800
[]
false
0
true
false
false
false
false
true
0
<EOS_TOKEN>
151645
4
0
true
Finished
stephenxie
54s
-
NousResearch/Hermes-4-14B
true
false
false
true
false
false
0.9
0.999
1.0000e-8
false
["Qwen3ForCausalLM"]
false
false
0
false
false
false
2
true
true
0
false
0
false
true
data/training-data/replai.json
text
1800
[]
false
0
true
false
false
false
false
true
0
<EOS_TOKEN>
151645
4
0
true
Finished
stephenxie
20m 36s
-
NousResearch/Hermes-4-14B
true
false
false
true
false
false
0.9
0.999
1.0000e-8
false
["Qwen3ForCausalLM"]
false
false
0
false
false
false
2
true
true
0
false
0
false
true
data/training-data/replai.json
text
1800
[]
false
0
true
false
false
false
false
true
0
<EOS_TOKEN>
151645
4
0
true
Finished
stephenxie
3m 30s
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
2
-
-
-
-
-
-
-
data/training-data/replai.json
-
-
-
-
-
-
-
-
-
-
true
-
-
-
-
-
-
Finished
stephenxie
1m 54s
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
2
-
-
-
-
-
-
-
data/training-data/replai.json
-
-
-
-
-
-
-
-
-
-
true
-
-
-
-
-
-
Finished
stephenxie
2m 2s
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
2
-
-
-
-
-
-
-
data/training-data/replai.json
-
-
-
-
-
-
-
-
-
-
true
-
-
-
-
-
-
Finished
stephenxie
1m 41s
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
2
-
-
-
-
-
-
-
data/training-data/replai.json
-
-
-
-
-
-
-
-
-
-
true
-
-
-
-
-
-
Finished
stephenxie
42s
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
2
-
-
-
-
-
-
-
data/training-data/replai.json
-
-
-
-
-
-
-
-
-
-
true
-
-
-
-
-
-
Finished
stephenxie
1m 49s
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
2
-
-
-
-
-
-
-
data/training-data/replai.json
-
-
-
-
-
-
-
-
-
-
true
-
-
-
-
-
-
Finished
stephenxie
2m 14s
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
2
-
-
-
-
-
-
-
data/training-data/replai.json
-
-
-
-
-
-
-
-
-
-
true
-
-
-
-
-
-
Finished
stephenxie
45s
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
2
-
-
-
-
-
-
-
data/training-data/replai.json
-
-
-
-
-
-
-
-
-
-
true
-
-
-
-
-
-
Finished
stephenxie
51s
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
2
-
-
-
-
-
-
-
data/training-data/replai.json
-
-
-
-
-
-
-
-
-
-
true
-
-
-
-
-
-
Finished
stephenxie
1m 38s
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
2
-
-
-
-
-
-
-
data/training-data/replai.json
-
-
-
-
-
-
-
-
-
-
true
-
-
-
-
-
-
Finished
stephenxie
31s
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
2
-
-
-
-
-
-
-
data/training-data/replai.json
-
-
-
-
-
-
-
-
-
-
true
-
-
-
-
-
-
1-20
of 22