Husein-mesolitica's workspace
Runs
43
Name
43 visualized
State
Notes
User
Tags
Created
Runtime
Sweep
_name_or_path
adafactor
adam_beta1
adam_beta2
adam_epsilon
add_cross_attention
architectures
attention_dropout
auto_find_batch_size
bf16
bf16_full_eval
bos_token_id
chunk_size_feed_forward
dataloader_drop_last
dataloader_num_workers
dataloader_pin_memory
ddp_timeout
debug
deepspeed.bf16.enabled
deepspeed.comms_logger.debug
deepspeed.comms_logger.enabled
deepspeed.fp16.enabled
deepspeed.fp16.hysteresis
deepspeed.fp16.initial_scale_power
deepspeed.fp16.loss_scale
deepspeed.fp16.loss_scale_window
deepspeed.fp16.min_loss_scale
deepspeed.gradient_accumulation_steps
deepspeed.gradient_clipping
deepspeed.optimizer.params.betas
deepspeed.optimizer.params.eps
deepspeed.optimizer.params.lr
deepspeed.optimizer.params.weight_decay
deepspeed.optimizer.type
deepspeed.scheduler.params.total_num_steps
deepspeed.scheduler.params.warmup_max_lr
deepspeed.scheduler.params.warmup_min_lr
deepspeed.scheduler.params.warmup_num_steps
deepspeed.scheduler.type
deepspeed.steps_per_print
deepspeed.train_batch_size
deepspeed.train_micro_batch_size_per_gpu
deepspeed.wall_clock_breakdown
deepspeed.zero_optimization.contiguous_gradients
Crashed
-
husein-mesolitica
1d 2h 35m 5s
-
huseinzol05/dummy-mistral-3b
false
0.9
0.999
1.0000e-8
false
["MistralForCausalLM"]
0
false
true
false
1
0
false
0
true
1800
[]
auto
true
true
auto
2
16
0
1000
1
auto
auto
auto
auto
auto
auto
AdamW
auto
auto
auto
auto
WarmupDecayLR
2000
auto
auto
false
true
Crashed
-
husein-mesolitica
1d 22h 28m 10s
-
huseinzol05/dummy-mistral-3b
false
0.9
0.999
1.0000e-8
false
["MistralForCausalLM"]
0
false
true
false
1
0
false
0
true
1800
[]
auto
true
true
auto
2
16
0
1000
1
auto
auto
auto
auto
auto
auto
AdamW
auto
auto
auto
auto
WarmupDecayLR
2000
auto
auto
false
true
Crashed
-
husein-mesolitica
20h 2m 4s
-
huseinzol05/dummy-mistral-3b
false
0.9
0.999
1.0000e-8
false
["MistralForCausalLM"]
0
false
true
false
1
0
false
0
true
1800
[]
auto
true
true
auto
2
16
0
1000
1
auto
auto
auto
auto
auto
auto
AdamW
auto
auto
auto
auto
WarmupDecayLR
2000
auto
auto
false
true
Crashed
-
husein-mesolitica
1d 4h 21m 36s
-
huseinzol05/dummy-mistral-3b
false
0.9
0.999
1.0000e-8
false
["MistralForCausalLM"]
0
false
true
false
1
0
false
0
true
1800
[]
auto
true
true
auto
2
16
0
1000
1
auto
auto
auto
auto
auto
auto
AdamW
auto
auto
auto
auto
WarmupDecayLR
2000
auto
auto
false
true
Crashed
-
husein-mesolitica
1h 28m 31s
-
huseinzol05/dummy-mistral-3b
false
0.9
0.999
1.0000e-8
false
["MistralForCausalLM"]
0
false
true
false
1
0
false
0
true
1800
[]
auto
true
true
auto
2
16
0
1000
1
auto
auto
auto
auto
auto
auto
AdamW
auto
auto
auto
auto
WarmupDecayLR
2000
auto
auto
false
true
Crashed
-
husein-mesolitica
2d 17h 6m 41s
-
huseinzol05/dummy-mistral-3b
false
0.9
0.999
1.0000e-8
false
["MistralForCausalLM"]
0
false
true
false
1
0
false
0
true
1800
[]
auto
true
true
auto
2
16
0
1000
1
auto
auto
auto
auto
auto
auto
AdamW
auto
auto
auto
auto
WarmupDecayLR
2000
auto
auto
false
true
Crashed
-
husein-mesolitica
9m 30s
-
huseinzol05/dummy-mistral-3b
false
0.9
0.999
1.0000e-8
false
["MistralForCausalLM"]
0
false
true
false
1
0
false
0
true
1800
[]
auto
true
true
auto
2
16
0
1000
1
auto
auto
auto
auto
auto
auto
AdamW
auto
auto
auto
auto
WarmupDecayLR
2000
auto
auto
false
true
Crashed
-
husein-mesolitica
1h 4s
-
huseinzol05/dummy-mistral-3b
false
0.9
0.999
1.0000e-8
false
["MistralForCausalLM"]
0
false
true
false
1
0
false
0
true
1800
[]
auto
true
true
auto
2
16
0
1000
1
auto
auto
auto
auto
auto
auto
AdamW
auto
auto
auto
auto
WarmupDecayLR
2000
auto
auto
false
true
Crashed
-
husein-mesolitica
30m 36s
-
huseinzol05/dummy-mistral-3b
false
0.9
0.999
1.0000e-8
false
["MistralForCausalLM"]
0
false
true
false
1
0
false
0
true
1800
[]
auto
true
true
auto
2
16
0
1000
1
auto
auto
auto
auto
auto
auto
AdamW
auto
auto
auto
auto
WarmupDecayLR
2000
auto
auto
false
true
Crashed
-
husein-mesolitica
1h 35m 31s
-
huseinzol05/dummy-mistral-3b
false
0.9
0.999
1.0000e-8
false
["MistralForCausalLM"]
0
false
true
false
1
0
false
0
true
1800
[]
auto
-
-
auto
2
16
0
1000
1
auto
auto
auto
auto
auto
auto
AdamW
auto
auto
auto
auto
WarmupDecayLR
2000
auto
auto
false
true
Crashed
-
husein-mesolitica
2d 11h 12m 36s
-
huseinzol05/dummy-mistral-3b
false
0.9
0.999
1.0000e-8
false
["MistralForCausalLM"]
0
false
true
false
1
0
false
0
true
1800
[]
auto
-
-
auto
2
16
0
1000
1
auto
auto
auto
auto
auto
auto
AdamW
auto
auto
auto
auto
WarmupDecayLR
2000
auto
auto
false
true
Crashed
-
husein-mesolitica
2h 51m 35s
-
huseinzol05/dummy-mistral-3b
false
0.9
0.999
1.0000e-8
false
["MistralForCausalLM"]
0
false
true
false
1
0
false
0
true
1800
[]
auto
-
-
auto
2
16
0
1000
1
auto
auto
auto
auto
auto
auto
AdamW
auto
auto
auto
auto
WarmupDecayLR
2000
auto
auto
false
true
Crashed
-
husein-mesolitica
3m 23s
-
huseinzol05/dummy-mistral-3b
false
0.9
0.999
1.0000e-8
false
["MistralForCausalLM"]
0
false
true
false
1
0
false
0
true
1800
[]
auto
-
-
auto
2
16
0
1000
1
auto
auto
auto
auto
auto
auto
AdamW
auto
auto
auto
auto
WarmupDecayLR
2000
auto
auto
false
true
Crashed
-
husein-mesolitica
8m 59s
-
huseinzol05/dummy-mistral-3b
false
0.9
0.999
1.0000e-8
false
["MistralForCausalLM"]
0
false
true
false
1
0
false
0
true
1800
[]
auto
-
-
auto
2
16
0
1000
1
auto
auto
auto
auto
auto
auto
AdamW
auto
auto
auto
auto
WarmupDecayLR
2000
auto
auto
false
true
Crashed
-
husein-mesolitica
50m 5s
-
huseinzol05/dummy-mistral-3b
false
0.9
0.999
1.0000e-8
false
["MistralForCausalLM"]
0
false
true
false
1
0
false
0
true
1800
[]
auto
-
-
auto
2
16
0
1000
1
auto
auto
auto
auto
auto
auto
AdamW
auto
auto
auto
auto
WarmupDecayLR
2000
auto
auto
false
true
Crashed
-
husein-mesolitica
2h 53m
-
huseinzol05/dummy-mistral-3b
false
0.9
0.999
1.0000e-8
false
["MistralForCausalLM"]
0
false
true
false
1
0
false
0
true
1800
[]
auto
-
-
auto
2
16
0
1000
1
auto
auto
auto
auto
auto
auto
AdamW
auto
auto
auto
auto
WarmupDecayLR
2000
auto
auto
false
true
Crashed
-
husein-mesolitica
57m
-
huseinzol05/dummy-mistral-3b
false
0.9
0.999
1.0000e-8
false
["MistralForCausalLM"]
0
false
true
false
1
0
false
0
true
1800
[]
auto
-
-
auto
2
16
0
1000
1
auto
auto
auto
auto
auto
auto
AdamW
auto
auto
auto
auto
WarmupDecayLR
2000
auto
auto
false
true
Crashed
-
husein-mesolitica
4h 53m 2s
-
huseinzol05/dummy-mistral-3b
false
0.9
0.999
1.0000e-8
false
["MistralForCausalLM"]
0
false
true
false
1
0
false
0
true
1800
[]
auto
-
-
auto
2
16
0
1000
1
auto
auto
auto
auto
auto
auto
AdamW
auto
auto
auto
auto
WarmupDecayLR
2000
auto
auto
false
true
Crashed
-
husein-mesolitica
39m 1s
-
huseinzol05/dummy-mistral-3b
false
0.9
0.999
1.0000e-8
false
["MistralForCausalLM"]
0
false
true
false
1
0
false
0
true
1800
[]
auto
-
-
auto
2
16
0
1000
1
auto
auto
auto
auto
auto
auto
AdamW
auto
auto
auto
auto
WarmupDecayLR
2000
auto
auto
false
true
Crashed
-
husein-mesolitica
5h 50m 31s
-
huseinzol05/dummy-mistral-3b
false
0.9
0.999
1.0000e-8
false
["MistralForCausalLM"]
0
false
true
false
1
0
false
0
true
1800
[]
auto
-
-
auto
2
16
0
1000
1
auto
auto
auto
auto
auto
auto
AdamW
auto
auto
auto
auto
WarmupDecayLR
2000
auto
auto
false
true
1-20
of 43