Mhenrichsen's workspace
Runs
11
Name
1 visualized
State
Notes
User
Tags
Created
Runtime
Sweep
_name_or_path
adafactor
adam_beta1
adam_beta2
adam_epsilon
add_cross_attention
architectures
attention_dropout
auto_find_batch_size
bench_dataset
bench_source_max_len
bench_split
bf16
bf16_full_eval
bos_token_id
chunk_size_feed_forward
dataloader_drop_last
dataloader_num_workers
dataloader_persistent_workers
dataloader_pin_memory
dataloader_prefetch_factor
ddp_timeout
debug
disable_tqdm
diversity_penalty
do_bench_eval
do_eval
do_predict
do_sample
do_train
early_stopping
encoder_no_repeat_ngram_size
eos_token_id
eval_accumulation_steps
eval_delay
eval_sample_packing
eval_steps
evaluation_strategy
fp16
fp16_backend
fp16_full_eval
fp16_opt_level
fsdp
fsdp_config.min_num_params
Finished
mhenrichsen
7d 21h 12m 58s
-
mistralai/Mixtral-8x7B-v0.1
false
0.9
0.95
0.00001
false
["MixtralForCausalLM"]
0
false
pharaouk/dharma-1/dharma_1_mini.json
2048
eval
true
false
1
0
false
8
false
true
4
1800
[]
false
0
false
true
false
false
false
false
0
32000
1
0
true
-
epoch
false
auto
false
O1
[]
0
Failed
mhenrichsen
1h 37m 31s
-
mistralai/Mixtral-8x7B-v0.1
false
0.9
0.95
0.00001
false
["MixtralForCausalLM"]
0
false
pharaouk/dharma-1/dharma_1_mini.json
2048
eval
true
false
1
0
false
8
false
true
4
1800
[]
false
0
false
true
false
false
false
false
0
32000
1
0
true
-
epoch
false
auto
false
O1
[]
0
Finished
mhenrichsen
9m 8s
-
mistralai/Mixtral-8x7B-v0.1
false
0.9
0.95
0.00001
false
["MixtralForCausalLM"]
0
false
pharaouk/dharma-1/dharma_1_mini.json
2048
eval
true
false
1
0
false
8
false
true
4
1800
[]
false
0
false
true
false
false
false
false
0
32000
1
0
true
-
epoch
false
auto
false
O1
[]
0
Failed
mhenrichsen
4m 6s
-
mistralai/Mixtral-8x7B-v0.1
false
0.9
0.95
0.00001
false
["MixtralForCausalLM"]
0
false
pharaouk/dharma-1/dharma_1_mini.json
2048
eval
true
false
1
0
false
8
false
true
4
1800
[]
false
0
false
false
false
false
false
false
0
32000
1
0
true
-
no
false
auto
false
O1
[]
0
Failed
mhenrichsen
10m 41s
-
mistralai/Mixtral-8x7B-v0.1
false
0.9
0.95
0.00001
false
["MixtralForCausalLM"]
0
false
pharaouk/dharma-1/dharma_1_mini.json
2048
eval
true
false
1
0
false
8
false
true
4
1800
[]
false
0
false
true
false
false
false
false
0
32000
1
0
true
0.25
steps
false
auto
false
O1
[]
0
Finished
mhenrichsen
15m 4s
-
mistralai/Mixtral-8x7B-v0.1
false
0.9
0.999
1.0000e-8
false
["MixtralForCausalLM"]
0
false
pharaouk/dharma-1/dharma_1_mini.json
2048
eval
true
false
1
0
false
0
false
true
-
1800
[]
false
0
false
false
false
false
false
false
0
2
2
0
true
-
no
false
auto
false
O1
[]
0
Finished
mhenrichsen
6m 44s
-
mistralai/Mixtral-8x7B-v0.1
false
0.9
0.999
1.0000e-8
false
["MixtralForCausalLM"]
0
false
pharaouk/dharma-1/dharma_1_mini.json
2048
eval
true
false
1
0
false
0
false
true
-
1800
[]
false
0
false
false
false
false
false
false
0
2
2
0
true
-
no
false
auto
false
O1
[]
0
Finished
mhenrichsen
1h 20m 16s
-
mistralai/Mixtral-8x7B-v0.1
false
0.9
0.999
1.0000e-8
false
["MixtralForCausalLM"]
0
false
pharaouk/dharma-1/dharma_1_mini.json
2048
eval
true
false
1
0
false
0
false
true
-
1800
[]
false
0
false
false
false
false
false
false
0
2
2
0
true
-
no
false
auto
false
O1
[]
0
Finished
mhenrichsen
1m 54s
-
mistralai/Mixtral-8x7B-v0.1
false
0.9
0.999
1.0000e-8
false
["MixtralForCausalLM"]
0
false
pharaouk/dharma-1/dharma_1_mini.json
2048
eval
true
false
1
0
false
0
false
true
-
1800
[]
false
0
false
false
false
false
false
false
0
2
2
0
true
-
no
false
auto
false
O1
[]
0
Finished
mhenrichsen
7m 21s
-
mistralai/Mixtral-8x7B-v0.1
false
0.9
0.999
1.0000e-8
false
["MixtralForCausalLM"]
0
false
pharaouk/dharma-1/dharma_1_mini.json
2048
eval
true
false
1
0
false
0
false
true
-
1800
[]
false
0
false
false
false
false
false
false
0
2
2
0
true
-
no
false
auto
false
O1
[]
0
Finished
mhenrichsen
4h 30m 17s
-
mistralai/Mixtral-8x7B-v0.1
false
0.9
0.999
1.0000e-8
false
["MixtralForCausalLM"]
0
false
pharaouk/dharma-1/dharma_1_mini.json
2048
eval
true
false
1
0
false
0
false
true
-
1800
[]
false
0
false
false
false
false
false
false
0
2
1
0
true
-
no
false
auto
false
O1
[]
0
1-11
of 11