Jiayipan's workspace
Runs
3
State
Notes
User
Tags
Created
Runtime
Sweep
base_path
buffer_size
cache_dir
data_parallel
dataset_offset
do_clear_buffer
do_save
huggingface_token
importance_sampling
learning_rate
load_in_4bit
max_decoding_length
num_sequences_per_epoch
num_shots
num_steps_per_epoch
oracle_model
output_path
project_name
reward_model
reward_offset
reward_type
rollout_batch_size
rollout_iterations
rollout_temperature
run_name
save_epochs
single_device
top_p
total_epochs
train_batch_size
use_accelerator
use_wandb
verbose
wandb_key
eval_epoch_rewards_mean
loss_mean
train_epoch_rewards_mean
Killed
-
jiayipan
18h 5m 13s
-
data/harmful_behaviors.csv
100000
./.cache
false
0
true
true
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
false
0.0002
true
32
1
520
10
lmsys/vicuna-7b-v1.3
./outputs
advbench-gpt2-llama2-toxity
meta-llama/Llama-2-7b-chat-hf
50
vllm_bert
256
40
10
debug-trick-v1
1
cuda:0
0.1
150
64
true
true
false
0929e692448f1bc929d71d7e3ece80073c3041e6
0.73498
67.70027
0.66925
Killed
-
jiayipan
1d 12h 38m 35s
-
data/harmful_behaviors.csv
100000
./.cache
false
0
true
true
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
false
0.0002
true
32
1
520
10
lmsys/vicuna-7b-v1.3
./outputs
advbench-gpt2-llama2-toxity
meta-llama/Llama-2-7b-chat-hf
50
vllm_bert
256
40
10
debug
1
cuda:0
0.1
150
64
true
true
false
0929e692448f1bc929d71d7e3ece80073c3041e6
0.045573
39.94793
0.048632
Killed
-
jiayipan
2m 23s
-
data/harmful_behaviors.csv
100000
./.cache
false
0
true
true
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
false
0.0002
true
32
1
520
10
lmsys/vicuna-7b-v1.3
./outputs
advbench-gpt2-llama2-toxity
meta-llama/Llama-2-7b-chat-hf
50
vllm_bert
256
40
10
debug
1
cuda:0
0.1
150
64
true
true
false
0929e692448f1bc929d71d7e3ece80073c3041e6
-
-
-
1-3
of 3