Awni00's workspace
Runs
75
Name
40 visualized
State
Notes
User
Tags
Created
Runtime
Sweep
d_model
decoder_kwargs.activation
decoder_kwargs.causal
decoder_kwargs.dff
decoder_kwargs.dropout_rate
decoder_kwargs.n_heads_abs
decoder_kwargs.n_heads_cross
decoder_kwargs.n_heads_enc
decoder_kwargs.norm_first
decoder_kwargs.rel_mask_diag
encoder_kwargs.activation
encoder_kwargs.causal
encoder_kwargs.dff
encoder_kwargs.dropout_rate
encoder_kwargs.n_heads_abs
encoder_kwargs.n_heads_enc
encoder_kwargs.norm_first
encoder_kwargs.rel_mask_diag
group
in_block_size
input_spec.type
input_spec.vocab_size
loss_ignore_idx
n_layers_dec
n_layers_enc
out_block_size
out_dim
output_spec.type
output_spec.vocab_size
symbol_retrieval
symbol_retrieval_kwargs.dropout
symbol_retrieval_kwargs.model_dim
symbol_retrieval_kwargs.n_heads
symbol_retrieval_kwargs.num_symbols
decoder_kwargs.n_heads_rca
decoder_kwargs.n_heads_sa
decoder_kwargs.rca_disentangled
encoder_kwargs.n_heads_rca
encoder_kwargs.n_heads_sa
encoder_kwargs.rca_disentangled
decoder_kwargs.n_heads
decoder_kwargs.rca_kwargs.use_relative_positional_symbols
decoder_kwargs.rca_type
encoder_kwargs.n_heads
Finished
awni00
11d 20h 15m 43s
-
144
relu
true
288
0.1
-
8
-
false
-
relu
false
288
0.1
-
-
false
-
enc_sa=8; enc_ra=0; dec_sa=8; dec_ra=0; d_cross=8; d=144; el=4; dl=4
161
token
85
0
4
4
31
85
token
85
-
-
-
-
-
-
-
-
-
-
-
8
-
-
8
Finished
awni00
11d 6h 22m 14s
-
144
relu
true
288
0.1
-
8
-
false
-
relu
false
288
0.1
-
-
false
-
enc_sa=8; enc_ra=0; dec_sa=8; dec_ra=0; d_cross=8; d=144; el=3; dl=3
161
token
85
0
3
3
31
85
token
85
-
-
-
-
-
-
-
-
-
-
-
8
-
-
8
Crashed
awni00
13d 22h 34m 15s
-
128
relu
true
256
0.1
-
8
-
false
-
relu
false
256
0.1
-
-
false
-
enc_sa=4; enc_ra=4; dec_sa=8; dec_ra=0; d_cross=8; d=128; el=4; dl=4
161
token
85
0
4
4
31
85
token
85
position_relative
-
-
-
-
-
8
-
-
4
-
-
-
-
-
Crashed
awni00
13d 13h 21m 30s
-
128
relu
true
256
0.1
-
8
-
false
-
relu
false
256
0.1
-
-
false
-
enc_sa=4; enc_ra=4; dec_sa=4; dec_ra=4; d_cross=8; d=128; el=4; dl=4
161
token
85
0
4
4
31
85
token
85
position_relative
-
-
-
-
-
4
-
-
4
-
-
-
-
-
Crashed
awni00
12d 18h 24m 14s
-
128
relu
true
256
0.1
-
8
-
false
-
relu
false
256
0.1
-
-
false
-
enc_sa=4; enc_ra=4; dec_sa=8; dec_ra=0; d_cross=8; d=128; el=3; dl=3
161
token
85
0
3
3
31
85
token
85
position_relative
-
-
-
-
-
8
-
-
4
-
-
-
-
-
Finished
awni00
12d 11h 52m 52s
-
128
relu
true
256
0.1
-
8
-
false
-
relu
false
256
0.1
-
-
false
-
enc_sa=4; enc_ra=4; dec_sa=4; dec_ra=4; d_cross=8; d=128; el=3; dl=3
161
token
85
0
3
3
31
85
token
85
position_relative
-
-
-
-
-
4
-
-
4
-
-
-
-
-
Finished
awni00
1d 1h 59m 20s
-
128
relu
true
256
0.1
-
8
-
false
-
relu
false
256
0.1
-
-
false
-
Abstractor - L=2, d=128, h=8
161
token
85
-
2
2
31
85
token
85
-
-
-
-
-
-
-
-
-
-
-
8
-
-
8
Finished
awni00
20h 47m 35s
-
128
relu
true
256
0.1
-
8
-
false
-
relu
false
256
0.1
-
-
false
-
Abstractor - L=1, d=128, h=8
161
token
85
-
1
1
31
85
token
85
-
-
-
-
-
-
-
-
-
-
-
8
-
-
8
Finished
awni00
14h 33m 27s
-
128
relu
true
256
0.1
-
8
-
false
-
relu
false
256
0.1
-
-
false
-
e_sa=8; e_rca=0; d_sa=8; d_rca=0; d_cross=8; d=128; rca_type=NA, symbol_type=NA; el=2; dl=2
161
token
85
0
2
2
31
85
token
85
-
-
-
-
-
-
-
-
-
-
-
8
-
-
8
Crashed
awni00
3d 1h 55m 33s
-
128
relu
true
256
0.1
-
8
-
false
-
relu
false
256
0.1
-
-
false
-
e_sa=4; e_rca=4; d_sa=8; d_rca=0; d_cross=8; d=128; rca_type=disentangled_v2, symbol_type=pos_relative; el=2; dl=2
161
token
85
0
2
2
31
85
token
85
pos_relative
-
-
-
-
0
8
-
4
4
-
-
true
disentangled_v2
-
Crashed
awni00
3d 14s
-
128
relu
true
256
0.1
-
8
-
false
-
relu
false
256
0.1
-
-
false
-
e_sa=4; e_rca=4; d_sa=4; d_rca=4; d_cross=8; d=128; rca_type=disentangled_v2, symbol_type=pos_relative; el=2; dl=2
161
token
85
0
2
2
31
85
token
85
pos_relative
-
-
-
-
4
4
-
4
4
-
-
true
disentangled_v2
-
Finished
awni00
4d 6h 11m 50s
-
144
relu
true
288
0.1
-
8
-
false
-
relu
false
288
0.1
-
-
false
-
e_sa=8; e_rca=0; d_sa=8; d_rca=0; d_cross=8; d=144; rca_type=NA, symbol_type=NA; el=2; dl=2
161
token
85
0
2
2
31
85
token
85
-
-
-
-
-
-
-
-
-
-
-
8
-
-
8
1-12
of 12