Ajanz's workspace
Runs
6,380
Name
6,380 visualized
State
Notes
User
Tags
Created
Runtime
Sweep
accelerator
adam_epsilon
config
config_kwargs/classifier_dropout
dataset_info
dataset_name_or_path
dataset_version
devices
downstream_model_type
embedding_name_or_path
eval_batch_size
evaluation_filename
evaluation_mode
finetune_last_n_layers
ignore_index
input_column_name
label_all_tokens
learning_rate
load_dataset_kwargs
logging_config
max_seq_length
metrics
model_checkpoint_kwargs/filename
model_checkpoint_kwargs/monitor
model_checkpoint_kwargs/save_last
model_name_or_path
num_classes
optimizer
output_path
predict_subset
processing_batch_size
seed
tagging_scheme
target_column_name
target_field
task_model_kwargs/adam_epsilon
task_model_kwargs/eval_batch_size
task_model_kwargs/learning_rate
task_model_kwargs/optimizer
task_model_kwargs/train_batch_size
task_model_kwargs/use_scheduler
task_model_kwargs/warmup_steps
task_model_kwargs/weight_decay
text_field
Finished
ktagowski
1h 8m 57s
-
auto
0.00001
LightningAdvancedConfig(finetune_last_n_layers=4, task_model_kwargs={'adam_epsilon': 1e-05, 'eval_batch_size': 64, 'learning_rate': 0.0005, 'optimizer': 'AdamW', 'train_batch_size': 64, 'use_scheduler': True, 'warmup_steps': 100, 'weight_decay': 0.1}, datamodule_kwargs={'label_all_tokens': False, 'max_seq_length': 512}, task_train_kwargs={'max_epochs': 5, 'devices': 'auto', 'accelerator': 'auto'}, model_config_kwargs={'classifier_dropout': 0.5}, early_stopping_kwargs={'mode': 'min', 'monitor': 'val/Loss', 'patience': 3}, tokenizer_kwargs={}, batch_encoding_kwargs={}, dataloader_kwargs={})
0.5
DatasetInfo(description='NKJP-POS tagging dataset.', citation='', homepage='http://clip.ipipan.waw.pl/NationalCorpusOfPolish', license='', features={'input_ids': Sequence(feature=Value(dtype='int32', id=None), length=-1, id=None), 'attention_mask': Sequence(feature=Value(dtype='int8', id=None), length=-1, id=None), 'labels': Sequence(feature=ClassLabel(num_classes=35, names=['interp', 'comp', 'pred', 'imps', 'ppas', 'adja', 'aglt', 'interj', 'depr', 'numcol', 'ppron3', 'qub', 'ger', 'winien', 'adj', 'xxx', 'num', 'fin', 'ppron12', 'siebie', 'inf', 'pcon', 'prep', 'praet', 'adjp', 'impt', 'brev', 'pact', 'burk', 'adjc', 'adv', 'bedzie', 'subst', 'conj', 'pant'], id=None), length=-1, id=None)}, post_processed=None, supervised_keys=None, task_templates=None, builder_name='nkjppos', config_name='default', version=1.1.0, splits={'train': SplitInfo(name='train', num_bytes=21995776, num_examples=78219, dataset_name='nkjppos'), 'test': SplitInfo(name='test', num_bytes=2115978, num_examples=7444, dataset_name='nkjppos')}, download_checksums={'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/train.jsonl': {'num_bytes': 24495626, 'checksum': '2b531e4c97c0e9e587780c2cd58bbf0e9a1163fe5c5fcf7617cc50473b5984a9'}, 'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/test.jsonl': {'num_bytes': 2354273, 'checksum': '8917b146b157e3dd6ec531eca9174781e8579f0271040e5256095156abbb3c84'}}, download_size=26849899, post_processing_size=None, dataset_size=24111754, size_in_bytes=50961653)
data/datasets/nkjp_pos/lightning/
1.1.0
auto
AutoModelForTokenClassification
sentence-transformers/paraphrase-xlm-r-multilingual-v1
64
evaluation.json
EvaluationMode.UNIT
4
-100
tokens
false
0.0005
None
LightningLoggingConfig(loggers_names=['wandb'], tracking_project_name='nkjp_pos', wandb_entity='embeddings', wandb_logger_kwargs={})
512
None
last
None
false
sentence-transformers/paraphrase-xlm-r-multilingual-v1
35
AdamW
/embeddings-internal/leaderboard/data/models/lightning/sentence-transformers__paraphrase-xlm-r-multilingual-v1/nkjp_pos/run-4
LightingDataModuleSubset.TEST
None
441
None
pos_tags
pos_tags
0.00001
64
0.0005
AdamW
64
true
100
0.1
tokens
Finished
ktagowski
1h 11m 24s
-
auto
0.00001
LightningAdvancedConfig(finetune_last_n_layers=4, task_model_kwargs={'adam_epsilon': 1e-05, 'eval_batch_size': 64, 'learning_rate': 0.0005, 'optimizer': 'AdamW', 'train_batch_size': 64, 'use_scheduler': True, 'warmup_steps': 100, 'weight_decay': 0.1}, datamodule_kwargs={'label_all_tokens': False, 'max_seq_length': 512}, task_train_kwargs={'max_epochs': 5, 'devices': 'auto', 'accelerator': 'auto'}, model_config_kwargs={'classifier_dropout': 0.5}, early_stopping_kwargs={'mode': 'min', 'monitor': 'val/Loss', 'patience': 3}, tokenizer_kwargs={}, batch_encoding_kwargs={}, dataloader_kwargs={})
0.5
DatasetInfo(description='NKJP-POS tagging dataset.', citation='', homepage='http://clip.ipipan.waw.pl/NationalCorpusOfPolish', license='', features={'input_ids': Sequence(feature=Value(dtype='int32', id=None), length=-1, id=None), 'attention_mask': Sequence(feature=Value(dtype='int8', id=None), length=-1, id=None), 'labels': Sequence(feature=ClassLabel(num_classes=35, names=['interp', 'comp', 'pred', 'imps', 'ppas', 'adja', 'aglt', 'interj', 'depr', 'numcol', 'ppron3', 'qub', 'ger', 'winien', 'adj', 'xxx', 'num', 'fin', 'ppron12', 'siebie', 'inf', 'pcon', 'prep', 'praet', 'adjp', 'impt', 'brev', 'pact', 'burk', 'adjc', 'adv', 'bedzie', 'subst', 'conj', 'pant'], id=None), length=-1, id=None)}, post_processed=None, supervised_keys=None, task_templates=None, builder_name='nkjppos', config_name='default', version=1.1.0, splits={'train': SplitInfo(name='train', num_bytes=21995776, num_examples=78219, dataset_name='nkjppos'), 'test': SplitInfo(name='test', num_bytes=2115978, num_examples=7444, dataset_name='nkjppos')}, download_checksums={'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/train.jsonl': {'num_bytes': 24495626, 'checksum': '2b531e4c97c0e9e587780c2cd58bbf0e9a1163fe5c5fcf7617cc50473b5984a9'}, 'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/test.jsonl': {'num_bytes': 2354273, 'checksum': '8917b146b157e3dd6ec531eca9174781e8579f0271040e5256095156abbb3c84'}}, download_size=26849899, post_processing_size=None, dataset_size=24111754, size_in_bytes=50961653)
data/datasets/nkjp_pos/lightning/
1.1.0
auto
AutoModelForTokenClassification
sentence-transformers/paraphrase-xlm-r-multilingual-v1
64
evaluation.json
EvaluationMode.UNIT
4
-100
tokens
false
0.0005
None
LightningLoggingConfig(loggers_names=['wandb'], tracking_project_name='nkjp_pos', wandb_entity='embeddings', wandb_logger_kwargs={})
512
None
last
None
false
sentence-transformers/paraphrase-xlm-r-multilingual-v1
35
AdamW
/embeddings-internal/leaderboard/data/models/lightning/sentence-transformers__paraphrase-xlm-r-multilingual-v1/nkjp_pos/run-3
LightingDataModuleSubset.TEST
None
441
None
pos_tags
pos_tags
0.00001
64
0.0005
AdamW
64
true
100
0.1
tokens
Finished
ktagowski
2h 1m 53s
-
auto
0.00001
LightningAdvancedConfig(finetune_last_n_layers=4, task_model_kwargs={'adam_epsilon': 1e-05, 'eval_batch_size': 64, 'learning_rate': 0.0001, 'optimizer': 'Adam', 'train_batch_size': 64, 'use_scheduler': True, 'warmup_steps': 25, 'weight_decay': 0}, datamodule_kwargs={'label_all_tokens': False, 'max_seq_length': 512}, task_train_kwargs={'max_epochs': 10, 'devices': 'auto', 'accelerator': 'auto'}, model_config_kwargs={'classifier_dropout': 0.4}, early_stopping_kwargs={'mode': 'min', 'monitor': 'val/Loss', 'patience': 3}, tokenizer_kwargs={}, batch_encoding_kwargs={}, dataloader_kwargs={})
0.4
DatasetInfo(description='NKJP-POS tagging dataset.', citation='', homepage='http://clip.ipipan.waw.pl/NationalCorpusOfPolish', license='', features={'input_ids': Sequence(feature=Value(dtype='int32', id=None), length=-1, id=None), 'token_type_ids': Sequence(feature=Value(dtype='int8', id=None), length=-1, id=None), 'attention_mask': Sequence(feature=Value(dtype='int8', id=None), length=-1, id=None), 'labels': Sequence(feature=ClassLabel(num_classes=35, names=['interp', 'comp', 'pred', 'imps', 'ppas', 'adja', 'aglt', 'interj', 'depr', 'numcol', 'ppron3', 'qub', 'ger', 'winien', 'adj', 'xxx', 'num', 'fin', 'ppron12', 'siebie', 'inf', 'pcon', 'prep', 'praet', 'adjp', 'impt', 'brev', 'pact', 'burk', 'adjc', 'adv', 'bedzie', 'subst', 'conj', 'pant'], id=None), length=-1, id=None)}, post_processed=None, supervised_keys=None, task_templates=None, builder_name='nkjppos', config_name='default', version=1.1.0, splits={'train': SplitInfo(name='train', num_bytes=21995776, num_examples=78219, dataset_name='nkjppos'), 'test': SplitInfo(name='test', num_bytes=2115978, num_examples=7444, dataset_name='nkjppos')}, download_checksums={'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/train.jsonl': {'num_bytes': 24495626, 'checksum': '2b531e4c97c0e9e587780c2cd58bbf0e9a1163fe5c5fcf7617cc50473b5984a9'}, 'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/test.jsonl': {'num_bytes': 2354273, 'checksum': '8917b146b157e3dd6ec531eca9174781e8579f0271040e5256095156abbb3c84'}}, download_size=26849899, post_processing_size=None, dataset_size=24111754, size_in_bytes=50961653)
data/datasets/nkjp_pos/lightning/
1.1.0
auto
AutoModelForTokenClassification
dkleczek/bert-base-polish-cased-v1
64
evaluation.json
EvaluationMode.UNIT
4
-100
tokens
false
0.0001
None
LightningLoggingConfig(loggers_names=['wandb'], tracking_project_name='nkjp_pos', wandb_entity='embeddings', wandb_logger_kwargs={})
512
None
last
None
false
dkleczek/bert-base-polish-cased-v1
35
Adam
/embeddings-internal/leaderboard/data/models/lightning/dkleczek__bert-base-polish-cased-v1/nkjp_pos/run-4
LightingDataModuleSubset.TEST
None
441
None
pos_tags
pos_tags
0.00001
64
0.0001
Adam
64
true
25
0
tokens
Finished
ktagowski
1h 12m 57s
-
auto
0.00001
LightningAdvancedConfig(finetune_last_n_layers=4, task_model_kwargs={'adam_epsilon': 1e-05, 'eval_batch_size': 64, 'learning_rate': 0.0005, 'optimizer': 'AdamW', 'train_batch_size': 64, 'use_scheduler': True, 'warmup_steps': 100, 'weight_decay': 0.1}, datamodule_kwargs={'label_all_tokens': False, 'max_seq_length': 512}, task_train_kwargs={'max_epochs': 5, 'devices': 'auto', 'accelerator': 'auto'}, model_config_kwargs={'classifier_dropout': 0.5}, early_stopping_kwargs={'mode': 'min', 'monitor': 'val/Loss', 'patience': 3}, tokenizer_kwargs={}, batch_encoding_kwargs={}, dataloader_kwargs={})
0.5
DatasetInfo(description='NKJP-POS tagging dataset.', citation='', homepage='http://clip.ipipan.waw.pl/NationalCorpusOfPolish', license='', features={'input_ids': Sequence(feature=Value(dtype='int32', id=None), length=-1, id=None), 'attention_mask': Sequence(feature=Value(dtype='int8', id=None), length=-1, id=None), 'labels': Sequence(feature=ClassLabel(num_classes=35, names=['interp', 'comp', 'pred', 'imps', 'ppas', 'adja', 'aglt', 'interj', 'depr', 'numcol', 'ppron3', 'qub', 'ger', 'winien', 'adj', 'xxx', 'num', 'fin', 'ppron12', 'siebie', 'inf', 'pcon', 'prep', 'praet', 'adjp', 'impt', 'brev', 'pact', 'burk', 'adjc', 'adv', 'bedzie', 'subst', 'conj', 'pant'], id=None), length=-1, id=None)}, post_processed=None, supervised_keys=None, task_templates=None, builder_name='nkjppos', config_name='default', version=1.1.0, splits={'train': SplitInfo(name='train', num_bytes=21995776, num_examples=78219, dataset_name='nkjppos'), 'test': SplitInfo(name='test', num_bytes=2115978, num_examples=7444, dataset_name='nkjppos')}, download_checksums={'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/train.jsonl': {'num_bytes': 24495626, 'checksum': '2b531e4c97c0e9e587780c2cd58bbf0e9a1163fe5c5fcf7617cc50473b5984a9'}, 'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/test.jsonl': {'num_bytes': 2354273, 'checksum': '8917b146b157e3dd6ec531eca9174781e8579f0271040e5256095156abbb3c84'}}, download_size=26849899, post_processing_size=None, dataset_size=24111754, size_in_bytes=50961653)
data/datasets/nkjp_pos/lightning/
1.1.0
auto
AutoModelForTokenClassification
sentence-transformers/paraphrase-xlm-r-multilingual-v1
64
evaluation.json
EvaluationMode.UNIT
4
-100
tokens
false
0.0005
None
LightningLoggingConfig(loggers_names=['wandb'], tracking_project_name='nkjp_pos', wandb_entity='embeddings', wandb_logger_kwargs={})
512
None
last
None
false
sentence-transformers/paraphrase-xlm-r-multilingual-v1
35
AdamW
/embeddings-internal/leaderboard/data/models/lightning/sentence-transformers__paraphrase-xlm-r-multilingual-v1/nkjp_pos/run-2
LightingDataModuleSubset.TEST
None
441
None
pos_tags
pos_tags
0.00001
64
0.0005
AdamW
64
true
100
0.1
tokens
Finished
ktagowski
1h 11m 54s
-
auto
0.00001
LightningAdvancedConfig(finetune_last_n_layers=4, task_model_kwargs={'adam_epsilon': 1e-05, 'eval_batch_size': 64, 'learning_rate': 0.0005, 'optimizer': 'AdamW', 'train_batch_size': 64, 'use_scheduler': True, 'warmup_steps': 100, 'weight_decay': 0.1}, datamodule_kwargs={'label_all_tokens': False, 'max_seq_length': 512}, task_train_kwargs={'max_epochs': 5, 'devices': 'auto', 'accelerator': 'auto'}, model_config_kwargs={'classifier_dropout': 0.5}, early_stopping_kwargs={'mode': 'min', 'monitor': 'val/Loss', 'patience': 3}, tokenizer_kwargs={}, batch_encoding_kwargs={}, dataloader_kwargs={})
0.5
DatasetInfo(description='NKJP-POS tagging dataset.', citation='', homepage='http://clip.ipipan.waw.pl/NationalCorpusOfPolish', license='', features={'input_ids': Sequence(feature=Value(dtype='int32', id=None), length=-1, id=None), 'attention_mask': Sequence(feature=Value(dtype='int8', id=None), length=-1, id=None), 'labels': Sequence(feature=ClassLabel(num_classes=35, names=['interp', 'comp', 'pred', 'imps', 'ppas', 'adja', 'aglt', 'interj', 'depr', 'numcol', 'ppron3', 'qub', 'ger', 'winien', 'adj', 'xxx', 'num', 'fin', 'ppron12', 'siebie', 'inf', 'pcon', 'prep', 'praet', 'adjp', 'impt', 'brev', 'pact', 'burk', 'adjc', 'adv', 'bedzie', 'subst', 'conj', 'pant'], id=None), length=-1, id=None)}, post_processed=None, supervised_keys=None, task_templates=None, builder_name='nkjppos', config_name='default', version=1.1.0, splits={'train': SplitInfo(name='train', num_bytes=21995776, num_examples=78219, dataset_name='nkjppos'), 'test': SplitInfo(name='test', num_bytes=2115978, num_examples=7444, dataset_name='nkjppos')}, download_checksums={'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/train.jsonl': {'num_bytes': 24495626, 'checksum': '2b531e4c97c0e9e587780c2cd58bbf0e9a1163fe5c5fcf7617cc50473b5984a9'}, 'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/test.jsonl': {'num_bytes': 2354273, 'checksum': '8917b146b157e3dd6ec531eca9174781e8579f0271040e5256095156abbb3c84'}}, download_size=26849899, post_processing_size=None, dataset_size=24111754, size_in_bytes=50961653)
data/datasets/nkjp_pos/lightning/
1.1.0
auto
AutoModelForTokenClassification
sentence-transformers/paraphrase-xlm-r-multilingual-v1
64
evaluation.json
EvaluationMode.UNIT
4
-100
tokens
false
0.0005
None
LightningLoggingConfig(loggers_names=['wandb'], tracking_project_name='nkjp_pos', wandb_entity='embeddings', wandb_logger_kwargs={})
512
None
last
None
false
sentence-transformers/paraphrase-xlm-r-multilingual-v1
35
AdamW
/embeddings-internal/leaderboard/data/models/lightning/sentence-transformers__paraphrase-xlm-r-multilingual-v1/nkjp_pos/run-1
LightingDataModuleSubset.TEST
None
441
None
pos_tags
pos_tags
0.00001
64
0.0005
AdamW
64
true
100
0.1
tokens
Finished
ktagowski
2h 2m 40s
-
auto
0.00001
LightningAdvancedConfig(finetune_last_n_layers=4, task_model_kwargs={'adam_epsilon': 1e-05, 'eval_batch_size': 64, 'learning_rate': 0.0001, 'optimizer': 'Adam', 'train_batch_size': 64, 'use_scheduler': True, 'warmup_steps': 25, 'weight_decay': 0}, datamodule_kwargs={'label_all_tokens': False, 'max_seq_length': 512}, task_train_kwargs={'max_epochs': 10, 'devices': 'auto', 'accelerator': 'auto'}, model_config_kwargs={'classifier_dropout': 0.4}, early_stopping_kwargs={'mode': 'min', 'monitor': 'val/Loss', 'patience': 3}, tokenizer_kwargs={}, batch_encoding_kwargs={}, dataloader_kwargs={})
0.4
DatasetInfo(description='NKJP-POS tagging dataset.', citation='', homepage='http://clip.ipipan.waw.pl/NationalCorpusOfPolish', license='', features={'input_ids': Sequence(feature=Value(dtype='int32', id=None), length=-1, id=None), 'token_type_ids': Sequence(feature=Value(dtype='int8', id=None), length=-1, id=None), 'attention_mask': Sequence(feature=Value(dtype='int8', id=None), length=-1, id=None), 'labels': Sequence(feature=ClassLabel(num_classes=35, names=['interp', 'comp', 'pred', 'imps', 'ppas', 'adja', 'aglt', 'interj', 'depr', 'numcol', 'ppron3', 'qub', 'ger', 'winien', 'adj', 'xxx', 'num', 'fin', 'ppron12', 'siebie', 'inf', 'pcon', 'prep', 'praet', 'adjp', 'impt', 'brev', 'pact', 'burk', 'adjc', 'adv', 'bedzie', 'subst', 'conj', 'pant'], id=None), length=-1, id=None)}, post_processed=None, supervised_keys=None, task_templates=None, builder_name='nkjppos', config_name='default', version=1.1.0, splits={'train': SplitInfo(name='train', num_bytes=21995776, num_examples=78219, dataset_name='nkjppos'), 'test': SplitInfo(name='test', num_bytes=2115978, num_examples=7444, dataset_name='nkjppos')}, download_checksums={'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/train.jsonl': {'num_bytes': 24495626, 'checksum': '2b531e4c97c0e9e587780c2cd58bbf0e9a1163fe5c5fcf7617cc50473b5984a9'}, 'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/test.jsonl': {'num_bytes': 2354273, 'checksum': '8917b146b157e3dd6ec531eca9174781e8579f0271040e5256095156abbb3c84'}}, download_size=26849899, post_processing_size=None, dataset_size=24111754, size_in_bytes=50961653)
data/datasets/nkjp_pos/lightning/
1.1.0
auto
AutoModelForTokenClassification
dkleczek/bert-base-polish-cased-v1
64
evaluation.json
EvaluationMode.UNIT
4
-100
tokens
false
0.0001
None
LightningLoggingConfig(loggers_names=['wandb'], tracking_project_name='nkjp_pos', wandb_entity='embeddings', wandb_logger_kwargs={})
512
None
last
None
false
dkleczek/bert-base-polish-cased-v1
35
Adam
/embeddings-internal/leaderboard/data/models/lightning/dkleczek__bert-base-polish-cased-v1/nkjp_pos/run-3
LightingDataModuleSubset.TEST
None
441
None
pos_tags
pos_tags
0.00001
64
0.0001
Adam
64
true
25
0
tokens
Finished
ktagowski
1h 11m 53s
-
auto
0.00001
LightningAdvancedConfig(finetune_last_n_layers=4, task_model_kwargs={'adam_epsilon': 1e-05, 'eval_batch_size': 64, 'learning_rate': 0.0005, 'optimizer': 'AdamW', 'train_batch_size': 64, 'use_scheduler': True, 'warmup_steps': 100, 'weight_decay': 0.1}, datamodule_kwargs={'label_all_tokens': False, 'max_seq_length': 512}, task_train_kwargs={'max_epochs': 5, 'devices': 'auto', 'accelerator': 'auto'}, model_config_kwargs={'classifier_dropout': 0.5}, early_stopping_kwargs={'mode': 'min', 'monitor': 'val/Loss', 'patience': 3}, tokenizer_kwargs={}, batch_encoding_kwargs={}, dataloader_kwargs={})
0.5
DatasetInfo(description='NKJP-POS tagging dataset.', citation='', homepage='http://clip.ipipan.waw.pl/NationalCorpusOfPolish', license='', features={'input_ids': Sequence(feature=Value(dtype='int32', id=None), length=-1, id=None), 'attention_mask': Sequence(feature=Value(dtype='int8', id=None), length=-1, id=None), 'labels': Sequence(feature=ClassLabel(num_classes=35, names=['interp', 'comp', 'pred', 'imps', 'ppas', 'adja', 'aglt', 'interj', 'depr', 'numcol', 'ppron3', 'qub', 'ger', 'winien', 'adj', 'xxx', 'num', 'fin', 'ppron12', 'siebie', 'inf', 'pcon', 'prep', 'praet', 'adjp', 'impt', 'brev', 'pact', 'burk', 'adjc', 'adv', 'bedzie', 'subst', 'conj', 'pant'], id=None), length=-1, id=None)}, post_processed=None, supervised_keys=None, task_templates=None, builder_name='nkjppos', config_name='default', version=1.1.0, splits={'train': SplitInfo(name='train', num_bytes=21995776, num_examples=78219, dataset_name='nkjppos'), 'test': SplitInfo(name='test', num_bytes=2115978, num_examples=7444, dataset_name='nkjppos')}, download_checksums={'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/train.jsonl': {'num_bytes': 24495626, 'checksum': '2b531e4c97c0e9e587780c2cd58bbf0e9a1163fe5c5fcf7617cc50473b5984a9'}, 'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/test.jsonl': {'num_bytes': 2354273, 'checksum': '8917b146b157e3dd6ec531eca9174781e8579f0271040e5256095156abbb3c84'}}, download_size=26849899, post_processing_size=None, dataset_size=24111754, size_in_bytes=50961653)
data/datasets/nkjp_pos/lightning/
1.1.0
auto
AutoModelForTokenClassification
sentence-transformers/paraphrase-xlm-r-multilingual-v1
64
evaluation.json
EvaluationMode.UNIT
4
-100
tokens
false
0.0005
None
LightningLoggingConfig(loggers_names=['wandb'], tracking_project_name='nkjp_pos', wandb_entity='embeddings', wandb_logger_kwargs={})
512
None
last
None
false
sentence-transformers/paraphrase-xlm-r-multilingual-v1
35
AdamW
/embeddings-internal/leaderboard/data/models/lightning/sentence-transformers__paraphrase-xlm-r-multilingual-v1/nkjp_pos/run-0
LightingDataModuleSubset.TEST
None
441
None
pos_tags
pos_tags
0.00001
64
0.0005
AdamW
64
true
100
0.1
tokens
Finished
ktagowski
2h 2m 10s
-
auto
0.00001
LightningAdvancedConfig(finetune_last_n_layers=4, task_model_kwargs={'adam_epsilon': 1e-05, 'eval_batch_size': 64, 'learning_rate': 0.0001, 'optimizer': 'Adam', 'train_batch_size': 64, 'use_scheduler': True, 'warmup_steps': 25, 'weight_decay': 0}, datamodule_kwargs={'label_all_tokens': False, 'max_seq_length': 512}, task_train_kwargs={'max_epochs': 10, 'devices': 'auto', 'accelerator': 'auto'}, model_config_kwargs={'classifier_dropout': 0.4}, early_stopping_kwargs={'mode': 'min', 'monitor': 'val/Loss', 'patience': 3}, tokenizer_kwargs={}, batch_encoding_kwargs={}, dataloader_kwargs={})
0.4
DatasetInfo(description='NKJP-POS tagging dataset.', citation='', homepage='http://clip.ipipan.waw.pl/NationalCorpusOfPolish', license='', features={'input_ids': Sequence(feature=Value(dtype='int32', id=None), length=-1, id=None), 'token_type_ids': Sequence(feature=Value(dtype='int8', id=None), length=-1, id=None), 'attention_mask': Sequence(feature=Value(dtype='int8', id=None), length=-1, id=None), 'labels': Sequence(feature=ClassLabel(num_classes=35, names=['interp', 'comp', 'pred', 'imps', 'ppas', 'adja', 'aglt', 'interj', 'depr', 'numcol', 'ppron3', 'qub', 'ger', 'winien', 'adj', 'xxx', 'num', 'fin', 'ppron12', 'siebie', 'inf', 'pcon', 'prep', 'praet', 'adjp', 'impt', 'brev', 'pact', 'burk', 'adjc', 'adv', 'bedzie', 'subst', 'conj', 'pant'], id=None), length=-1, id=None)}, post_processed=None, supervised_keys=None, task_templates=None, builder_name='nkjppos', config_name='default', version=1.1.0, splits={'train': SplitInfo(name='train', num_bytes=21995776, num_examples=78219, dataset_name='nkjppos'), 'test': SplitInfo(name='test', num_bytes=2115978, num_examples=7444, dataset_name='nkjppos')}, download_checksums={'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/train.jsonl': {'num_bytes': 24495626, 'checksum': '2b531e4c97c0e9e587780c2cd58bbf0e9a1163fe5c5fcf7617cc50473b5984a9'}, 'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/test.jsonl': {'num_bytes': 2354273, 'checksum': '8917b146b157e3dd6ec531eca9174781e8579f0271040e5256095156abbb3c84'}}, download_size=26849899, post_processing_size=None, dataset_size=24111754, size_in_bytes=50961653)
data/datasets/nkjp_pos/lightning/
1.1.0
auto
AutoModelForTokenClassification
dkleczek/bert-base-polish-cased-v1
64
evaluation.json
EvaluationMode.UNIT
4
-100
tokens
false
0.0001
None
LightningLoggingConfig(loggers_names=['wandb'], tracking_project_name='nkjp_pos', wandb_entity='embeddings', wandb_logger_kwargs={})
512
None
last
None
false
dkleczek/bert-base-polish-cased-v1
35
Adam
/embeddings-internal/leaderboard/data/models/lightning/dkleczek__bert-base-polish-cased-v1/nkjp_pos/run-2
LightingDataModuleSubset.TEST
None
441
None
pos_tags
pos_tags
0.00001
64
0.0001
Adam
64
true
25
0
tokens
Finished
ktagowski
2h 14m 52s
-
auto
0.0001
LightningAdvancedConfig(finetune_last_n_layers=4, task_model_kwargs={'adam_epsilon': 0.0001, 'eval_batch_size': 32, 'learning_rate': 5e-05, 'optimizer': 'Adam', 'train_batch_size': 32, 'use_scheduler': True, 'warmup_steps': 25, 'weight_decay': 0}, datamodule_kwargs={'label_all_tokens': False, 'max_seq_length': 512}, task_train_kwargs={'max_epochs': 10, 'devices': 'auto', 'accelerator': 'auto'}, model_config_kwargs={'classifier_dropout': 0.2}, early_stopping_kwargs={'mode': 'min', 'monitor': 'val/Loss', 'patience': 3}, tokenizer_kwargs={}, batch_encoding_kwargs={}, dataloader_kwargs={})
0.2
DatasetInfo(description='NKJP-POS tagging dataset.', citation='', homepage='http://clip.ipipan.waw.pl/NationalCorpusOfPolish', license='', features={'input_ids': Sequence(feature=Value(dtype='int32', id=None), length=-1, id=None), 'token_type_ids': Sequence(feature=Value(dtype='int8', id=None), length=-1, id=None), 'attention_mask': Sequence(feature=Value(dtype='int8', id=None), length=-1, id=None), 'labels': Sequence(feature=ClassLabel(num_classes=35, names=['interp', 'comp', 'pred', 'imps', 'ppas', 'adja', 'aglt', 'interj', 'depr', 'numcol', 'ppron3', 'qub', 'ger', 'winien', 'adj', 'xxx', 'num', 'fin', 'ppron12', 'siebie', 'inf', 'pcon', 'prep', 'praet', 'adjp', 'impt', 'brev', 'pact', 'burk', 'adjc', 'adv', 'bedzie', 'subst', 'conj', 'pant'], id=None), length=-1, id=None)}, post_processed=None, supervised_keys=None, task_templates=None, builder_name='nkjppos', config_name='default', version=1.1.0, splits={'train': SplitInfo(name='train', num_bytes=21995776, num_examples=78219, dataset_name='nkjppos'), 'test': SplitInfo(name='test', num_bytes=2115978, num_examples=7444, dataset_name='nkjppos')}, download_checksums={'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/train.jsonl': {'num_bytes': 24495626, 'checksum': '2b531e4c97c0e9e587780c2cd58bbf0e9a1163fe5c5fcf7617cc50473b5984a9'}, 'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/test.jsonl': {'num_bytes': 2354273, 'checksum': '8917b146b157e3dd6ec531eca9174781e8579f0271040e5256095156abbb3c84'}}, download_size=26849899, post_processing_size=None, dataset_size=24111754, size_in_bytes=50961653)
data/datasets/nkjp_pos/lightning/
1.1.0
auto
AutoModelForTokenClassification
allegro/herbert-base-cased
32
evaluation.json
EvaluationMode.UNIT
4
-100
tokens
false
0.00005
None
LightningLoggingConfig(loggers_names=['wandb'], tracking_project_name='nkjp_pos', wandb_entity='embeddings', wandb_logger_kwargs={})
512
None
last
None
false
allegro/herbert-base-cased
35
Adam
/embeddings-internal/leaderboard/data/models/lightning/allegro__herbert-base-cased/nkjp_pos/run-4
LightingDataModuleSubset.TEST
None
441
None
pos_tags
pos_tags
0.0001
32
0.00005
Adam
32
true
25
0
tokens
Finished
ktagowski
2h 10m 33s
-
auto
0.00001
LightningAdvancedConfig(finetune_last_n_layers=4, task_model_kwargs={'adam_epsilon': 1e-05, 'eval_batch_size': 16, 'learning_rate': 5e-05, 'optimizer': 'AdamW', 'train_batch_size': 16, 'use_scheduler': True, 'warmup_steps': 50, 'weight_decay': 0}, datamodule_kwargs={'label_all_tokens': False, 'max_seq_length': 512}, task_train_kwargs={'max_epochs': 5, 'devices': 'auto', 'accelerator': 'auto'}, model_config_kwargs={'classifier_dropout': 0.4}, early_stopping_kwargs={'mode': 'min', 'monitor': 'val/Loss', 'patience': 3}, tokenizer_kwargs={}, batch_encoding_kwargs={}, dataloader_kwargs={})
0.4
DatasetInfo(description='NKJP-POS tagging dataset.', citation='', homepage='http://clip.ipipan.waw.pl/NationalCorpusOfPolish', license='', features={'input_ids': Sequence(feature=Value(dtype='int32', id=None), length=-1, id=None), 'token_type_ids': Sequence(feature=Value(dtype='int8', id=None), length=-1, id=None), 'attention_mask': Sequence(feature=Value(dtype='int8', id=None), length=-1, id=None), 'labels': Sequence(feature=ClassLabel(num_classes=35, names=['interp', 'comp', 'pred', 'imps', 'ppas', 'adja', 'aglt', 'interj', 'depr', 'numcol', 'ppron3', 'qub', 'ger', 'winien', 'adj', 'xxx', 'num', 'fin', 'ppron12', 'siebie', 'inf', 'pcon', 'prep', 'praet', 'adjp', 'impt', 'brev', 'pact', 'burk', 'adjc', 'adv', 'bedzie', 'subst', 'conj', 'pant'], id=None), length=-1, id=None)}, post_processed=None, supervised_keys=None, task_templates=None, builder_name='nkjppos', config_name='default', version=1.1.0, splits={'train': SplitInfo(name='train', num_bytes=21995776, num_examples=78219, dataset_name='nkjppos'), 'test': SplitInfo(name='test', num_bytes=2115978, num_examples=7444, dataset_name='nkjppos')}, download_checksums={'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/train.jsonl': {'num_bytes': 24495626, 'checksum': '2b531e4c97c0e9e587780c2cd58bbf0e9a1163fe5c5fcf7617cc50473b5984a9'}, 'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/test.jsonl': {'num_bytes': 2354273, 'checksum': '8917b146b157e3dd6ec531eca9174781e8579f0271040e5256095156abbb3c84'}}, download_size=26849899, post_processing_size=None, dataset_size=24111754, size_in_bytes=50961653)
data/datasets/nkjp_pos/lightning/
1.1.0
auto
AutoModelForTokenClassification
allegro/herbert-large-cased
16
evaluation.json
EvaluationMode.UNIT
4
-100
tokens
false
0.00005
None
LightningLoggingConfig(loggers_names=['wandb'], tracking_project_name='nkjp_pos', wandb_entity='embeddings', wandb_logger_kwargs={})
512
None
last
None
false
allegro/herbert-large-cased
35
AdamW
/embeddings-internal/leaderboard/data/models/lightning/allegro__herbert-large-cased/nkjp_pos/run-4
LightingDataModuleSubset.TEST
None
441
None
pos_tags
pos_tags
0.00001
16
0.00005
AdamW
16
true
50
0
tokens
Finished
ktagowski
2h 5m 16s
-
auto
0.00001
LightningAdvancedConfig(finetune_last_n_layers=4, task_model_kwargs={'adam_epsilon': 1e-05, 'eval_batch_size': 64, 'learning_rate': 0.0001, 'optimizer': 'Adam', 'train_batch_size': 64, 'use_scheduler': True, 'warmup_steps': 25, 'weight_decay': 0}, datamodule_kwargs={'label_all_tokens': False, 'max_seq_length': 512}, task_train_kwargs={'max_epochs': 10, 'devices': 'auto', 'accelerator': 'auto'}, model_config_kwargs={'classifier_dropout': 0.4}, early_stopping_kwargs={'mode': 'min', 'monitor': 'val/Loss', 'patience': 3}, tokenizer_kwargs={}, batch_encoding_kwargs={}, dataloader_kwargs={})
0.4
DatasetInfo(description='NKJP-POS tagging dataset.', citation='', homepage='http://clip.ipipan.waw.pl/NationalCorpusOfPolish', license='', features={'input_ids': Sequence(feature=Value(dtype='int32', id=None), length=-1, id=None), 'token_type_ids': Sequence(feature=Value(dtype='int8', id=None), length=-1, id=None), 'attention_mask': Sequence(feature=Value(dtype='int8', id=None), length=-1, id=None), 'labels': Sequence(feature=ClassLabel(num_classes=35, names=['interp', 'comp', 'pred', 'imps', 'ppas', 'adja', 'aglt', 'interj', 'depr', 'numcol', 'ppron3', 'qub', 'ger', 'winien', 'adj', 'xxx', 'num', 'fin', 'ppron12', 'siebie', 'inf', 'pcon', 'prep', 'praet', 'adjp', 'impt', 'brev', 'pact', 'burk', 'adjc', 'adv', 'bedzie', 'subst', 'conj', 'pant'], id=None), length=-1, id=None)}, post_processed=None, supervised_keys=None, task_templates=None, builder_name='nkjppos', config_name='default', version=1.1.0, splits={'train': SplitInfo(name='train', num_bytes=21995776, num_examples=78219, dataset_name='nkjppos'), 'test': SplitInfo(name='test', num_bytes=2115978, num_examples=7444, dataset_name='nkjppos')}, download_checksums={'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/train.jsonl': {'num_bytes': 24495626, 'checksum': '2b531e4c97c0e9e587780c2cd58bbf0e9a1163fe5c5fcf7617cc50473b5984a9'}, 'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/test.jsonl': {'num_bytes': 2354273, 'checksum': '8917b146b157e3dd6ec531eca9174781e8579f0271040e5256095156abbb3c84'}}, download_size=26849899, post_processing_size=None, dataset_size=24111754, size_in_bytes=50961653)
data/datasets/nkjp_pos/lightning/
1.1.0
auto
AutoModelForTokenClassification
dkleczek/bert-base-polish-cased-v1
64
evaluation.json
EvaluationMode.UNIT
4
-100
tokens
false
0.0001
None
LightningLoggingConfig(loggers_names=['wandb'], tracking_project_name='nkjp_pos', wandb_entity='embeddings', wandb_logger_kwargs={})
512
None
last
None
false
dkleczek/bert-base-polish-cased-v1
35
Adam
/embeddings-internal/leaderboard/data/models/lightning/dkleczek__bert-base-polish-cased-v1/nkjp_pos/run-1
LightingDataModuleSubset.TEST
None
441
None
pos_tags
pos_tags
0.00001
64
0.0001
Adam
64
true
25
0
tokens
Finished
ktagowski
2h 7m 56s
-
auto
0.0001
LightningAdvancedConfig(finetune_last_n_layers=4, task_model_kwargs={'adam_epsilon': 0.0001, 'eval_batch_size': 32, 'learning_rate': 5e-05, 'optimizer': 'Adam', 'train_batch_size': 32, 'use_scheduler': True, 'warmup_steps': 25, 'weight_decay': 0}, datamodule_kwargs={'label_all_tokens': False, 'max_seq_length': 512}, task_train_kwargs={'max_epochs': 10, 'devices': 'auto', 'accelerator': 'auto'}, model_config_kwargs={'classifier_dropout': 0.2}, early_stopping_kwargs={'mode': 'min', 'monitor': 'val/Loss', 'patience': 3}, tokenizer_kwargs={}, batch_encoding_kwargs={}, dataloader_kwargs={})
0.2
DatasetInfo(description='NKJP-POS tagging dataset.', citation='', homepage='http://clip.ipipan.waw.pl/NationalCorpusOfPolish', license='', features={'input_ids': Sequence(feature=Value(dtype='int32', id=None), length=-1, id=None), 'token_type_ids': Sequence(feature=Value(dtype='int8', id=None), length=-1, id=None), 'attention_mask': Sequence(feature=Value(dtype='int8', id=None), length=-1, id=None), 'labels': Sequence(feature=ClassLabel(num_classes=35, names=['interp', 'comp', 'pred', 'imps', 'ppas', 'adja', 'aglt', 'interj', 'depr', 'numcol', 'ppron3', 'qub', 'ger', 'winien', 'adj', 'xxx', 'num', 'fin', 'ppron12', 'siebie', 'inf', 'pcon', 'prep', 'praet', 'adjp', 'impt', 'brev', 'pact', 'burk', 'adjc', 'adv', 'bedzie', 'subst', 'conj', 'pant'], id=None), length=-1, id=None)}, post_processed=None, supervised_keys=None, task_templates=None, builder_name='nkjppos', config_name='default', version=1.1.0, splits={'train': SplitInfo(name='train', num_bytes=21995776, num_examples=78219, dataset_name='nkjppos'), 'test': SplitInfo(name='test', num_bytes=2115978, num_examples=7444, dataset_name='nkjppos')}, download_checksums={'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/train.jsonl': {'num_bytes': 24495626, 'checksum': '2b531e4c97c0e9e587780c2cd58bbf0e9a1163fe5c5fcf7617cc50473b5984a9'}, 'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/test.jsonl': {'num_bytes': 2354273, 'checksum': '8917b146b157e3dd6ec531eca9174781e8579f0271040e5256095156abbb3c84'}}, download_size=26849899, post_processing_size=None, dataset_size=24111754, size_in_bytes=50961653)
data/datasets/nkjp_pos/lightning/
1.1.0
auto
AutoModelForTokenClassification
allegro/herbert-base-cased
32
evaluation.json
EvaluationMode.UNIT
4
-100
tokens
false
0.00005
None
LightningLoggingConfig(loggers_names=['wandb'], tracking_project_name='nkjp_pos', wandb_entity='embeddings', wandb_logger_kwargs={})
512
None
last
None
false
allegro/herbert-base-cased
35
Adam
/embeddings-internal/leaderboard/data/models/lightning/allegro__herbert-base-cased/nkjp_pos/run-3
LightingDataModuleSubset.TEST
None
441
None
pos_tags
pos_tags
0.0001
32
0.00005
Adam
32
true
25
0
tokens
Finished
ktagowski
2h 10m 24s
-
auto
0.00001
LightningAdvancedConfig(finetune_last_n_layers=4, task_model_kwargs={'adam_epsilon': 1e-05, 'eval_batch_size': 16, 'learning_rate': 5e-05, 'optimizer': 'AdamW', 'train_batch_size': 16, 'use_scheduler': True, 'warmup_steps': 50, 'weight_decay': 0}, datamodule_kwargs={'label_all_tokens': False, 'max_seq_length': 512}, task_train_kwargs={'max_epochs': 5, 'devices': 'auto', 'accelerator': 'auto'}, model_config_kwargs={'classifier_dropout': 0.4}, early_stopping_kwargs={'mode': 'min', 'monitor': 'val/Loss', 'patience': 3}, tokenizer_kwargs={}, batch_encoding_kwargs={}, dataloader_kwargs={})
0.4
DatasetInfo(description='NKJP-POS tagging dataset.', citation='', homepage='http://clip.ipipan.waw.pl/NationalCorpusOfPolish', license='', features={'input_ids': Sequence(feature=Value(dtype='int32', id=None), length=-1, id=None), 'token_type_ids': Sequence(feature=Value(dtype='int8', id=None), length=-1, id=None), 'attention_mask': Sequence(feature=Value(dtype='int8', id=None), length=-1, id=None), 'labels': Sequence(feature=ClassLabel(num_classes=35, names=['interp', 'comp', 'pred', 'imps', 'ppas', 'adja', 'aglt', 'interj', 'depr', 'numcol', 'ppron3', 'qub', 'ger', 'winien', 'adj', 'xxx', 'num', 'fin', 'ppron12', 'siebie', 'inf', 'pcon', 'prep', 'praet', 'adjp', 'impt', 'brev', 'pact', 'burk', 'adjc', 'adv', 'bedzie', 'subst', 'conj', 'pant'], id=None), length=-1, id=None)}, post_processed=None, supervised_keys=None, task_templates=None, builder_name='nkjppos', config_name='default', version=1.1.0, splits={'train': SplitInfo(name='train', num_bytes=21995776, num_examples=78219, dataset_name='nkjppos'), 'test': SplitInfo(name='test', num_bytes=2115978, num_examples=7444, dataset_name='nkjppos')}, download_checksums={'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/train.jsonl': {'num_bytes': 24495626, 'checksum': '2b531e4c97c0e9e587780c2cd58bbf0e9a1163fe5c5fcf7617cc50473b5984a9'}, 'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/test.jsonl': {'num_bytes': 2354273, 'checksum': '8917b146b157e3dd6ec531eca9174781e8579f0271040e5256095156abbb3c84'}}, download_size=26849899, post_processing_size=None, dataset_size=24111754, size_in_bytes=50961653)
data/datasets/nkjp_pos/lightning/
1.1.0
auto
AutoModelForTokenClassification
allegro/herbert-large-cased
16
evaluation.json
EvaluationMode.UNIT
4
-100
tokens
false
0.00005
None
LightningLoggingConfig(loggers_names=['wandb'], tracking_project_name='nkjp_pos', wandb_entity='embeddings', wandb_logger_kwargs={})
512
None
last
None
false
allegro/herbert-large-cased
35
AdamW
/embeddings-internal/leaderboard/data/models/lightning/allegro__herbert-large-cased/nkjp_pos/run-3
LightingDataModuleSubset.TEST
None
441
None
pos_tags
pos_tags
0.00001
16
0.00005
AdamW
16
true
50
0
tokens
Finished
ktagowski
2h 4m 46s
-
auto
0.00001
LightningAdvancedConfig(finetune_last_n_layers=4, task_model_kwargs={'adam_epsilon': 1e-05, 'eval_batch_size': 64, 'learning_rate': 0.0001, 'optimizer': 'Adam', 'train_batch_size': 64, 'use_scheduler': True, 'warmup_steps': 25, 'weight_decay': 0}, datamodule_kwargs={'label_all_tokens': False, 'max_seq_length': 512}, task_train_kwargs={'max_epochs': 10, 'devices': 'auto', 'accelerator': 'auto'}, model_config_kwargs={'classifier_dropout': 0.4}, early_stopping_kwargs={'mode': 'min', 'monitor': 'val/Loss', 'patience': 3}, tokenizer_kwargs={}, batch_encoding_kwargs={}, dataloader_kwargs={})
0.4
DatasetInfo(description='NKJP-POS tagging dataset.', citation='', homepage='http://clip.ipipan.waw.pl/NationalCorpusOfPolish', license='', features={'input_ids': Sequence(feature=Value(dtype='int32', id=None), length=-1, id=None), 'token_type_ids': Sequence(feature=Value(dtype='int8', id=None), length=-1, id=None), 'attention_mask': Sequence(feature=Value(dtype='int8', id=None), length=-1, id=None), 'labels': Sequence(feature=ClassLabel(num_classes=35, names=['interp', 'comp', 'pred', 'imps', 'ppas', 'adja', 'aglt', 'interj', 'depr', 'numcol', 'ppron3', 'qub', 'ger', 'winien', 'adj', 'xxx', 'num', 'fin', 'ppron12', 'siebie', 'inf', 'pcon', 'prep', 'praet', 'adjp', 'impt', 'brev', 'pact', 'burk', 'adjc', 'adv', 'bedzie', 'subst', 'conj', 'pant'], id=None), length=-1, id=None)}, post_processed=None, supervised_keys=None, task_templates=None, builder_name='nkjppos', config_name='default', version=1.1.0, splits={'train': SplitInfo(name='train', num_bytes=21995776, num_examples=78219, dataset_name='nkjppos'), 'test': SplitInfo(name='test', num_bytes=2115978, num_examples=7444, dataset_name='nkjppos')}, download_checksums={'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/train.jsonl': {'num_bytes': 24495626, 'checksum': '2b531e4c97c0e9e587780c2cd58bbf0e9a1163fe5c5fcf7617cc50473b5984a9'}, 'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/test.jsonl': {'num_bytes': 2354273, 'checksum': '8917b146b157e3dd6ec531eca9174781e8579f0271040e5256095156abbb3c84'}}, download_size=26849899, post_processing_size=None, dataset_size=24111754, size_in_bytes=50961653)
data/datasets/nkjp_pos/lightning/
1.1.0
auto
AutoModelForTokenClassification
dkleczek/bert-base-polish-cased-v1
64
evaluation.json
EvaluationMode.UNIT
4
-100
tokens
false
0.0001
None
LightningLoggingConfig(loggers_names=['wandb'], tracking_project_name='nkjp_pos', wandb_entity='embeddings', wandb_logger_kwargs={})
512
None
last
None
false
dkleczek/bert-base-polish-cased-v1
35
Adam
/embeddings-internal/leaderboard/data/models/lightning/dkleczek__bert-base-polish-cased-v1/nkjp_pos/run-0
LightingDataModuleSubset.TEST
None
441
None
pos_tags
pos_tags
0.00001
64
0.0001
Adam
64
true
25
0
tokens
Finished
ktagowski
1h 4m 11s
-
auto
0.000001
LightningAdvancedConfig(finetune_last_n_layers=4, task_model_kwargs={'adam_epsilon': 1e-06, 'eval_batch_size': 64, 'learning_rate': 0.0005, 'optimizer': 'AdamW', 'train_batch_size': 64, 'use_scheduler': True, 'warmup_steps': 100, 'weight_decay': 0.1}, datamodule_kwargs={'label_all_tokens': False, 'max_seq_length': 512}, task_train_kwargs={'max_epochs': 5, 'devices': 'auto', 'accelerator': 'auto'}, model_config_kwargs={'classifier_dropout': 0.1}, early_stopping_kwargs={'mode': 'min', 'monitor': 'val/Loss', 'patience': 3}, tokenizer_kwargs={}, batch_encoding_kwargs={}, dataloader_kwargs={})
0.1
DatasetInfo(description='NKJP-POS tagging dataset.', citation='', homepage='http://clip.ipipan.waw.pl/NationalCorpusOfPolish', license='', features={'input_ids': Sequence(feature=Value(dtype='int32', id=None), length=-1, id=None), 'token_type_ids': Sequence(feature=Value(dtype='int8', id=None), length=-1, id=None), 'attention_mask': Sequence(feature=Value(dtype='int8', id=None), length=-1, id=None), 'labels': Sequence(feature=ClassLabel(num_classes=35, names=['interp', 'comp', 'pred', 'imps', 'ppas', 'adja', 'aglt', 'interj', 'depr', 'numcol', 'ppron3', 'qub', 'ger', 'winien', 'adj', 'xxx', 'num', 'fin', 'ppron12', 'siebie', 'inf', 'pcon', 'prep', 'praet', 'adjp', 'impt', 'brev', 'pact', 'burk', 'adjc', 'adv', 'bedzie', 'subst', 'conj', 'pant'], id=None), length=-1, id=None)}, post_processed=None, supervised_keys=None, task_templates=None, builder_name='nkjppos', config_name='default', version=1.1.0, splits={'train': SplitInfo(name='train', num_bytes=21995776, num_examples=78219, dataset_name='nkjppos'), 'test': SplitInfo(name='test', num_bytes=2115978, num_examples=7444, dataset_name='nkjppos')}, download_checksums={'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/train.jsonl': {'num_bytes': 24495626, 'checksum': '2b531e4c97c0e9e587780c2cd58bbf0e9a1163fe5c5fcf7617cc50473b5984a9'}, 'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/test.jsonl': {'num_bytes': 2354273, 'checksum': '8917b146b157e3dd6ec531eca9174781e8579f0271040e5256095156abbb3c84'}}, download_size=26849899, post_processing_size=None, dataset_size=24111754, size_in_bytes=50961653)
data/datasets/nkjp_pos/lightning/
1.1.0
auto
AutoModelForTokenClassification
dkleczek/bert-base-polish-uncased-v1
64
evaluation.json
EvaluationMode.UNIT
4
-100
tokens
false
0.0005
None
LightningLoggingConfig(loggers_names=['wandb'], tracking_project_name='nkjp_pos', wandb_entity='embeddings', wandb_logger_kwargs={})
512
None
last
None
false
dkleczek/bert-base-polish-uncased-v1
35
AdamW
/embeddings-internal/leaderboard/data/models/lightning/dkleczek__bert-base-polish-uncased-v1/nkjp_pos/run-4
LightingDataModuleSubset.TEST
None
441
None
pos_tags
pos_tags
0.000001
64
0.0005
AdamW
64
true
100
0.1
tokens
Finished
ktagowski
2h 9m 12s
-
auto
0.0001
LightningAdvancedConfig(finetune_last_n_layers=4, task_model_kwargs={'adam_epsilon': 0.0001, 'eval_batch_size': 32, 'learning_rate': 5e-05, 'optimizer': 'Adam', 'train_batch_size': 32, 'use_scheduler': True, 'warmup_steps': 25, 'weight_decay': 0}, datamodule_kwargs={'label_all_tokens': False, 'max_seq_length': 512}, task_train_kwargs={'max_epochs': 10, 'devices': 'auto', 'accelerator': 'auto'}, model_config_kwargs={'classifier_dropout': 0.2}, early_stopping_kwargs={'mode': 'min', 'monitor': 'val/Loss', 'patience': 3}, tokenizer_kwargs={}, batch_encoding_kwargs={}, dataloader_kwargs={})
0.2
DatasetInfo(description='NKJP-POS tagging dataset.', citation='', homepage='http://clip.ipipan.waw.pl/NationalCorpusOfPolish', license='', features={'input_ids': Sequence(feature=Value(dtype='int32', id=None), length=-1, id=None), 'token_type_ids': Sequence(feature=Value(dtype='int8', id=None), length=-1, id=None), 'attention_mask': Sequence(feature=Value(dtype='int8', id=None), length=-1, id=None), 'labels': Sequence(feature=ClassLabel(num_classes=35, names=['interp', 'comp', 'pred', 'imps', 'ppas', 'adja', 'aglt', 'interj', 'depr', 'numcol', 'ppron3', 'qub', 'ger', 'winien', 'adj', 'xxx', 'num', 'fin', 'ppron12', 'siebie', 'inf', 'pcon', 'prep', 'praet', 'adjp', 'impt', 'brev', 'pact', 'burk', 'adjc', 'adv', 'bedzie', 'subst', 'conj', 'pant'], id=None), length=-1, id=None)}, post_processed=None, supervised_keys=None, task_templates=None, builder_name='nkjppos', config_name='default', version=1.1.0, splits={'train': SplitInfo(name='train', num_bytes=21995776, num_examples=78219, dataset_name='nkjppos'), 'test': SplitInfo(name='test', num_bytes=2115978, num_examples=7444, dataset_name='nkjppos')}, download_checksums={'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/train.jsonl': {'num_bytes': 24495626, 'checksum': '2b531e4c97c0e9e587780c2cd58bbf0e9a1163fe5c5fcf7617cc50473b5984a9'}, 'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/test.jsonl': {'num_bytes': 2354273, 'checksum': '8917b146b157e3dd6ec531eca9174781e8579f0271040e5256095156abbb3c84'}}, download_size=26849899, post_processing_size=None, dataset_size=24111754, size_in_bytes=50961653)
data/datasets/nkjp_pos/lightning/
1.1.0
auto
AutoModelForTokenClassification
allegro/herbert-base-cased
32
evaluation.json
EvaluationMode.UNIT
4
-100
tokens
false
0.00005
None
LightningLoggingConfig(loggers_names=['wandb'], tracking_project_name='nkjp_pos', wandb_entity='embeddings', wandb_logger_kwargs={})
512
None
last
None
false
allegro/herbert-base-cased
35
Adam
/embeddings-internal/leaderboard/data/models/lightning/allegro__herbert-base-cased/nkjp_pos/run-2
LightingDataModuleSubset.TEST
None
441
None
pos_tags
pos_tags
0.0001
32
0.00005
Adam
32
true
25
0
tokens
Finished
ktagowski
2h 4m 55s
-
auto
0.00001
LightningAdvancedConfig(finetune_last_n_layers=4, task_model_kwargs={'adam_epsilon': 1e-05, 'eval_batch_size': 16, 'learning_rate': 5e-05, 'optimizer': 'AdamW', 'train_batch_size': 16, 'use_scheduler': True, 'warmup_steps': 50, 'weight_decay': 0}, datamodule_kwargs={'label_all_tokens': False, 'max_seq_length': 512}, task_train_kwargs={'max_epochs': 5, 'devices': 'auto', 'accelerator': 'auto'}, model_config_kwargs={'classifier_dropout': 0.4}, early_stopping_kwargs={'mode': 'min', 'monitor': 'val/Loss', 'patience': 3}, tokenizer_kwargs={}, batch_encoding_kwargs={}, dataloader_kwargs={})
0.4
DatasetInfo(description='NKJP-POS tagging dataset.', citation='', homepage='http://clip.ipipan.waw.pl/NationalCorpusOfPolish', license='', features={'input_ids': Sequence(feature=Value(dtype='int32', id=None), length=-1, id=None), 'token_type_ids': Sequence(feature=Value(dtype='int8', id=None), length=-1, id=None), 'attention_mask': Sequence(feature=Value(dtype='int8', id=None), length=-1, id=None), 'labels': Sequence(feature=ClassLabel(num_classes=35, names=['interp', 'comp', 'pred', 'imps', 'ppas', 'adja', 'aglt', 'interj', 'depr', 'numcol', 'ppron3', 'qub', 'ger', 'winien', 'adj', 'xxx', 'num', 'fin', 'ppron12', 'siebie', 'inf', 'pcon', 'prep', 'praet', 'adjp', 'impt', 'brev', 'pact', 'burk', 'adjc', 'adv', 'bedzie', 'subst', 'conj', 'pant'], id=None), length=-1, id=None)}, post_processed=None, supervised_keys=None, task_templates=None, builder_name='nkjppos', config_name='default', version=1.1.0, splits={'train': SplitInfo(name='train', num_bytes=21995776, num_examples=78219, dataset_name='nkjppos'), 'test': SplitInfo(name='test', num_bytes=2115978, num_examples=7444, dataset_name='nkjppos')}, download_checksums={'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/train.jsonl': {'num_bytes': 24495626, 'checksum': '2b531e4c97c0e9e587780c2cd58bbf0e9a1163fe5c5fcf7617cc50473b5984a9'}, 'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/test.jsonl': {'num_bytes': 2354273, 'checksum': '8917b146b157e3dd6ec531eca9174781e8579f0271040e5256095156abbb3c84'}}, download_size=26849899, post_processing_size=None, dataset_size=24111754, size_in_bytes=50961653)
data/datasets/nkjp_pos/lightning/
1.1.0
auto
AutoModelForTokenClassification
allegro/herbert-large-cased
16
evaluation.json
EvaluationMode.UNIT
4
-100
tokens
false
0.00005
None
LightningLoggingConfig(loggers_names=['wandb'], tracking_project_name='nkjp_pos', wandb_entity='embeddings', wandb_logger_kwargs={})
512
None
last
None
false
allegro/herbert-large-cased
35
AdamW
/embeddings-internal/leaderboard/data/models/lightning/allegro__herbert-large-cased/nkjp_pos/run-2
LightingDataModuleSubset.TEST
None
441
None
pos_tags
pos_tags
0.00001
16
0.00005
AdamW
16
true
50
0
tokens
Finished
ktagowski
1h 4m 49s
-
auto
0.000001
LightningAdvancedConfig(finetune_last_n_layers=4, task_model_kwargs={'adam_epsilon': 1e-06, 'eval_batch_size': 64, 'learning_rate': 0.0005, 'optimizer': 'AdamW', 'train_batch_size': 64, 'use_scheduler': True, 'warmup_steps': 100, 'weight_decay': 0.1}, datamodule_kwargs={'label_all_tokens': False, 'max_seq_length': 512}, task_train_kwargs={'max_epochs': 5, 'devices': 'auto', 'accelerator': 'auto'}, model_config_kwargs={'classifier_dropout': 0.1}, early_stopping_kwargs={'mode': 'min', 'monitor': 'val/Loss', 'patience': 3}, tokenizer_kwargs={}, batch_encoding_kwargs={}, dataloader_kwargs={})
0.1
DatasetInfo(description='NKJP-POS tagging dataset.', citation='', homepage='http://clip.ipipan.waw.pl/NationalCorpusOfPolish', license='', features={'input_ids': Sequence(feature=Value(dtype='int32', id=None), length=-1, id=None), 'token_type_ids': Sequence(feature=Value(dtype='int8', id=None), length=-1, id=None), 'attention_mask': Sequence(feature=Value(dtype='int8', id=None), length=-1, id=None), 'labels': Sequence(feature=ClassLabel(num_classes=35, names=['interp', 'comp', 'pred', 'imps', 'ppas', 'adja', 'aglt', 'interj', 'depr', 'numcol', 'ppron3', 'qub', 'ger', 'winien', 'adj', 'xxx', 'num', 'fin', 'ppron12', 'siebie', 'inf', 'pcon', 'prep', 'praet', 'adjp', 'impt', 'brev', 'pact', 'burk', 'adjc', 'adv', 'bedzie', 'subst', 'conj', 'pant'], id=None), length=-1, id=None)}, post_processed=None, supervised_keys=None, task_templates=None, builder_name='nkjppos', config_name='default', version=1.1.0, splits={'train': SplitInfo(name='train', num_bytes=21995776, num_examples=78219, dataset_name='nkjppos'), 'test': SplitInfo(name='test', num_bytes=2115978, num_examples=7444, dataset_name='nkjppos')}, download_checksums={'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/train.jsonl': {'num_bytes': 24495626, 'checksum': '2b531e4c97c0e9e587780c2cd58bbf0e9a1163fe5c5fcf7617cc50473b5984a9'}, 'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/test.jsonl': {'num_bytes': 2354273, 'checksum': '8917b146b157e3dd6ec531eca9174781e8579f0271040e5256095156abbb3c84'}}, download_size=26849899, post_processing_size=None, dataset_size=24111754, size_in_bytes=50961653)
data/datasets/nkjp_pos/lightning/
1.1.0
auto
AutoModelForTokenClassification
dkleczek/bert-base-polish-uncased-v1
64
evaluation.json
EvaluationMode.UNIT
4
-100
tokens
false
0.0005
None
LightningLoggingConfig(loggers_names=['wandb'], tracking_project_name='nkjp_pos', wandb_entity='embeddings', wandb_logger_kwargs={})
512
None
last
None
false
dkleczek/bert-base-polish-uncased-v1
35
AdamW
/embeddings-internal/leaderboard/data/models/lightning/dkleczek__bert-base-polish-uncased-v1/nkjp_pos/run-3
LightingDataModuleSubset.TEST
None
441
None
pos_tags
pos_tags
0.000001
64
0.0005
AdamW
64
true
100
0.1
tokens
Finished
ktagowski
2h 7m 35s
-
auto
0.0001
LightningAdvancedConfig(finetune_last_n_layers=4, task_model_kwargs={'adam_epsilon': 0.0001, 'eval_batch_size': 32, 'learning_rate': 5e-05, 'optimizer': 'Adam', 'train_batch_size': 32, 'use_scheduler': True, 'warmup_steps': 25, 'weight_decay': 0}, datamodule_kwargs={'label_all_tokens': False, 'max_seq_length': 512}, task_train_kwargs={'max_epochs': 10, 'devices': 'auto', 'accelerator': 'auto'}, model_config_kwargs={'classifier_dropout': 0.2}, early_stopping_kwargs={'mode': 'min', 'monitor': 'val/Loss', 'patience': 3}, tokenizer_kwargs={}, batch_encoding_kwargs={}, dataloader_kwargs={})
0.2
DatasetInfo(description='NKJP-POS tagging dataset.', citation='', homepage='http://clip.ipipan.waw.pl/NationalCorpusOfPolish', license='', features={'input_ids': Sequence(feature=Value(dtype='int32', id=None), length=-1, id=None), 'token_type_ids': Sequence(feature=Value(dtype='int8', id=None), length=-1, id=None), 'attention_mask': Sequence(feature=Value(dtype='int8', id=None), length=-1, id=None), 'labels': Sequence(feature=ClassLabel(num_classes=35, names=['interp', 'comp', 'pred', 'imps', 'ppas', 'adja', 'aglt', 'interj', 'depr', 'numcol', 'ppron3', 'qub', 'ger', 'winien', 'adj', 'xxx', 'num', 'fin', 'ppron12', 'siebie', 'inf', 'pcon', 'prep', 'praet', 'adjp', 'impt', 'brev', 'pact', 'burk', 'adjc', 'adv', 'bedzie', 'subst', 'conj', 'pant'], id=None), length=-1, id=None)}, post_processed=None, supervised_keys=None, task_templates=None, builder_name='nkjppos', config_name='default', version=1.1.0, splits={'train': SplitInfo(name='train', num_bytes=21995776, num_examples=78219, dataset_name='nkjppos'), 'test': SplitInfo(name='test', num_bytes=2115978, num_examples=7444, dataset_name='nkjppos')}, download_checksums={'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/train.jsonl': {'num_bytes': 24495626, 'checksum': '2b531e4c97c0e9e587780c2cd58bbf0e9a1163fe5c5fcf7617cc50473b5984a9'}, 'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/test.jsonl': {'num_bytes': 2354273, 'checksum': '8917b146b157e3dd6ec531eca9174781e8579f0271040e5256095156abbb3c84'}}, download_size=26849899, post_processing_size=None, dataset_size=24111754, size_in_bytes=50961653)
data/datasets/nkjp_pos/lightning/
1.1.0
auto
AutoModelForTokenClassification
allegro/herbert-base-cased
32
evaluation.json
EvaluationMode.UNIT
4
-100
tokens
false
0.00005
None
LightningLoggingConfig(loggers_names=['wandb'], tracking_project_name='nkjp_pos', wandb_entity='embeddings', wandb_logger_kwargs={})
512
None
last
None
false
allegro/herbert-base-cased
35
Adam
/embeddings-internal/leaderboard/data/models/lightning/allegro__herbert-base-cased/nkjp_pos/run-1
LightingDataModuleSubset.TEST
None
441
None
pos_tags
pos_tags
0.0001
32
0.00005
Adam
32
true
25
0
tokens
Finished
ktagowski
2h 5m
-
auto
0.00001
LightningAdvancedConfig(finetune_last_n_layers=4, task_model_kwargs={'adam_epsilon': 1e-05, 'eval_batch_size': 16, 'learning_rate': 5e-05, 'optimizer': 'AdamW', 'train_batch_size': 16, 'use_scheduler': True, 'warmup_steps': 50, 'weight_decay': 0}, datamodule_kwargs={'label_all_tokens': False, 'max_seq_length': 512}, task_train_kwargs={'max_epochs': 5, 'devices': 'auto', 'accelerator': 'auto'}, model_config_kwargs={'classifier_dropout': 0.4}, early_stopping_kwargs={'mode': 'min', 'monitor': 'val/Loss', 'patience': 3}, tokenizer_kwargs={}, batch_encoding_kwargs={}, dataloader_kwargs={})
0.4
DatasetInfo(description='NKJP-POS tagging dataset.', citation='', homepage='http://clip.ipipan.waw.pl/NationalCorpusOfPolish', license='', features={'input_ids': Sequence(feature=Value(dtype='int32', id=None), length=-1, id=None), 'token_type_ids': Sequence(feature=Value(dtype='int8', id=None), length=-1, id=None), 'attention_mask': Sequence(feature=Value(dtype='int8', id=None), length=-1, id=None), 'labels': Sequence(feature=ClassLabel(num_classes=35, names=['interp', 'comp', 'pred', 'imps', 'ppas', 'adja', 'aglt', 'interj', 'depr', 'numcol', 'ppron3', 'qub', 'ger', 'winien', 'adj', 'xxx', 'num', 'fin', 'ppron12', 'siebie', 'inf', 'pcon', 'prep', 'praet', 'adjp', 'impt', 'brev', 'pact', 'burk', 'adjc', 'adv', 'bedzie', 'subst', 'conj', 'pant'], id=None), length=-1, id=None)}, post_processed=None, supervised_keys=None, task_templates=None, builder_name='nkjppos', config_name='default', version=1.1.0, splits={'train': SplitInfo(name='train', num_bytes=21995776, num_examples=78219, dataset_name='nkjppos'), 'test': SplitInfo(name='test', num_bytes=2115978, num_examples=7444, dataset_name='nkjppos')}, download_checksums={'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/train.jsonl': {'num_bytes': 24495626, 'checksum': '2b531e4c97c0e9e587780c2cd58bbf0e9a1163fe5c5fcf7617cc50473b5984a9'}, 'https://huggingface.co/datasets/clarin-pl/nkjp-pos/resolve/main/data/test.jsonl': {'num_bytes': 2354273, 'checksum': '8917b146b157e3dd6ec531eca9174781e8579f0271040e5256095156abbb3c84'}}, download_size=26849899, post_processing_size=None, dataset_size=24111754, size_in_bytes=50961653)
data/datasets/nkjp_pos/lightning/
1.1.0
auto
AutoModelForTokenClassification
allegro/herbert-large-cased
16
evaluation.json
EvaluationMode.UNIT
4
-100
tokens
false
0.00005
None
LightningLoggingConfig(loggers_names=['wandb'], tracking_project_name='nkjp_pos', wandb_entity='embeddings', wandb_logger_kwargs={})
512
None
last
None
false
allegro/herbert-large-cased
35
AdamW
/embeddings-internal/leaderboard/data/models/lightning/allegro__herbert-large-cased/nkjp_pos/run-1
LightingDataModuleSubset.TEST
None
441
None
pos_tags
pos_tags
0.00001
16
0.00005
AdamW
16
true
50
0
tokens
1-20
of 6,380