_attn_implementation_autoset
accelerator_config.even_batches
accelerator_config.non_blocking
accelerator_config.split_batches
accelerator_config.use_seedable_sampler
attention_probs_dropout_prob
auto_map.AutoModelForMaskedLM
auto_map.AutoModelForMultipleChoice
auto_map.AutoModelForQuestionAnswering
auto_map.AutoModelForSequenceClassification
auto_map.AutoModelForTokenClassification
average_tokens_across_devices
data.cache_options.batch_size
data.cache_options.num_shard_groups
data.cache_options.prefetch_per_group
data.cache_options.shard_order_randomization_key
data.cache_options.target_size_per_flush
data.configs.SlimPajama-627B.cache_dir
data.configs.SlimPajama-627B.plaintext
data.configs.SlimPajama-627B.stream
data.configs.SlimPajama-627B.tags
data.configs.SlimPajama-627B.text_key
data.configs.SlimPajama-627B.train_urls
data.configs.SlimPajama-627B.validation_urls
data.configs.SlimPajama-6B.cache_dir
data.configs.SlimPajama-6B.plaintext
data.configs.SlimPajama-6B.stream
data.configs.SlimPajama-6B.tags