| model_name_or_path: facebook/opt-125m | |
| config_name: None | |
| tokenizer_name: None | |
| use_slow_tokenizer: False | |
| per_device_train_batch_size: 32 | |
| per_device_eval_batch_size: 32 | |
| learning_rate: 5e-05 | |
| weight_decay: 0.1 | |
| num_train_epochs: 5 | |
| patience: 100 | |
| max_train_steps: None | |
| gradient_accumulation_steps: 1 | |
| lr_scheduler_type: SchedulerType.LINEAR | |
| num_warmup_steps: 0 | |
| output_dir: opt_125m_squad_decay_0.1 | |
| seed: None | |
| finetune_type: vanilla | |
| beta: 0.1 | |
| model_type: None | |
| max_seq_length: 384 | |
| max_context_length: 600 | |
| num_beams: 1 | |
| preprocessing_num_workers: 16 | |
| overwrite_cache: False | |
| no_keep_linebreaks: False | |
| push_to_hub: False | |
| hub_model_id: None | |
| hub_token: None | |
| checkpointing_steps: epoch | |
| resume_from_checkpoint: None | |
| with_tracking: False | |
| local_rank: -1 | |