Spaces:
Running
on
A100
Running
on
A100
| defaults: | |
| - base_pytorch | |
| - _self_ | |
| tasks: [training] | |
| training: | |
| lr: 1e-5 | |
| precision: bf16-mixed | |
| batch_size: 1 | |
| max_epochs: -1 | |
| max_steps: 10000000 | |
| checkpointing: | |
| every_n_train_steps: 2000 | |
| every_n_epochs: null | |
| save_weights_only: true | |
| filename: "latest" | |
| optim: | |
| accumulate_grad_batches: 4 | |
| gradient_clip_val: null | |
| data: | |
| num_workers: 5 # number of CPU threads for data preprocessing. | |
| validation: | |
| precision: bf16-mixed | |
| val_every_n_step: 1000 | |
| val_every_n_epoch: null | |
| batch_size: 1 | |
| limit_batch: 1 | |
| data: | |
| num_workers: 1 # number of CPU threads for data preprocessing, for validation. | |
| test: | |
| precision: bf16-mixed | |
| limit_batch: null | |
| batch_size: 1 | |
| data: | |
| num_workers: 1 # number of CPU threads for data preprocessing, for test. | |
| find_unused_parameters: False |