| base_model: facebook/opt-125m | |
| batch_size: 128 | |
| bf16: true | |
| chat_template: tokenizer_default_fallback_alpaca | |
| datasets: | |
| - format: custom | |
| path: https://gradients.s3.eu-north-1.amazonaws.com/7575a7e5b38479e3_train_data.json?X-Amz-Algorithm=AWS4-HMAC-SHA256&X-Amz-Credential=AKIAVVZOOA7SA4UOFLPI%2F20250209%2Feu-north-1%2Fs3%2Faws4_request&X-Amz-Date=20250209T024133Z&X-Amz-Expires=604800&X-Amz-SignedHeaders=host&X-Amz-Signature=5b334fbc5cfa88197315bf2cd74f2114e46bdb6bf8716ba3c96b73b8c3e6ef9a | |
| type: | |
| field_instruction: instruction | |
| field_output: output | |
| format: '{instruction}' | |
| no_input_format: '{instruction}' | |
| system_format: '{system}' | |
| system_prompt: '' | |
| device_map: auto | |
| eval_sample_packing: false | |
| eval_steps: 40 | |
| flash_attention: true | |
| gradient_checkpointing: true | |
| group_by_length: true | |
| hub_model_id: SystemAdmin123/d778c1e6-0d20-4dd2-81e1-efc24a74b590 | |
| hub_strategy: checkpoint | |
| learning_rate: 0.0002 | |
| logging_steps: 10 | |
| lr_scheduler: cosine | |
| max_steps: 10000 | |
| micro_batch_size: 32 | |
| model_type: AutoModelForCausalLM | |
| num_epochs: 100 | |
| optimizer: adamw_bnb_8bit | |
| output_dir: /root/.sn56/axolotl/tmp/d778c1e6-0d20-4dd2-81e1-efc24a74b590 | |
| pad_to_sequence_len: true | |
| resize_token_embeddings_to_32x: false | |
| sample_packing: true | |
| save_steps: 40 | |
| save_total_limit: 2 | |
| sequence_len: 2048 | |
| tokenizer_type: GPT2TokenizerFast | |
| torch_dtype: bf16 | |
| training_args_kwargs: | |
| hub_private_repo: true | |
| trust_remote_code: true | |
| val_set_size: 0.1 | |
| wandb_entity: '' | |
| wandb_mode: online | |
| wandb_name: facebook/opt-125m-https://gradients.s3.eu-north-1.amazonaws.com/7575a7e5b38479e3_train_data.json?X-Amz-Algorithm=AWS4-HMAC-SHA256&X-Amz-Credential=AKIAVVZOOA7SA4UOFLPI%2F20250209%2Feu-north-1%2Fs3%2Faws4_request&X-Amz-Date=20250209T024133Z&X-Amz-Expires=604800&X-Amz-SignedHeaders=host&X-Amz-Signature=5b334fbc5cfa88197315bf2cd74f2114e46bdb6bf8716ba3c96b73b8c3e6ef9a | |
| wandb_project: Gradients-On-Demand | |
| wandb_run: your_name | |
| wandb_runid: default | |
| warmup_ratio: 0.05 | |