{
  "training_parameters": {
    "num_train_epochs": 5,
    "per_device_train_batch_size": 8,
    "per_device_eval_batch_size": 8,
    "gradient_accumulation_steps": 4,
    "learning_rate": 3e-5,
    "warmup_ratio": 0.1,
    "weight_decay": 0.01,
    "adam_beta1": 0.9,
    "adam_beta2": 0.999,
    "adam_epsilon": 1e-8,
    "max_grad_norm": 1.0,
    "label_smoothing": 0.1
  },
  "optimization": {
    "mixed_precision": "fp16",
    "gradient_checkpointing": true,
    "kernel_fusion": true,
    "dynamic_padding": true
  },
  "logging": {
    "logging_steps": 100,
    "save_steps": 500,
    "eval_steps": 500,
    "save_strategy": "epoch",
    "evaluation_strategy": "epoch"
  }
}