| { | |
| "best_metric": 0.012183231301605701, | |
| "best_model_checkpoint": "./drive/Shareddrives/CS198-Drones/training_output/dinov2-base_rice-leaf-disease-augmented_fft_012825/checkpoint-2000", | |
| "epoch": 12.0, | |
| "eval_steps": 500, | |
| "global_step": 3000, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 1.0, | |
| "grad_norm": 46.693111419677734, | |
| "learning_rate": 5e-06, | |
| "loss": 0.8384, | |
| "step": 250 | |
| }, | |
| { | |
| "epoch": 1.0, | |
| "eval_accuracy": 0.931, | |
| "eval_loss": 0.20420736074447632, | |
| "eval_runtime": 105.5728, | |
| "eval_samples_per_second": 18.944, | |
| "eval_steps_per_second": 0.303, | |
| "step": 250 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "grad_norm": 40.63591003417969, | |
| "learning_rate": 1e-05, | |
| "loss": 0.1037, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "eval_accuracy": 0.96, | |
| "eval_loss": 0.12901116907596588, | |
| "eval_runtime": 103.7804, | |
| "eval_samples_per_second": 19.271, | |
| "eval_steps_per_second": 0.308, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "grad_norm": 13.294111251831055, | |
| "learning_rate": 9.444444444444445e-06, | |
| "loss": 0.0574, | |
| "step": 750 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "eval_accuracy": 0.977, | |
| "eval_loss": 0.06572597473859787, | |
| "eval_runtime": 106.4096, | |
| "eval_samples_per_second": 18.795, | |
| "eval_steps_per_second": 0.301, | |
| "step": 750 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "grad_norm": 20.432308197021484, | |
| "learning_rate": 8.888888888888888e-06, | |
| "loss": 0.0255, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "eval_accuracy": 0.985, | |
| "eval_loss": 0.05270255357027054, | |
| "eval_runtime": 104.4225, | |
| "eval_samples_per_second": 19.153, | |
| "eval_steps_per_second": 0.306, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "grad_norm": 11.204561233520508, | |
| "learning_rate": 8.333333333333334e-06, | |
| "loss": 0.0096, | |
| "step": 1250 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "eval_accuracy": 0.988, | |
| "eval_loss": 0.03742993623018265, | |
| "eval_runtime": 103.3751, | |
| "eval_samples_per_second": 19.347, | |
| "eval_steps_per_second": 0.31, | |
| "step": 1250 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "grad_norm": 0.008258991874754429, | |
| "learning_rate": 6.666666666666667e-06, | |
| "loss": 0.0052, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "eval_accuracy": 0.997, | |
| "eval_loss": 0.012767890468239784, | |
| "eval_runtime": 109.714, | |
| "eval_samples_per_second": 18.229, | |
| "eval_steps_per_second": 0.292, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "grad_norm": 0.023719610646367073, | |
| "learning_rate": 5.925925925925926e-06, | |
| "loss": 0.0018, | |
| "step": 1750 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "eval_accuracy": 0.9945, | |
| "eval_loss": 0.013132033869624138, | |
| "eval_runtime": 108.5519, | |
| "eval_samples_per_second": 18.424, | |
| "eval_steps_per_second": 0.295, | |
| "step": 1750 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "grad_norm": 0.1996152102947235, | |
| "learning_rate": 5.185185185185185e-06, | |
| "loss": 0.0027, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "eval_accuracy": 0.997, | |
| "eval_loss": 0.012183231301605701, | |
| "eval_runtime": 107.9106, | |
| "eval_samples_per_second": 18.534, | |
| "eval_steps_per_second": 0.297, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "grad_norm": 0.008068982511758804, | |
| "learning_rate": 4.444444444444444e-06, | |
| "loss": 0.0004, | |
| "step": 2250 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "eval_accuracy": 0.997, | |
| "eval_loss": 0.015290269628167152, | |
| "eval_runtime": 108.9225, | |
| "eval_samples_per_second": 18.362, | |
| "eval_steps_per_second": 0.294, | |
| "step": 2250 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "grad_norm": 0.0013503103982657194, | |
| "learning_rate": 3.7037037037037037e-06, | |
| "loss": 0.0013, | |
| "step": 2500 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "eval_accuracy": 0.997, | |
| "eval_loss": 0.012768927030265331, | |
| "eval_runtime": 107.1659, | |
| "eval_samples_per_second": 18.663, | |
| "eval_steps_per_second": 0.299, | |
| "step": 2500 | |
| }, | |
| { | |
| "epoch": 11.0, | |
| "grad_norm": 0.0178547166287899, | |
| "learning_rate": 2.962962962962963e-06, | |
| "loss": 0.0004, | |
| "step": 2750 | |
| }, | |
| { | |
| "epoch": 11.0, | |
| "eval_accuracy": 0.9965, | |
| "eval_loss": 0.014693325385451317, | |
| "eval_runtime": 116.2834, | |
| "eval_samples_per_second": 17.199, | |
| "eval_steps_per_second": 0.275, | |
| "step": 2750 | |
| }, | |
| { | |
| "epoch": 12.0, | |
| "grad_norm": 0.0006140907644294202, | |
| "learning_rate": 2.222222222222222e-06, | |
| "loss": 0.0004, | |
| "step": 3000 | |
| }, | |
| { | |
| "epoch": 12.0, | |
| "eval_accuracy": 0.997, | |
| "eval_loss": 0.015538069419562817, | |
| "eval_runtime": 106.5951, | |
| "eval_samples_per_second": 18.763, | |
| "eval_steps_per_second": 0.3, | |
| "step": 3000 | |
| } | |
| ], | |
| "logging_steps": 500, | |
| "max_steps": 3750, | |
| "num_input_tokens_seen": 0, | |
| "num_train_epochs": 15, | |
| "save_steps": 500, | |
| "stateful_callbacks": { | |
| "TrainerControl": { | |
| "args": { | |
| "should_epoch_stop": false, | |
| "should_evaluate": false, | |
| "should_log": false, | |
| "should_save": true, | |
| "should_training_stop": false | |
| }, | |
| "attributes": {} | |
| } | |
| }, | |
| "total_flos": 1.5015902268358656e+19, | |
| "train_batch_size": 64, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |