SodaXII's picture
Training in progress, epoch 14
0ad60b2 verified
{
"best_metric": 0.012183231301605701,
"best_model_checkpoint": "./drive/Shareddrives/CS198-Drones/training_output/dinov2-base_rice-leaf-disease-augmented_fft_012825/checkpoint-2000",
"epoch": 12.0,
"eval_steps": 500,
"global_step": 3000,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"grad_norm": 46.693111419677734,
"learning_rate": 5e-06,
"loss": 0.8384,
"step": 250
},
{
"epoch": 1.0,
"eval_accuracy": 0.931,
"eval_loss": 0.20420736074447632,
"eval_runtime": 105.5728,
"eval_samples_per_second": 18.944,
"eval_steps_per_second": 0.303,
"step": 250
},
{
"epoch": 2.0,
"grad_norm": 40.63591003417969,
"learning_rate": 1e-05,
"loss": 0.1037,
"step": 500
},
{
"epoch": 2.0,
"eval_accuracy": 0.96,
"eval_loss": 0.12901116907596588,
"eval_runtime": 103.7804,
"eval_samples_per_second": 19.271,
"eval_steps_per_second": 0.308,
"step": 500
},
{
"epoch": 3.0,
"grad_norm": 13.294111251831055,
"learning_rate": 9.444444444444445e-06,
"loss": 0.0574,
"step": 750
},
{
"epoch": 3.0,
"eval_accuracy": 0.977,
"eval_loss": 0.06572597473859787,
"eval_runtime": 106.4096,
"eval_samples_per_second": 18.795,
"eval_steps_per_second": 0.301,
"step": 750
},
{
"epoch": 4.0,
"grad_norm": 20.432308197021484,
"learning_rate": 8.888888888888888e-06,
"loss": 0.0255,
"step": 1000
},
{
"epoch": 4.0,
"eval_accuracy": 0.985,
"eval_loss": 0.05270255357027054,
"eval_runtime": 104.4225,
"eval_samples_per_second": 19.153,
"eval_steps_per_second": 0.306,
"step": 1000
},
{
"epoch": 5.0,
"grad_norm": 11.204561233520508,
"learning_rate": 8.333333333333334e-06,
"loss": 0.0096,
"step": 1250
},
{
"epoch": 5.0,
"eval_accuracy": 0.988,
"eval_loss": 0.03742993623018265,
"eval_runtime": 103.3751,
"eval_samples_per_second": 19.347,
"eval_steps_per_second": 0.31,
"step": 1250
},
{
"epoch": 6.0,
"grad_norm": 0.008258991874754429,
"learning_rate": 6.666666666666667e-06,
"loss": 0.0052,
"step": 1500
},
{
"epoch": 6.0,
"eval_accuracy": 0.997,
"eval_loss": 0.012767890468239784,
"eval_runtime": 109.714,
"eval_samples_per_second": 18.229,
"eval_steps_per_second": 0.292,
"step": 1500
},
{
"epoch": 7.0,
"grad_norm": 0.023719610646367073,
"learning_rate": 5.925925925925926e-06,
"loss": 0.0018,
"step": 1750
},
{
"epoch": 7.0,
"eval_accuracy": 0.9945,
"eval_loss": 0.013132033869624138,
"eval_runtime": 108.5519,
"eval_samples_per_second": 18.424,
"eval_steps_per_second": 0.295,
"step": 1750
},
{
"epoch": 8.0,
"grad_norm": 0.1996152102947235,
"learning_rate": 5.185185185185185e-06,
"loss": 0.0027,
"step": 2000
},
{
"epoch": 8.0,
"eval_accuracy": 0.997,
"eval_loss": 0.012183231301605701,
"eval_runtime": 107.9106,
"eval_samples_per_second": 18.534,
"eval_steps_per_second": 0.297,
"step": 2000
},
{
"epoch": 9.0,
"grad_norm": 0.008068982511758804,
"learning_rate": 4.444444444444444e-06,
"loss": 0.0004,
"step": 2250
},
{
"epoch": 9.0,
"eval_accuracy": 0.997,
"eval_loss": 0.015290269628167152,
"eval_runtime": 108.9225,
"eval_samples_per_second": 18.362,
"eval_steps_per_second": 0.294,
"step": 2250
},
{
"epoch": 10.0,
"grad_norm": 0.0013503103982657194,
"learning_rate": 3.7037037037037037e-06,
"loss": 0.0013,
"step": 2500
},
{
"epoch": 10.0,
"eval_accuracy": 0.997,
"eval_loss": 0.012768927030265331,
"eval_runtime": 107.1659,
"eval_samples_per_second": 18.663,
"eval_steps_per_second": 0.299,
"step": 2500
},
{
"epoch": 11.0,
"grad_norm": 0.0178547166287899,
"learning_rate": 2.962962962962963e-06,
"loss": 0.0004,
"step": 2750
},
{
"epoch": 11.0,
"eval_accuracy": 0.9965,
"eval_loss": 0.014693325385451317,
"eval_runtime": 116.2834,
"eval_samples_per_second": 17.199,
"eval_steps_per_second": 0.275,
"step": 2750
},
{
"epoch": 12.0,
"grad_norm": 0.0006140907644294202,
"learning_rate": 2.222222222222222e-06,
"loss": 0.0004,
"step": 3000
},
{
"epoch": 12.0,
"eval_accuracy": 0.997,
"eval_loss": 0.015538069419562817,
"eval_runtime": 106.5951,
"eval_samples_per_second": 18.763,
"eval_steps_per_second": 0.3,
"step": 3000
}
],
"logging_steps": 500,
"max_steps": 3750,
"num_input_tokens_seen": 0,
"num_train_epochs": 15,
"save_steps": 500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": false
},
"attributes": {}
}
},
"total_flos": 1.5015902268358656e+19,
"train_batch_size": 64,
"trial_name": null,
"trial_params": null
}