{ "best_global_step": 1749, "best_metric": 0.959008487654321, "best_model_checkpoint": "dinov2-base-finetuned-clothes-big/checkpoint-1749", "epoch": 3.0, "eval_steps": 500, "global_step": 1749, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.08576329331046312, "learning_rate": 1.4000000000000001e-05, "loss": 1.3651, "step": 50 }, { "epoch": 0.17152658662092624, "learning_rate": 2.8285714285714287e-05, "loss": 0.4913, "step": 100 }, { "epoch": 0.25728987993138935, "learning_rate": 4.257142857142857e-05, "loss": 0.4551, "step": 150 }, { "epoch": 0.34305317324185247, "learning_rate": 4.923761118170267e-05, "loss": 0.4288, "step": 200 }, { "epoch": 0.4288164665523156, "learning_rate": 4.764930114358323e-05, "loss": 0.4145, "step": 250 }, { "epoch": 0.5145797598627787, "learning_rate": 4.606099110546379e-05, "loss": 0.3938, "step": 300 }, { "epoch": 0.6003430531732419, "learning_rate": 4.4472681067344344e-05, "loss": 0.3559, "step": 350 }, { "epoch": 0.6861063464837049, "learning_rate": 4.2884371029224906e-05, "loss": 0.3624, "step": 400 }, { "epoch": 0.7718696397941681, "learning_rate": 4.129606099110547e-05, "loss": 0.3382, "step": 450 }, { "epoch": 0.8576329331046312, "learning_rate": 3.9707750952986025e-05, "loss": 0.322, "step": 500 }, { "epoch": 0.9433962264150944, "learning_rate": 3.811944091486658e-05, "loss": 0.3022, "step": 550 }, { "epoch": 1.0, "eval_accuracy": 0.9210069444444444, "eval_loss": 0.23223502933979034, "eval_runtime": 29.8019, "eval_samples_per_second": 352.662, "eval_steps_per_second": 2.45, "step": 583 }, { "epoch": 1.0291595197255574, "learning_rate": 3.653113087674714e-05, "loss": 0.3261, "step": 600 }, { "epoch": 1.1149228130360207, "learning_rate": 3.4942820838627705e-05, "loss": 0.2997, "step": 650 }, { "epoch": 1.2006861063464838, "learning_rate": 3.335451080050826e-05, "loss": 0.2866, "step": 700 }, { "epoch": 1.2864493996569468, "learning_rate": 3.176620076238882e-05, "loss": 0.2809, "step": 750 }, { "epoch": 1.3722126929674099, "learning_rate": 3.017789072426938e-05, "loss": 0.2919, "step": 800 }, { "epoch": 1.457975986277873, "learning_rate": 2.8589580686149935e-05, "loss": 0.2543, "step": 850 }, { "epoch": 1.5437392795883362, "learning_rate": 2.7001270648030498e-05, "loss": 0.2744, "step": 900 }, { "epoch": 1.6295025728987993, "learning_rate": 2.5412960609911057e-05, "loss": 0.269, "step": 950 }, { "epoch": 1.7152658662092626, "learning_rate": 2.3824650571791616e-05, "loss": 0.2489, "step": 1000 }, { "epoch": 1.8010291595197256, "learning_rate": 2.2236340533672172e-05, "loss": 0.2608, "step": 1050 }, { "epoch": 1.8867924528301887, "learning_rate": 2.0648030495552734e-05, "loss": 0.2424, "step": 1100 }, { "epoch": 1.9725557461406518, "learning_rate": 1.905972045743329e-05, "loss": 0.2158, "step": 1150 }, { "epoch": 2.0, "eval_accuracy": 0.9501350308641975, "eval_loss": 0.15389321744441986, "eval_runtime": 29.6932, "eval_samples_per_second": 353.953, "eval_steps_per_second": 2.458, "step": 1166 }, { "epoch": 2.058319039451115, "learning_rate": 1.7471410419313853e-05, "loss": 0.234, "step": 1200 }, { "epoch": 2.144082332761578, "learning_rate": 1.588310038119441e-05, "loss": 0.2244, "step": 1250 }, { "epoch": 2.2298456260720414, "learning_rate": 1.4294790343074968e-05, "loss": 0.197, "step": 1300 }, { "epoch": 2.3156089193825045, "learning_rate": 1.2706480304955528e-05, "loss": 0.2182, "step": 1350 }, { "epoch": 2.4013722126929675, "learning_rate": 1.1118170266836086e-05, "loss": 0.2031, "step": 1400 }, { "epoch": 2.4871355060034306, "learning_rate": 9.529860228716645e-06, "loss": 0.2005, "step": 1450 }, { "epoch": 2.5728987993138936, "learning_rate": 7.941550190597204e-06, "loss": 0.197, "step": 1500 }, { "epoch": 2.6586620926243567, "learning_rate": 6.353240152477764e-06, "loss": 0.1859, "step": 1550 }, { "epoch": 2.7444253859348198, "learning_rate": 4.7649301143583225e-06, "loss": 0.1788, "step": 1600 }, { "epoch": 2.830188679245283, "learning_rate": 3.176620076238882e-06, "loss": 0.18, "step": 1650 }, { "epoch": 2.915951972555746, "learning_rate": 1.588310038119441e-06, "loss": 0.1767, "step": 1700 }, { "epoch": 3.0, "eval_accuracy": 0.959008487654321, "eval_loss": 0.1260276585817337, "eval_runtime": 29.5902, "eval_samples_per_second": 355.185, "eval_steps_per_second": 2.467, "step": 1749 }, { "epoch": 3.0, "step": 1749, "total_flos": 2.573186038429542e+19, "train_loss": 0.3105868404425506, "train_runtime": 1894.2785, "train_samples_per_second": 133.159, "train_steps_per_second": 0.923 } ], "logging_steps": 50, "max_steps": 1749, "num_input_tokens_seen": 0, "num_train_epochs": 3, "save_steps": 500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 2.573186038429542e+19, "train_batch_size": 144, "trial_name": null, "trial_params": null }