{ "best_metric": 0.5628694891929626, "best_model_checkpoint": "output_pipe/H3K4me3/origin/checkpoint-800", "epoch": 4.0, "eval_steps": 200, "global_step": 1840, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.21739130434782608, "grad_norm": 9.999856948852539, "learning_rate": 2.92122905027933e-05, "loss": 0.7052, "step": 100 }, { "epoch": 0.43478260869565216, "grad_norm": 6.555872917175293, "learning_rate": 2.753631284916201e-05, "loss": 0.6974, "step": 200 }, { "epoch": 0.43478260869565216, "eval_accuracy": 0.6519021739130435, "eval_f1": 0.6472859020981344, "eval_loss": 0.6252989768981934, "eval_matthews_correlation": 0.2982120567132538, "eval_precision": 0.6509352846293209, "eval_recall": 0.6472989417079502, "eval_runtime": 1.64, "eval_samples_per_second": 2243.962, "eval_steps_per_second": 35.367, "step": 200 }, { "epoch": 0.6521739130434783, "grad_norm": 10.895277976989746, "learning_rate": 2.5860335195530725e-05, "loss": 0.647, "step": 300 }, { "epoch": 0.8695652173913043, "grad_norm": 13.307287216186523, "learning_rate": 2.4184357541899442e-05, "loss": 0.6402, "step": 400 }, { "epoch": 0.8695652173913043, "eval_accuracy": 0.6584239130434782, "eval_f1": 0.6584236860388981, "eval_loss": 0.6169613003730774, "eval_matthews_correlation": 0.3220566655224521, "eval_precision": 0.6610448792984156, "eval_recall": 0.6610117879241085, "eval_runtime": 1.6414, "eval_samples_per_second": 2242.015, "eval_steps_per_second": 35.336, "step": 400 }, { "epoch": 1.0869565217391304, "grad_norm": 9.527493476867676, "learning_rate": 2.2508379888268156e-05, "loss": 0.5937, "step": 500 }, { "epoch": 1.3043478260869565, "grad_norm": 21.95737648010254, "learning_rate": 2.0832402234636874e-05, "loss": 0.5398, "step": 600 }, { "epoch": 1.3043478260869565, "eval_accuracy": 0.6809782608695653, "eval_f1": 0.6806272489346898, "eval_loss": 0.6053802371025085, "eval_matthews_correlation": 0.37370172922502976, "eval_precision": 0.6880450607585084, "eval_recall": 0.6856642523106775, "eval_runtime": 1.652, "eval_samples_per_second": 2227.623, "eval_steps_per_second": 35.109, "step": 600 }, { "epoch": 1.5217391304347827, "grad_norm": 17.107023239135742, "learning_rate": 1.9173184357541898e-05, "loss": 0.5213, "step": 700 }, { "epoch": 1.7391304347826086, "grad_norm": 12.411290168762207, "learning_rate": 1.7497206703910616e-05, "loss": 0.513, "step": 800 }, { "epoch": 1.7391304347826086, "eval_accuracy": 0.7048913043478261, "eval_f1": 0.7045338405632524, "eval_loss": 0.5628694891929626, "eval_matthews_correlation": 0.4101109337743351, "eval_precision": 0.7046674488480548, "eval_recall": 0.7054442205488696, "eval_runtime": 1.6506, "eval_samples_per_second": 2229.501, "eval_steps_per_second": 35.139, "step": 800 }, { "epoch": 1.9565217391304348, "grad_norm": 11.334113121032715, "learning_rate": 1.582122905027933e-05, "loss": 0.4965, "step": 900 }, { "epoch": 2.1739130434782608, "grad_norm": 28.086755752563477, "learning_rate": 1.4145251396648046e-05, "loss": 0.3209, "step": 1000 }, { "epoch": 2.1739130434782608, "eval_accuracy": 0.7029891304347826, "eval_f1": 0.7023614089231047, "eval_loss": 0.7348151206970215, "eval_matthews_correlation": 0.40508519181609787, "eval_precision": 0.7022438526861932, "eval_recall": 0.7028417804165564, "eval_runtime": 1.6525, "eval_samples_per_second": 2226.972, "eval_steps_per_second": 35.099, "step": 1000 }, { "epoch": 2.391304347826087, "grad_norm": 21.236024856567383, "learning_rate": 1.246927374301676e-05, "loss": 0.2459, "step": 1100 }, { "epoch": 2.608695652173913, "grad_norm": 27.03154754638672, "learning_rate": 1.0793296089385476e-05, "loss": 0.2465, "step": 1200 }, { "epoch": 2.608695652173913, "eval_accuracy": 0.7266304347826087, "eval_f1": 0.7261754894636794, "eval_loss": 0.6555567383766174, "eval_matthews_correlation": 0.45300551506446013, "eval_precision": 0.7261108931112572, "eval_recall": 0.726895301078929, "eval_runtime": 1.6486, "eval_samples_per_second": 2232.252, "eval_steps_per_second": 35.182, "step": 1200 }, { "epoch": 2.8260869565217392, "grad_norm": 24.729053497314453, "learning_rate": 9.117318435754191e-06, "loss": 0.2336, "step": 1300 }, { "epoch": 3.0434782608695654, "grad_norm": 8.527237892150879, "learning_rate": 7.441340782122905e-06, "loss": 0.1989, "step": 1400 }, { "epoch": 3.0434782608695654, "eval_accuracy": 0.7502717391304348, "eval_f1": 0.7498163710812544, "eval_loss": 0.9599674344062805, "eval_matthews_correlation": 0.5001928701951829, "eval_precision": 0.7496841522913477, "eval_recall": 0.7505093986723612, "eval_runtime": 1.6491, "eval_samples_per_second": 2231.585, "eval_steps_per_second": 35.172, "step": 1400 }, { "epoch": 3.260869565217391, "grad_norm": 1.4311695098876953, "learning_rate": 5.76536312849162e-06, "loss": 0.0516, "step": 1500 }, { "epoch": 3.4782608695652173, "grad_norm": 25.26365089416504, "learning_rate": 4.106145251396648e-06, "loss": 0.0524, "step": 1600 }, { "epoch": 3.4782608695652173, "eval_accuracy": 0.7529891304347827, "eval_f1": 0.7529298550551656, "eval_loss": 1.589869737625122, "eval_matthews_correlation": 0.5091195396887124, "eval_precision": 0.7541927197975609, "eval_recall": 0.7549273499052958, "eval_runtime": 1.6464, "eval_samples_per_second": 2235.204, "eval_steps_per_second": 35.229, "step": 1600 }, { "epoch": 3.6956521739130435, "grad_norm": 26.048221588134766, "learning_rate": 2.430167597765363e-06, "loss": 0.0506, "step": 1700 }, { "epoch": 3.9130434782608696, "grad_norm": 32.529476165771484, "learning_rate": 7.541899441340783e-07, "loss": 0.0413, "step": 1800 }, { "epoch": 3.9130434782608696, "eval_accuracy": 0.748641304347826, "eval_f1": 0.7474285608287964, "eval_loss": 1.434490442276001, "eval_matthews_correlation": 0.494938242187782, "eval_precision": 0.7477221063315149, "eval_recall": 0.7472163942164571, "eval_runtime": 1.6473, "eval_samples_per_second": 2233.905, "eval_steps_per_second": 35.208, "step": 1800 }, { "epoch": 4.0, "step": 1840, "total_flos": 9283152131334144.0, "train_loss": 0.37002268653848897, "train_runtime": 187.7318, "train_samples_per_second": 627.257, "train_steps_per_second": 9.801 } ], "logging_steps": 100, "max_steps": 1840, "num_input_tokens_seen": 0, "num_train_epochs": 4, "save_steps": 200, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 9283152131334144.0, "train_batch_size": 64, "trial_name": null, "trial_params": null }