|
{ |
|
"best_metric": 0.23172695934772491, |
|
"best_model_checkpoint": "output/dnabert2/checkpoint-800", |
|
"epoch": 4.751619870410368, |
|
"global_step": 2200, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.22, |
|
"learning_rate": 2.9350993377483443e-05, |
|
"loss": 0.4605, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 0.43, |
|
"learning_rate": 2.8026490066225165e-05, |
|
"loss": 0.3215, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 0.43, |
|
"eval_accuracy": 0.8912925905895078, |
|
"eval_f1": 0.8889597986481533, |
|
"eval_loss": 0.31392547488212585, |
|
"eval_matthews_correlation": 0.77967969546277, |
|
"eval_precision": 0.8934182790168708, |
|
"eval_recall": 0.8862939649347417, |
|
"eval_runtime": 62.2861, |
|
"eval_samples_per_second": 29.686, |
|
"eval_steps_per_second": 0.466, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 0.65, |
|
"learning_rate": 2.6701986754966888e-05, |
|
"loss": 0.2989, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 0.86, |
|
"learning_rate": 2.537748344370861e-05, |
|
"loss": 0.257, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 0.86, |
|
"eval_accuracy": 0.9064359113034073, |
|
"eval_f1": 0.9045485484159261, |
|
"eval_loss": 0.25544461607933044, |
|
"eval_matthews_correlation": 0.8104176298356943, |
|
"eval_precision": 0.9083037444483227, |
|
"eval_recall": 0.9021373448557914, |
|
"eval_runtime": 13.8982, |
|
"eval_samples_per_second": 133.038, |
|
"eval_steps_per_second": 2.087, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 1.08, |
|
"learning_rate": 2.4052980132450332e-05, |
|
"loss": 0.2309, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 1.3, |
|
"learning_rate": 2.272847682119205e-05, |
|
"loss": 0.1856, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 1.3, |
|
"eval_accuracy": 0.916170903190914, |
|
"eval_f1": 0.915332450010266, |
|
"eval_loss": 0.26646658778190613, |
|
"eval_matthews_correlation": 0.8310628286957625, |
|
"eval_precision": 0.9143132069512503, |
|
"eval_recall": 0.9167532036464074, |
|
"eval_runtime": 13.924, |
|
"eval_samples_per_second": 132.792, |
|
"eval_steps_per_second": 2.083, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 1.51, |
|
"learning_rate": 2.141721854304636e-05, |
|
"loss": 0.2026, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 1.73, |
|
"learning_rate": 2.0092715231788082e-05, |
|
"loss": 0.1838, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 1.73, |
|
"eval_accuracy": 0.9167117360735533, |
|
"eval_f1": 0.9161963590301421, |
|
"eval_loss": 0.23172695934772491, |
|
"eval_matthews_correlation": 0.8347581669464483, |
|
"eval_precision": 0.9150315305811474, |
|
"eval_recall": 0.919739914885546, |
|
"eval_runtime": 13.8871, |
|
"eval_samples_per_second": 133.145, |
|
"eval_steps_per_second": 2.088, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 1.94, |
|
"learning_rate": 1.8768211920529804e-05, |
|
"loss": 0.1709, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 2.16, |
|
"learning_rate": 1.7443708609271526e-05, |
|
"loss": 0.1294, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 2.16, |
|
"eval_accuracy": 0.9215792320173066, |
|
"eval_f1": 0.9202124731082957, |
|
"eval_loss": 0.30326515436172485, |
|
"eval_matthews_correlation": 0.8409598313352707, |
|
"eval_precision": 0.922362176282312, |
|
"eval_recall": 0.918606043363325, |
|
"eval_runtime": 13.8906, |
|
"eval_samples_per_second": 133.112, |
|
"eval_steps_per_second": 2.088, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 2.38, |
|
"learning_rate": 1.6119205298013245e-05, |
|
"loss": 0.1035, |
|
"step": 1100 |
|
}, |
|
{ |
|
"epoch": 2.59, |
|
"learning_rate": 1.4794701986754966e-05, |
|
"loss": 0.0985, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 2.59, |
|
"eval_accuracy": 0.9318550567874527, |
|
"eval_f1": 0.9310236405107544, |
|
"eval_loss": 0.2722685933113098, |
|
"eval_matthews_correlation": 0.8620829631411653, |
|
"eval_precision": 0.9306271696202292, |
|
"eval_recall": 0.9314561921358038, |
|
"eval_runtime": 13.8974, |
|
"eval_samples_per_second": 133.047, |
|
"eval_steps_per_second": 2.087, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 2.81, |
|
"learning_rate": 1.3470198675496688e-05, |
|
"loss": 0.1197, |
|
"step": 1300 |
|
}, |
|
{ |
|
"epoch": 3.02, |
|
"learning_rate": 1.2145695364238412e-05, |
|
"loss": 0.0996, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 3.02, |
|
"eval_accuracy": 0.9307733910221742, |
|
"eval_f1": 0.9295971062088004, |
|
"eval_loss": 0.25412517786026, |
|
"eval_matthews_correlation": 0.8596347250275603, |
|
"eval_precision": 0.9315324336402677, |
|
"eval_recall": 0.9281091077207582, |
|
"eval_runtime": 13.861, |
|
"eval_samples_per_second": 133.396, |
|
"eval_steps_per_second": 2.092, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 3.24, |
|
"learning_rate": 1.0821192052980133e-05, |
|
"loss": 0.0648, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 3.46, |
|
"learning_rate": 9.509933774834438e-06, |
|
"loss": 0.0606, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 3.46, |
|
"eval_accuracy": 0.9378042184964845, |
|
"eval_f1": 0.9368778062265761, |
|
"eval_loss": 0.28330132365226746, |
|
"eval_matthews_correlation": 0.8738509274469478, |
|
"eval_precision": 0.9376815542111061, |
|
"eval_recall": 0.9361706793745628, |
|
"eval_runtime": 13.8639, |
|
"eval_samples_per_second": 133.367, |
|
"eval_steps_per_second": 2.092, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 3.67, |
|
"learning_rate": 8.185430463576158e-06, |
|
"loss": 0.0428, |
|
"step": 1700 |
|
}, |
|
{ |
|
"epoch": 3.89, |
|
"learning_rate": 6.8609271523178805e-06, |
|
"loss": 0.0498, |
|
"step": 1800 |
|
}, |
|
{ |
|
"epoch": 3.89, |
|
"eval_accuracy": 0.9378042184964845, |
|
"eval_f1": 0.9367918681230483, |
|
"eval_loss": 0.29408514499664307, |
|
"eval_matthews_correlation": 0.8738828807254423, |
|
"eval_precision": 0.9383419948746582, |
|
"eval_recall": 0.9355453607880793, |
|
"eval_runtime": 13.8855, |
|
"eval_samples_per_second": 133.161, |
|
"eval_steps_per_second": 2.089, |
|
"step": 1800 |
|
}, |
|
{ |
|
"epoch": 4.1, |
|
"learning_rate": 5.536423841059603e-06, |
|
"loss": 0.0431, |
|
"step": 1900 |
|
}, |
|
{ |
|
"epoch": 4.32, |
|
"learning_rate": 4.211920529801325e-06, |
|
"loss": 0.0192, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 4.32, |
|
"eval_accuracy": 0.9405083829096809, |
|
"eval_f1": 0.9395484397142884, |
|
"eval_loss": 0.29439404606819153, |
|
"eval_matthews_correlation": 0.8793713183376617, |
|
"eval_precision": 0.9410276655328202, |
|
"eval_recall": 0.9383477364059888, |
|
"eval_runtime": 38.3587, |
|
"eval_samples_per_second": 48.203, |
|
"eval_steps_per_second": 0.756, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 4.54, |
|
"learning_rate": 2.8874172185430465e-06, |
|
"loss": 0.0261, |
|
"step": 2100 |
|
}, |
|
{ |
|
"epoch": 4.75, |
|
"learning_rate": 1.5629139072847683e-06, |
|
"loss": 0.0276, |
|
"step": 2200 |
|
}, |
|
{ |
|
"epoch": 4.75, |
|
"eval_accuracy": 0.942671714440238, |
|
"eval_f1": 0.9418255234675899, |
|
"eval_loss": 0.2877638638019562, |
|
"eval_matthews_correlation": 0.8837326760671694, |
|
"eval_precision": 0.94256886123578, |
|
"eval_recall": 0.9411649299998814, |
|
"eval_runtime": 13.8654, |
|
"eval_samples_per_second": 133.354, |
|
"eval_steps_per_second": 2.092, |
|
"step": 2200 |
|
} |
|
], |
|
"max_steps": 2315, |
|
"num_train_epochs": 5, |
|
"total_flos": 5574741099609024.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|