| { | |
| "best_metric": 0.8780487804878049, | |
| "best_model_checkpoint": "Cvt-finetuned-thyroid/checkpoint-33", | |
| "epoch": 30.0, | |
| "global_step": 90, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 1.0, | |
| "eval_f1": 0.19148936170212766, | |
| "eval_loss": 0.7407425045967102, | |
| "eval_runtime": 0.5779, | |
| "eval_samples_per_second": 173.027, | |
| "eval_steps_per_second": 6.921, | |
| "step": 3 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "eval_f1": 0.3773584905660377, | |
| "eval_loss": 0.729247510433197, | |
| "eval_runtime": 0.5528, | |
| "eval_samples_per_second": 180.896, | |
| "eval_steps_per_second": 7.236, | |
| "step": 6 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "eval_f1": 0.4786324786324786, | |
| "eval_loss": 0.7105527520179749, | |
| "eval_runtime": 0.558, | |
| "eval_samples_per_second": 179.203, | |
| "eval_steps_per_second": 7.168, | |
| "step": 9 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "eval_f1": 0.6060606060606061, | |
| "eval_loss": 0.6890331506729126, | |
| "eval_runtime": 0.5504, | |
| "eval_samples_per_second": 181.671, | |
| "eval_steps_per_second": 7.267, | |
| "step": 12 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "eval_f1": 0.7, | |
| "eval_loss": 0.6695859432220459, | |
| "eval_runtime": 0.5595, | |
| "eval_samples_per_second": 178.745, | |
| "eval_steps_per_second": 7.15, | |
| "step": 15 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "eval_f1": 0.7761194029850746, | |
| "eval_loss": 0.6517141461372375, | |
| "eval_runtime": 0.5632, | |
| "eval_samples_per_second": 177.548, | |
| "eval_steps_per_second": 7.102, | |
| "step": 18 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "eval_f1": 0.828125, | |
| "eval_loss": 0.6349117755889893, | |
| "eval_runtime": 0.5567, | |
| "eval_samples_per_second": 179.616, | |
| "eval_steps_per_second": 7.185, | |
| "step": 21 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "eval_f1": 0.8503937007874015, | |
| "eval_loss": 0.618772029876709, | |
| "eval_runtime": 0.5546, | |
| "eval_samples_per_second": 180.325, | |
| "eval_steps_per_second": 7.213, | |
| "step": 24 | |
| }, | |
| { | |
| "epoch": 8.33, | |
| "learning_rate": 8.024691358024692e-06, | |
| "loss": 0.634, | |
| "step": 25 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "eval_f1": 0.8709677419354839, | |
| "eval_loss": 0.6039881706237793, | |
| "eval_runtime": 0.5519, | |
| "eval_samples_per_second": 181.185, | |
| "eval_steps_per_second": 7.247, | |
| "step": 27 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "eval_f1": 0.8709677419354839, | |
| "eval_loss": 0.5912619829177856, | |
| "eval_runtime": 0.5573, | |
| "eval_samples_per_second": 179.441, | |
| "eval_steps_per_second": 7.178, | |
| "step": 30 | |
| }, | |
| { | |
| "epoch": 11.0, | |
| "eval_f1": 0.8780487804878049, | |
| "eval_loss": 0.5805598497390747, | |
| "eval_runtime": 0.5574, | |
| "eval_samples_per_second": 179.394, | |
| "eval_steps_per_second": 7.176, | |
| "step": 33 | |
| }, | |
| { | |
| "epoch": 12.0, | |
| "eval_f1": 0.8688524590163933, | |
| "eval_loss": 0.5723507404327393, | |
| "eval_runtime": 0.5544, | |
| "eval_samples_per_second": 180.362, | |
| "eval_steps_per_second": 7.214, | |
| "step": 36 | |
| }, | |
| { | |
| "epoch": 13.0, | |
| "eval_f1": 0.8688524590163933, | |
| "eval_loss": 0.5652728080749512, | |
| "eval_runtime": 0.5588, | |
| "eval_samples_per_second": 178.951, | |
| "eval_steps_per_second": 7.158, | |
| "step": 39 | |
| }, | |
| { | |
| "epoch": 14.0, | |
| "eval_f1": 0.8688524590163933, | |
| "eval_loss": 0.5592342019081116, | |
| "eval_runtime": 0.5516, | |
| "eval_samples_per_second": 181.294, | |
| "eval_steps_per_second": 7.252, | |
| "step": 42 | |
| }, | |
| { | |
| "epoch": 15.0, | |
| "eval_f1": 0.8760330578512396, | |
| "eval_loss": 0.553566575050354, | |
| "eval_runtime": 0.558, | |
| "eval_samples_per_second": 179.226, | |
| "eval_steps_per_second": 7.169, | |
| "step": 45 | |
| }, | |
| { | |
| "epoch": 16.0, | |
| "eval_f1": 0.8760330578512396, | |
| "eval_loss": 0.5487043857574463, | |
| "eval_runtime": 0.5688, | |
| "eval_samples_per_second": 175.802, | |
| "eval_steps_per_second": 7.032, | |
| "step": 48 | |
| }, | |
| { | |
| "epoch": 16.67, | |
| "learning_rate": 4.938271604938272e-06, | |
| "loss": 0.5096, | |
| "step": 50 | |
| }, | |
| { | |
| "epoch": 17.0, | |
| "eval_f1": 0.8760330578512396, | |
| "eval_loss": 0.5434445142745972, | |
| "eval_runtime": 0.5636, | |
| "eval_samples_per_second": 177.42, | |
| "eval_steps_per_second": 7.097, | |
| "step": 51 | |
| }, | |
| { | |
| "epoch": 18.0, | |
| "eval_f1": 0.8760330578512396, | |
| "eval_loss": 0.5385234951972961, | |
| "eval_runtime": 0.561, | |
| "eval_samples_per_second": 178.247, | |
| "eval_steps_per_second": 7.13, | |
| "step": 54 | |
| }, | |
| { | |
| "epoch": 19.0, | |
| "eval_f1": 0.8760330578512396, | |
| "eval_loss": 0.5339138507843018, | |
| "eval_runtime": 0.5531, | |
| "eval_samples_per_second": 180.806, | |
| "eval_steps_per_second": 7.232, | |
| "step": 57 | |
| }, | |
| { | |
| "epoch": 20.0, | |
| "eval_f1": 0.8739495798319329, | |
| "eval_loss": 0.5293477177619934, | |
| "eval_runtime": 0.5612, | |
| "eval_samples_per_second": 178.191, | |
| "eval_steps_per_second": 7.128, | |
| "step": 60 | |
| }, | |
| { | |
| "epoch": 21.0, | |
| "eval_f1": 0.8739495798319329, | |
| "eval_loss": 0.5248751640319824, | |
| "eval_runtime": 0.554, | |
| "eval_samples_per_second": 180.518, | |
| "eval_steps_per_second": 7.221, | |
| "step": 63 | |
| }, | |
| { | |
| "epoch": 22.0, | |
| "eval_f1": 0.8739495798319329, | |
| "eval_loss": 0.5204405784606934, | |
| "eval_runtime": 0.564, | |
| "eval_samples_per_second": 177.317, | |
| "eval_steps_per_second": 7.093, | |
| "step": 66 | |
| }, | |
| { | |
| "epoch": 23.0, | |
| "eval_f1": 0.8739495798319329, | |
| "eval_loss": 0.5157800912857056, | |
| "eval_runtime": 0.5507, | |
| "eval_samples_per_second": 181.589, | |
| "eval_steps_per_second": 7.264, | |
| "step": 69 | |
| }, | |
| { | |
| "epoch": 24.0, | |
| "eval_f1": 0.8739495798319329, | |
| "eval_loss": 0.5112195014953613, | |
| "eval_runtime": 0.5502, | |
| "eval_samples_per_second": 181.737, | |
| "eval_steps_per_second": 7.269, | |
| "step": 72 | |
| }, | |
| { | |
| "epoch": 25.0, | |
| "learning_rate": 1.8518518518518519e-06, | |
| "loss": 0.4584, | |
| "step": 75 | |
| }, | |
| { | |
| "epoch": 25.0, | |
| "eval_f1": 0.8739495798319329, | |
| "eval_loss": 0.5078128576278687, | |
| "eval_runtime": 0.5542, | |
| "eval_samples_per_second": 180.427, | |
| "eval_steps_per_second": 7.217, | |
| "step": 75 | |
| }, | |
| { | |
| "epoch": 26.0, | |
| "eval_f1": 0.8739495798319329, | |
| "eval_loss": 0.5054234266281128, | |
| "eval_runtime": 0.5564, | |
| "eval_samples_per_second": 179.717, | |
| "eval_steps_per_second": 7.189, | |
| "step": 78 | |
| }, | |
| { | |
| "epoch": 27.0, | |
| "eval_f1": 0.8739495798319329, | |
| "eval_loss": 0.503419041633606, | |
| "eval_runtime": 0.5536, | |
| "eval_samples_per_second": 180.639, | |
| "eval_steps_per_second": 7.226, | |
| "step": 81 | |
| }, | |
| { | |
| "epoch": 28.0, | |
| "eval_f1": 0.8739495798319329, | |
| "eval_loss": 0.5020792484283447, | |
| "eval_runtime": 0.5563, | |
| "eval_samples_per_second": 179.771, | |
| "eval_steps_per_second": 7.191, | |
| "step": 84 | |
| }, | |
| { | |
| "epoch": 29.0, | |
| "eval_f1": 0.8739495798319329, | |
| "eval_loss": 0.5012262463569641, | |
| "eval_runtime": 0.5542, | |
| "eval_samples_per_second": 180.449, | |
| "eval_steps_per_second": 7.218, | |
| "step": 87 | |
| }, | |
| { | |
| "epoch": 30.0, | |
| "eval_f1": 0.8739495798319329, | |
| "eval_loss": 0.50089430809021, | |
| "eval_runtime": 0.553, | |
| "eval_samples_per_second": 180.845, | |
| "eval_steps_per_second": 7.234, | |
| "step": 90 | |
| }, | |
| { | |
| "epoch": 30.0, | |
| "step": 90, | |
| "total_flos": 2.7816295750742016e+17, | |
| "train_loss": 0.517905675040351, | |
| "train_runtime": 173.4592, | |
| "train_samples_per_second": 63.819, | |
| "train_steps_per_second": 0.519 | |
| } | |
| ], | |
| "max_steps": 90, | |
| "num_train_epochs": 30, | |
| "total_flos": 2.7816295750742016e+17, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |