| { |
| "best_metric": 0.8780487804878049, |
| "best_model_checkpoint": "Cvt-finetuned-thyroid/checkpoint-33", |
| "epoch": 30.0, |
| "global_step": 90, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 1.0, |
| "eval_f1": 0.19148936170212766, |
| "eval_loss": 0.7407425045967102, |
| "eval_runtime": 0.5779, |
| "eval_samples_per_second": 173.027, |
| "eval_steps_per_second": 6.921, |
| "step": 3 |
| }, |
| { |
| "epoch": 2.0, |
| "eval_f1": 0.3773584905660377, |
| "eval_loss": 0.729247510433197, |
| "eval_runtime": 0.5528, |
| "eval_samples_per_second": 180.896, |
| "eval_steps_per_second": 7.236, |
| "step": 6 |
| }, |
| { |
| "epoch": 3.0, |
| "eval_f1": 0.4786324786324786, |
| "eval_loss": 0.7105527520179749, |
| "eval_runtime": 0.558, |
| "eval_samples_per_second": 179.203, |
| "eval_steps_per_second": 7.168, |
| "step": 9 |
| }, |
| { |
| "epoch": 4.0, |
| "eval_f1": 0.6060606060606061, |
| "eval_loss": 0.6890331506729126, |
| "eval_runtime": 0.5504, |
| "eval_samples_per_second": 181.671, |
| "eval_steps_per_second": 7.267, |
| "step": 12 |
| }, |
| { |
| "epoch": 5.0, |
| "eval_f1": 0.7, |
| "eval_loss": 0.6695859432220459, |
| "eval_runtime": 0.5595, |
| "eval_samples_per_second": 178.745, |
| "eval_steps_per_second": 7.15, |
| "step": 15 |
| }, |
| { |
| "epoch": 6.0, |
| "eval_f1": 0.7761194029850746, |
| "eval_loss": 0.6517141461372375, |
| "eval_runtime": 0.5632, |
| "eval_samples_per_second": 177.548, |
| "eval_steps_per_second": 7.102, |
| "step": 18 |
| }, |
| { |
| "epoch": 7.0, |
| "eval_f1": 0.828125, |
| "eval_loss": 0.6349117755889893, |
| "eval_runtime": 0.5567, |
| "eval_samples_per_second": 179.616, |
| "eval_steps_per_second": 7.185, |
| "step": 21 |
| }, |
| { |
| "epoch": 8.0, |
| "eval_f1": 0.8503937007874015, |
| "eval_loss": 0.618772029876709, |
| "eval_runtime": 0.5546, |
| "eval_samples_per_second": 180.325, |
| "eval_steps_per_second": 7.213, |
| "step": 24 |
| }, |
| { |
| "epoch": 8.33, |
| "learning_rate": 8.024691358024692e-06, |
| "loss": 0.634, |
| "step": 25 |
| }, |
| { |
| "epoch": 9.0, |
| "eval_f1": 0.8709677419354839, |
| "eval_loss": 0.6039881706237793, |
| "eval_runtime": 0.5519, |
| "eval_samples_per_second": 181.185, |
| "eval_steps_per_second": 7.247, |
| "step": 27 |
| }, |
| { |
| "epoch": 10.0, |
| "eval_f1": 0.8709677419354839, |
| "eval_loss": 0.5912619829177856, |
| "eval_runtime": 0.5573, |
| "eval_samples_per_second": 179.441, |
| "eval_steps_per_second": 7.178, |
| "step": 30 |
| }, |
| { |
| "epoch": 11.0, |
| "eval_f1": 0.8780487804878049, |
| "eval_loss": 0.5805598497390747, |
| "eval_runtime": 0.5574, |
| "eval_samples_per_second": 179.394, |
| "eval_steps_per_second": 7.176, |
| "step": 33 |
| }, |
| { |
| "epoch": 12.0, |
| "eval_f1": 0.8688524590163933, |
| "eval_loss": 0.5723507404327393, |
| "eval_runtime": 0.5544, |
| "eval_samples_per_second": 180.362, |
| "eval_steps_per_second": 7.214, |
| "step": 36 |
| }, |
| { |
| "epoch": 13.0, |
| "eval_f1": 0.8688524590163933, |
| "eval_loss": 0.5652728080749512, |
| "eval_runtime": 0.5588, |
| "eval_samples_per_second": 178.951, |
| "eval_steps_per_second": 7.158, |
| "step": 39 |
| }, |
| { |
| "epoch": 14.0, |
| "eval_f1": 0.8688524590163933, |
| "eval_loss": 0.5592342019081116, |
| "eval_runtime": 0.5516, |
| "eval_samples_per_second": 181.294, |
| "eval_steps_per_second": 7.252, |
| "step": 42 |
| }, |
| { |
| "epoch": 15.0, |
| "eval_f1": 0.8760330578512396, |
| "eval_loss": 0.553566575050354, |
| "eval_runtime": 0.558, |
| "eval_samples_per_second": 179.226, |
| "eval_steps_per_second": 7.169, |
| "step": 45 |
| }, |
| { |
| "epoch": 16.0, |
| "eval_f1": 0.8760330578512396, |
| "eval_loss": 0.5487043857574463, |
| "eval_runtime": 0.5688, |
| "eval_samples_per_second": 175.802, |
| "eval_steps_per_second": 7.032, |
| "step": 48 |
| }, |
| { |
| "epoch": 16.67, |
| "learning_rate": 4.938271604938272e-06, |
| "loss": 0.5096, |
| "step": 50 |
| }, |
| { |
| "epoch": 17.0, |
| "eval_f1": 0.8760330578512396, |
| "eval_loss": 0.5434445142745972, |
| "eval_runtime": 0.5636, |
| "eval_samples_per_second": 177.42, |
| "eval_steps_per_second": 7.097, |
| "step": 51 |
| }, |
| { |
| "epoch": 18.0, |
| "eval_f1": 0.8760330578512396, |
| "eval_loss": 0.5385234951972961, |
| "eval_runtime": 0.561, |
| "eval_samples_per_second": 178.247, |
| "eval_steps_per_second": 7.13, |
| "step": 54 |
| }, |
| { |
| "epoch": 19.0, |
| "eval_f1": 0.8760330578512396, |
| "eval_loss": 0.5339138507843018, |
| "eval_runtime": 0.5531, |
| "eval_samples_per_second": 180.806, |
| "eval_steps_per_second": 7.232, |
| "step": 57 |
| }, |
| { |
| "epoch": 20.0, |
| "eval_f1": 0.8739495798319329, |
| "eval_loss": 0.5293477177619934, |
| "eval_runtime": 0.5612, |
| "eval_samples_per_second": 178.191, |
| "eval_steps_per_second": 7.128, |
| "step": 60 |
| }, |
| { |
| "epoch": 21.0, |
| "eval_f1": 0.8739495798319329, |
| "eval_loss": 0.5248751640319824, |
| "eval_runtime": 0.554, |
| "eval_samples_per_second": 180.518, |
| "eval_steps_per_second": 7.221, |
| "step": 63 |
| }, |
| { |
| "epoch": 22.0, |
| "eval_f1": 0.8739495798319329, |
| "eval_loss": 0.5204405784606934, |
| "eval_runtime": 0.564, |
| "eval_samples_per_second": 177.317, |
| "eval_steps_per_second": 7.093, |
| "step": 66 |
| }, |
| { |
| "epoch": 23.0, |
| "eval_f1": 0.8739495798319329, |
| "eval_loss": 0.5157800912857056, |
| "eval_runtime": 0.5507, |
| "eval_samples_per_second": 181.589, |
| "eval_steps_per_second": 7.264, |
| "step": 69 |
| }, |
| { |
| "epoch": 24.0, |
| "eval_f1": 0.8739495798319329, |
| "eval_loss": 0.5112195014953613, |
| "eval_runtime": 0.5502, |
| "eval_samples_per_second": 181.737, |
| "eval_steps_per_second": 7.269, |
| "step": 72 |
| }, |
| { |
| "epoch": 25.0, |
| "learning_rate": 1.8518518518518519e-06, |
| "loss": 0.4584, |
| "step": 75 |
| }, |
| { |
| "epoch": 25.0, |
| "eval_f1": 0.8739495798319329, |
| "eval_loss": 0.5078128576278687, |
| "eval_runtime": 0.5542, |
| "eval_samples_per_second": 180.427, |
| "eval_steps_per_second": 7.217, |
| "step": 75 |
| }, |
| { |
| "epoch": 26.0, |
| "eval_f1": 0.8739495798319329, |
| "eval_loss": 0.5054234266281128, |
| "eval_runtime": 0.5564, |
| "eval_samples_per_second": 179.717, |
| "eval_steps_per_second": 7.189, |
| "step": 78 |
| }, |
| { |
| "epoch": 27.0, |
| "eval_f1": 0.8739495798319329, |
| "eval_loss": 0.503419041633606, |
| "eval_runtime": 0.5536, |
| "eval_samples_per_second": 180.639, |
| "eval_steps_per_second": 7.226, |
| "step": 81 |
| }, |
| { |
| "epoch": 28.0, |
| "eval_f1": 0.8739495798319329, |
| "eval_loss": 0.5020792484283447, |
| "eval_runtime": 0.5563, |
| "eval_samples_per_second": 179.771, |
| "eval_steps_per_second": 7.191, |
| "step": 84 |
| }, |
| { |
| "epoch": 29.0, |
| "eval_f1": 0.8739495798319329, |
| "eval_loss": 0.5012262463569641, |
| "eval_runtime": 0.5542, |
| "eval_samples_per_second": 180.449, |
| "eval_steps_per_second": 7.218, |
| "step": 87 |
| }, |
| { |
| "epoch": 30.0, |
| "eval_f1": 0.8739495798319329, |
| "eval_loss": 0.50089430809021, |
| "eval_runtime": 0.553, |
| "eval_samples_per_second": 180.845, |
| "eval_steps_per_second": 7.234, |
| "step": 90 |
| }, |
| { |
| "epoch": 30.0, |
| "step": 90, |
| "total_flos": 2.7816295750742016e+17, |
| "train_loss": 0.517905675040351, |
| "train_runtime": 173.4592, |
| "train_samples_per_second": 63.819, |
| "train_steps_per_second": 0.519 |
| } |
| ], |
| "max_steps": 90, |
| "num_train_epochs": 30, |
| "total_flos": 2.7816295750742016e+17, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|