{ "best_global_step": 30, "best_metric": 1.0, "best_model_checkpoint": "vit-base-patch32-384-finetuned-humid-classes-32/checkpoint-30", "epoch": 50.0, "eval_steps": 500, "global_step": 150, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_accuracy": 0.23684210526315788, "eval_f1_dry": 0.0, "eval_f1_firm": 0.18181818181818182, "eval_f1_humid": 0.0, "eval_f1_lump": 0.4, "eval_f1_macro": 0.15444096133751306, "eval_f1_moist": 0.0, "eval_f1_rockies": 0.3448275862068966, "eval_loss": 1.7800142765045166, "eval_precision_dry": 0.0, "eval_precision_firm": 1.0, "eval_precision_humid": 0.0, "eval_precision_lump": 0.3333333333333333, "eval_precision_macro": 0.2569444444444444, "eval_precision_moist": 0.0, "eval_precision_rockies": 0.20833333333333334, "eval_recall_dry": 0.0, "eval_recall_firm": 0.1, "eval_recall_humid": 0.0, "eval_recall_lump": 0.5, "eval_recall_macro": 0.26666666666666666, "eval_recall_moist": 0.0, "eval_recall_rockies": 1.0, "eval_runtime": 0.9091, "eval_samples_per_second": 41.801, "eval_steps_per_second": 3.3, "step": 3 }, { "epoch": 2.0, "eval_accuracy": 0.6052631578947368, "eval_f1_dry": 0.0, "eval_f1_firm": 0.9090909090909091, "eval_f1_humid": 0.5833333333333334, "eval_f1_lump": 0.0, "eval_f1_macro": 0.4436091686091686, "eval_f1_moist": 0.4, "eval_f1_rockies": 0.7692307692307693, "eval_loss": 1.4470411539077759, "eval_precision_dry": 0.0, "eval_precision_firm": 0.8333333333333334, "eval_precision_humid": 0.4117647058823529, "eval_precision_lump": 0.0, "eval_precision_macro": 0.4783496732026144, "eval_precision_moist": 1.0, "eval_precision_rockies": 0.625, "eval_recall_dry": 0.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 0.0, "eval_recall_macro": 0.5416666666666666, "eval_recall_moist": 0.25, "eval_recall_rockies": 1.0, "eval_runtime": 0.6705, "eval_samples_per_second": 56.677, "eval_steps_per_second": 4.474, "step": 6 }, { "epoch": 3.0, "eval_accuracy": 0.5526315789473685, "eval_f1_dry": 0.0, "eval_f1_firm": 0.9523809523809523, "eval_f1_humid": 0.6666666666666666, "eval_f1_lump": 0.0, "eval_f1_macro": 0.3878968253968254, "eval_f1_moist": 0.375, "eval_f1_rockies": 0.3333333333333333, "eval_loss": 1.2254561185836792, "eval_precision_dry": 0.0, "eval_precision_firm": 0.9090909090909091, "eval_precision_humid": 0.5, "eval_precision_lump": 0.0, "eval_precision_macro": 0.4431818181818182, "eval_precision_moist": 0.25, "eval_precision_rockies": 1.0, "eval_recall_dry": 0.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 0.0, "eval_recall_macro": 0.4916666666666667, "eval_recall_moist": 0.75, "eval_recall_rockies": 0.2, "eval_runtime": 0.6634, "eval_samples_per_second": 57.284, "eval_steps_per_second": 4.522, "step": 9 }, { "epoch": 3.4, "grad_norm": 4.948105812072754, "learning_rate": 3e-05, "loss": 1.6327, "step": 10 }, { "epoch": 4.0, "eval_accuracy": 0.7631578947368421, "eval_f1_dry": 0.8, "eval_f1_firm": 0.9523809523809523, "eval_f1_humid": 0.7, "eval_f1_lump": 0.0, "eval_f1_macro": 0.6865079365079364, "eval_f1_moist": 0.6666666666666666, "eval_f1_rockies": 1.0, "eval_loss": 0.9397746920585632, "eval_precision_dry": 1.0, "eval_precision_firm": 0.9090909090909091, "eval_precision_humid": 0.5384615384615384, "eval_precision_lump": 0.0, "eval_precision_macro": 0.6745920745920747, "eval_precision_moist": 0.6, "eval_precision_rockies": 1.0, "eval_recall_dry": 0.6666666666666666, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 0.0, "eval_recall_macro": 0.736111111111111, "eval_recall_moist": 0.75, "eval_recall_rockies": 1.0, "eval_runtime": 0.6614, "eval_samples_per_second": 57.456, "eval_steps_per_second": 4.536, "step": 12 }, { "epoch": 5.0, "eval_accuracy": 0.8947368421052632, "eval_f1_dry": 0.8, "eval_f1_firm": 1.0, "eval_f1_humid": 0.875, "eval_f1_lump": 0.9090909090909091, "eval_f1_macro": 0.8751262626262627, "eval_f1_moist": 0.6666666666666666, "eval_f1_rockies": 1.0, "eval_loss": 0.623245894908905, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 0.7777777777777778, "eval_precision_lump": 1.0, "eval_precision_macro": 0.8962962962962963, "eval_precision_moist": 0.6, "eval_precision_rockies": 1.0, "eval_recall_dry": 0.6666666666666666, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 0.8333333333333334, "eval_recall_macro": 0.875, "eval_recall_moist": 0.75, "eval_recall_rockies": 1.0, "eval_runtime": 0.7369, "eval_samples_per_second": 51.565, "eval_steps_per_second": 4.071, "step": 15 }, { "epoch": 6.0, "eval_accuracy": 0.9736842105263158, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 0.9333333333333333, "eval_f1_lump": 1.0, "eval_f1_macro": 0.9650793650793651, "eval_f1_moist": 0.8571428571428571, "eval_f1_rockies": 1.0, "eval_loss": 0.32733020186424255, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 0.875, "eval_precision_lump": 1.0, "eval_precision_macro": 0.9791666666666666, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 0.9583333333333334, "eval_recall_moist": 0.75, "eval_recall_rockies": 1.0, "eval_runtime": 1.1558, "eval_samples_per_second": 32.879, "eval_steps_per_second": 2.596, "step": 18 }, { "epoch": 6.8, "grad_norm": 2.2400197982788086, "learning_rate": 4.851851851851852e-05, "loss": 0.6436, "step": 20 }, { "epoch": 7.0, "eval_accuracy": 0.9210526315789473, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 0.875, "eval_f1_lump": 0.9090909090909091, "eval_f1_macro": 0.9038299663299663, "eval_f1_moist": 0.75, "eval_f1_rockies": 0.8888888888888888, "eval_loss": 0.2520924210548401, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 0.7777777777777778, "eval_precision_lump": 1.0, "eval_precision_macro": 0.9212962962962963, "eval_precision_moist": 0.75, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 0.8333333333333334, "eval_recall_macro": 0.8972222222222223, "eval_recall_moist": 0.75, "eval_recall_rockies": 0.8, "eval_runtime": 0.7413, "eval_samples_per_second": 51.26, "eval_steps_per_second": 4.047, "step": 21 }, { "epoch": 8.0, "eval_accuracy": 0.9473684210526315, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 1.0, "eval_f1_lump": 1.0, "eval_f1_macro": 0.9166666666666666, "eval_f1_moist": 0.6666666666666666, "eval_f1_rockies": 0.8333333333333334, "eval_loss": 0.13729172945022583, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 1.0, "eval_precision_lump": 1.0, "eval_precision_macro": 0.9523809523809524, "eval_precision_moist": 1.0, "eval_precision_rockies": 0.7142857142857143, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 0.9166666666666666, "eval_recall_moist": 0.5, "eval_recall_rockies": 1.0, "eval_runtime": 0.6765, "eval_samples_per_second": 56.168, "eval_steps_per_second": 4.434, "step": 24 }, { "epoch": 9.0, "eval_accuracy": 0.9473684210526315, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 0.9333333333333333, "eval_f1_lump": 1.0, "eval_f1_macro": 0.9287037037037038, "eval_f1_moist": 0.75, "eval_f1_rockies": 0.8888888888888888, "eval_loss": 0.15521343052387238, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 0.875, "eval_precision_lump": 1.0, "eval_precision_macro": 0.9375, "eval_precision_moist": 0.75, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 0.9249999999999999, "eval_recall_moist": 0.75, "eval_recall_rockies": 0.8, "eval_runtime": 0.6709, "eval_samples_per_second": 56.642, "eval_steps_per_second": 4.472, "step": 27 }, { "epoch": 10.0, "grad_norm": 2.4721362590789795, "learning_rate": 4.481481481481482e-05, "loss": 0.1165, "step": 30 }, { "epoch": 10.0, "eval_accuracy": 1.0, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 1.0, "eval_f1_lump": 1.0, "eval_f1_macro": 1.0, "eval_f1_moist": 1.0, "eval_f1_rockies": 1.0, "eval_loss": 0.054696615785360336, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 1.0, "eval_precision_lump": 1.0, "eval_precision_macro": 1.0, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 1.0, "eval_recall_moist": 1.0, "eval_recall_rockies": 1.0, "eval_runtime": 0.7869, "eval_samples_per_second": 48.292, "eval_steps_per_second": 3.813, "step": 30 }, { "epoch": 11.0, "eval_accuracy": 1.0, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 1.0, "eval_f1_lump": 1.0, "eval_f1_macro": 1.0, "eval_f1_moist": 1.0, "eval_f1_rockies": 1.0, "eval_loss": 0.05095173045992851, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 1.0, "eval_precision_lump": 1.0, "eval_precision_macro": 1.0, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 1.0, "eval_recall_moist": 1.0, "eval_recall_rockies": 1.0, "eval_runtime": 0.6642, "eval_samples_per_second": 57.213, "eval_steps_per_second": 4.517, "step": 33 }, { "epoch": 12.0, "eval_accuracy": 0.9736842105263158, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 1.0, "eval_f1_lump": 1.0, "eval_f1_macro": 0.9629629629629631, "eval_f1_moist": 0.8888888888888888, "eval_f1_rockies": 0.8888888888888888, "eval_loss": 0.09588845074176788, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 1.0, "eval_precision_lump": 1.0, "eval_precision_macro": 0.9666666666666667, "eval_precision_moist": 0.8, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 0.9666666666666667, "eval_recall_moist": 1.0, "eval_recall_rockies": 0.8, "eval_runtime": 0.7339, "eval_samples_per_second": 51.782, "eval_steps_per_second": 4.088, "step": 36 }, { "epoch": 13.0, "eval_accuracy": 0.9473684210526315, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 0.9333333333333333, "eval_f1_lump": 1.0, "eval_f1_macro": 0.9287037037037038, "eval_f1_moist": 0.75, "eval_f1_rockies": 0.8888888888888888, "eval_loss": 0.06681454926729202, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 0.875, "eval_precision_lump": 1.0, "eval_precision_macro": 0.9375, "eval_precision_moist": 0.75, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 0.9249999999999999, "eval_recall_moist": 0.75, "eval_recall_rockies": 0.8, "eval_runtime": 0.7404, "eval_samples_per_second": 51.327, "eval_steps_per_second": 4.052, "step": 39 }, { "epoch": 13.4, "grad_norm": 0.25804993510246277, "learning_rate": 4.111111111111111e-05, "loss": 0.023, "step": 40 }, { "epoch": 14.0, "eval_accuracy": 0.9736842105263158, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 0.9333333333333333, "eval_f1_lump": 1.0, "eval_f1_macro": 0.9650793650793651, "eval_f1_moist": 0.8571428571428571, "eval_f1_rockies": 1.0, "eval_loss": 0.07483488321304321, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 0.875, "eval_precision_lump": 1.0, "eval_precision_macro": 0.9791666666666666, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 0.9583333333333334, "eval_recall_moist": 0.75, "eval_recall_rockies": 1.0, "eval_runtime": 0.7353, "eval_samples_per_second": 51.68, "eval_steps_per_second": 4.08, "step": 42 }, { "epoch": 15.0, "eval_accuracy": 0.9736842105263158, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 0.9333333333333333, "eval_f1_lump": 1.0, "eval_f1_macro": 0.9650793650793651, "eval_f1_moist": 0.8571428571428571, "eval_f1_rockies": 1.0, "eval_loss": 0.04593011736869812, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 0.875, "eval_precision_lump": 1.0, "eval_precision_macro": 0.9791666666666666, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 0.9583333333333334, "eval_recall_moist": 0.75, "eval_recall_rockies": 1.0, "eval_runtime": 0.6961, "eval_samples_per_second": 54.588, "eval_steps_per_second": 4.31, "step": 45 }, { "epoch": 16.0, "eval_accuracy": 0.9736842105263158, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 1.0, "eval_f1_lump": 1.0, "eval_f1_macro": 0.9629629629629631, "eval_f1_moist": 0.8888888888888888, "eval_f1_rockies": 0.8888888888888888, "eval_loss": 0.052568551152944565, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 1.0, "eval_precision_lump": 1.0, "eval_precision_macro": 0.9666666666666667, "eval_precision_moist": 0.8, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 0.9666666666666667, "eval_recall_moist": 1.0, "eval_recall_rockies": 0.8, "eval_runtime": 0.7089, "eval_samples_per_second": 53.605, "eval_steps_per_second": 4.232, "step": 48 }, { "epoch": 16.8, "grad_norm": 0.06971626728773117, "learning_rate": 3.740740740740741e-05, "loss": 0.0091, "step": 50 }, { "epoch": 17.0, "eval_accuracy": 0.9736842105263158, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 0.9333333333333333, "eval_f1_lump": 1.0, "eval_f1_macro": 0.9650793650793651, "eval_f1_moist": 0.8571428571428571, "eval_f1_rockies": 1.0, "eval_loss": 0.0735773891210556, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 0.875, "eval_precision_lump": 1.0, "eval_precision_macro": 0.9791666666666666, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 0.9583333333333334, "eval_recall_moist": 0.75, "eval_recall_rockies": 1.0, "eval_runtime": 0.6761, "eval_samples_per_second": 56.204, "eval_steps_per_second": 4.437, "step": 51 }, { "epoch": 18.0, "eval_accuracy": 0.9473684210526315, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 0.875, "eval_f1_lump": 0.9090909090909091, "eval_f1_macro": 0.9402056277056277, "eval_f1_moist": 0.8571428571428571, "eval_f1_rockies": 1.0, "eval_loss": 0.08610320836305618, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 0.7777777777777778, "eval_precision_lump": 1.0, "eval_precision_macro": 0.9629629629629629, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 0.8333333333333334, "eval_recall_macro": 0.9305555555555557, "eval_recall_moist": 0.75, "eval_recall_rockies": 1.0, "eval_runtime": 0.6727, "eval_samples_per_second": 56.492, "eval_steps_per_second": 4.46, "step": 54 }, { "epoch": 19.0, "eval_accuracy": 0.9736842105263158, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 0.9333333333333333, "eval_f1_lump": 0.9090909090909091, "eval_f1_macro": 0.9737373737373738, "eval_f1_moist": 1.0, "eval_f1_rockies": 1.0, "eval_loss": 0.059885572642087936, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 0.875, "eval_precision_lump": 1.0, "eval_precision_macro": 0.9791666666666666, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 0.8333333333333334, "eval_recall_macro": 0.9722222222222223, "eval_recall_moist": 1.0, "eval_recall_rockies": 1.0, "eval_runtime": 0.6892, "eval_samples_per_second": 55.133, "eval_steps_per_second": 4.353, "step": 57 }, { "epoch": 20.0, "grad_norm": 0.10011594742536545, "learning_rate": 3.3703703703703706e-05, "loss": 0.0036, "step": 60 }, { "epoch": 20.0, "eval_accuracy": 1.0, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 1.0, "eval_f1_lump": 1.0, "eval_f1_macro": 1.0, "eval_f1_moist": 1.0, "eval_f1_rockies": 1.0, "eval_loss": 0.022346777841448784, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 1.0, "eval_precision_lump": 1.0, "eval_precision_macro": 1.0, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 1.0, "eval_recall_moist": 1.0, "eval_recall_rockies": 1.0, "eval_runtime": 0.6684, "eval_samples_per_second": 56.854, "eval_steps_per_second": 4.488, "step": 60 }, { "epoch": 21.0, "eval_accuracy": 1.0, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 1.0, "eval_f1_lump": 1.0, "eval_f1_macro": 1.0, "eval_f1_moist": 1.0, "eval_f1_rockies": 1.0, "eval_loss": 0.008191967383027077, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 1.0, "eval_precision_lump": 1.0, "eval_precision_macro": 1.0, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 1.0, "eval_recall_moist": 1.0, "eval_recall_rockies": 1.0, "eval_runtime": 0.6681, "eval_samples_per_second": 56.874, "eval_steps_per_second": 4.49, "step": 63 }, { "epoch": 22.0, "eval_accuracy": 1.0, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 1.0, "eval_f1_lump": 1.0, "eval_f1_macro": 1.0, "eval_f1_moist": 1.0, "eval_f1_rockies": 1.0, "eval_loss": 0.004844570532441139, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 1.0, "eval_precision_lump": 1.0, "eval_precision_macro": 1.0, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 1.0, "eval_recall_moist": 1.0, "eval_recall_rockies": 1.0, "eval_runtime": 0.6585, "eval_samples_per_second": 57.711, "eval_steps_per_second": 4.556, "step": 66 }, { "epoch": 23.0, "eval_accuracy": 1.0, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 1.0, "eval_f1_lump": 1.0, "eval_f1_macro": 1.0, "eval_f1_moist": 1.0, "eval_f1_rockies": 1.0, "eval_loss": 0.0039038031827658415, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 1.0, "eval_precision_lump": 1.0, "eval_precision_macro": 1.0, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 1.0, "eval_recall_moist": 1.0, "eval_recall_rockies": 1.0, "eval_runtime": 0.6573, "eval_samples_per_second": 57.811, "eval_steps_per_second": 4.564, "step": 69 }, { "epoch": 23.4, "grad_norm": 0.052555520087480545, "learning_rate": 3e-05, "loss": 0.0021, "step": 70 }, { "epoch": 24.0, "eval_accuracy": 1.0, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 1.0, "eval_f1_lump": 1.0, "eval_f1_macro": 1.0, "eval_f1_moist": 1.0, "eval_f1_rockies": 1.0, "eval_loss": 0.0036111008375883102, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 1.0, "eval_precision_lump": 1.0, "eval_precision_macro": 1.0, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 1.0, "eval_recall_moist": 1.0, "eval_recall_rockies": 1.0, "eval_runtime": 0.67, "eval_samples_per_second": 56.716, "eval_steps_per_second": 4.478, "step": 72 }, { "epoch": 25.0, "eval_accuracy": 1.0, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 1.0, "eval_f1_lump": 1.0, "eval_f1_macro": 1.0, "eval_f1_moist": 1.0, "eval_f1_rockies": 1.0, "eval_loss": 0.003612279426306486, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 1.0, "eval_precision_lump": 1.0, "eval_precision_macro": 1.0, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 1.0, "eval_recall_moist": 1.0, "eval_recall_rockies": 1.0, "eval_runtime": 0.6757, "eval_samples_per_second": 56.236, "eval_steps_per_second": 4.44, "step": 75 }, { "epoch": 26.0, "eval_accuracy": 1.0, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 1.0, "eval_f1_lump": 1.0, "eval_f1_macro": 1.0, "eval_f1_moist": 1.0, "eval_f1_rockies": 1.0, "eval_loss": 0.0040664165280759335, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 1.0, "eval_precision_lump": 1.0, "eval_precision_macro": 1.0, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 1.0, "eval_recall_moist": 1.0, "eval_recall_rockies": 1.0, "eval_runtime": 0.6624, "eval_samples_per_second": 57.37, "eval_steps_per_second": 4.529, "step": 78 }, { "epoch": 26.8, "grad_norm": 0.017726685851812363, "learning_rate": 2.6296296296296296e-05, "loss": 0.0016, "step": 80 }, { "epoch": 27.0, "eval_accuracy": 1.0, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 1.0, "eval_f1_lump": 1.0, "eval_f1_macro": 1.0, "eval_f1_moist": 1.0, "eval_f1_rockies": 1.0, "eval_loss": 0.005073578096926212, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 1.0, "eval_precision_lump": 1.0, "eval_precision_macro": 1.0, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 1.0, "eval_recall_moist": 1.0, "eval_recall_rockies": 1.0, "eval_runtime": 0.6591, "eval_samples_per_second": 57.651, "eval_steps_per_second": 4.551, "step": 81 }, { "epoch": 28.0, "eval_accuracy": 1.0, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 1.0, "eval_f1_lump": 1.0, "eval_f1_macro": 1.0, "eval_f1_moist": 1.0, "eval_f1_rockies": 1.0, "eval_loss": 0.006673986092209816, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 1.0, "eval_precision_lump": 1.0, "eval_precision_macro": 1.0, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 1.0, "eval_recall_moist": 1.0, "eval_recall_rockies": 1.0, "eval_runtime": 0.6709, "eval_samples_per_second": 56.64, "eval_steps_per_second": 4.472, "step": 84 }, { "epoch": 29.0, "eval_accuracy": 1.0, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 1.0, "eval_f1_lump": 1.0, "eval_f1_macro": 1.0, "eval_f1_moist": 1.0, "eval_f1_rockies": 1.0, "eval_loss": 0.008735415525734425, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 1.0, "eval_precision_lump": 1.0, "eval_precision_macro": 1.0, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 1.0, "eval_recall_moist": 1.0, "eval_recall_rockies": 1.0, "eval_runtime": 0.6851, "eval_samples_per_second": 55.468, "eval_steps_per_second": 4.379, "step": 87 }, { "epoch": 30.0, "grad_norm": 0.019602151587605476, "learning_rate": 2.2592592592592594e-05, "loss": 0.0013, "step": 90 }, { "epoch": 30.0, "eval_accuracy": 1.0, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 1.0, "eval_f1_lump": 1.0, "eval_f1_macro": 1.0, "eval_f1_moist": 1.0, "eval_f1_rockies": 1.0, "eval_loss": 0.010786506347358227, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 1.0, "eval_precision_lump": 1.0, "eval_precision_macro": 1.0, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 1.0, "eval_recall_moist": 1.0, "eval_recall_rockies": 1.0, "eval_runtime": 0.6747, "eval_samples_per_second": 56.324, "eval_steps_per_second": 4.447, "step": 90 }, { "epoch": 31.0, "eval_accuracy": 1.0, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 1.0, "eval_f1_lump": 1.0, "eval_f1_macro": 1.0, "eval_f1_moist": 1.0, "eval_f1_rockies": 1.0, "eval_loss": 0.012865853495895863, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 1.0, "eval_precision_lump": 1.0, "eval_precision_macro": 1.0, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 1.0, "eval_recall_moist": 1.0, "eval_recall_rockies": 1.0, "eval_runtime": 0.6688, "eval_samples_per_second": 56.821, "eval_steps_per_second": 4.486, "step": 93 }, { "epoch": 32.0, "eval_accuracy": 1.0, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 1.0, "eval_f1_lump": 1.0, "eval_f1_macro": 1.0, "eval_f1_moist": 1.0, "eval_f1_rockies": 1.0, "eval_loss": 0.013852025382220745, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 1.0, "eval_precision_lump": 1.0, "eval_precision_macro": 1.0, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 1.0, "eval_recall_moist": 1.0, "eval_recall_rockies": 1.0, "eval_runtime": 1.2041, "eval_samples_per_second": 31.558, "eval_steps_per_second": 2.491, "step": 96 }, { "epoch": 33.0, "eval_accuracy": 1.0, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 1.0, "eval_f1_lump": 1.0, "eval_f1_macro": 1.0, "eval_f1_moist": 1.0, "eval_f1_rockies": 1.0, "eval_loss": 0.014263465069234371, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 1.0, "eval_precision_lump": 1.0, "eval_precision_macro": 1.0, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 1.0, "eval_recall_moist": 1.0, "eval_recall_rockies": 1.0, "eval_runtime": 0.6718, "eval_samples_per_second": 56.561, "eval_steps_per_second": 4.465, "step": 99 }, { "epoch": 33.4, "grad_norm": 0.013969006948173046, "learning_rate": 1.888888888888889e-05, "loss": 0.0011, "step": 100 }, { "epoch": 34.0, "eval_accuracy": 1.0, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 1.0, "eval_f1_lump": 1.0, "eval_f1_macro": 1.0, "eval_f1_moist": 1.0, "eval_f1_rockies": 1.0, "eval_loss": 0.014433705247938633, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 1.0, "eval_precision_lump": 1.0, "eval_precision_macro": 1.0, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 1.0, "eval_recall_moist": 1.0, "eval_recall_rockies": 1.0, "eval_runtime": 0.6884, "eval_samples_per_second": 55.2, "eval_steps_per_second": 4.358, "step": 102 }, { "epoch": 35.0, "eval_accuracy": 1.0, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 1.0, "eval_f1_lump": 1.0, "eval_f1_macro": 1.0, "eval_f1_moist": 1.0, "eval_f1_rockies": 1.0, "eval_loss": 0.014307624660432339, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 1.0, "eval_precision_lump": 1.0, "eval_precision_macro": 1.0, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 1.0, "eval_recall_moist": 1.0, "eval_recall_rockies": 1.0, "eval_runtime": 0.6652, "eval_samples_per_second": 57.129, "eval_steps_per_second": 4.51, "step": 105 }, { "epoch": 36.0, "eval_accuracy": 1.0, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 1.0, "eval_f1_lump": 1.0, "eval_f1_macro": 1.0, "eval_f1_moist": 1.0, "eval_f1_rockies": 1.0, "eval_loss": 0.013969190418720245, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 1.0, "eval_precision_lump": 1.0, "eval_precision_macro": 1.0, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 1.0, "eval_recall_moist": 1.0, "eval_recall_rockies": 1.0, "eval_runtime": 0.6928, "eval_samples_per_second": 54.846, "eval_steps_per_second": 4.33, "step": 108 }, { "epoch": 36.8, "grad_norm": 0.011866221204400063, "learning_rate": 1.5185185185185186e-05, "loss": 0.001, "step": 110 }, { "epoch": 37.0, "eval_accuracy": 1.0, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 1.0, "eval_f1_lump": 1.0, "eval_f1_macro": 1.0, "eval_f1_moist": 1.0, "eval_f1_rockies": 1.0, "eval_loss": 0.013421060517430305, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 1.0, "eval_precision_lump": 1.0, "eval_precision_macro": 1.0, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 1.0, "eval_recall_moist": 1.0, "eval_recall_rockies": 1.0, "eval_runtime": 0.6713, "eval_samples_per_second": 56.605, "eval_steps_per_second": 4.469, "step": 111 }, { "epoch": 38.0, "eval_accuracy": 1.0, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 1.0, "eval_f1_lump": 1.0, "eval_f1_macro": 1.0, "eval_f1_moist": 1.0, "eval_f1_rockies": 1.0, "eval_loss": 0.012647929601371288, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 1.0, "eval_precision_lump": 1.0, "eval_precision_macro": 1.0, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 1.0, "eval_recall_moist": 1.0, "eval_recall_rockies": 1.0, "eval_runtime": 0.6646, "eval_samples_per_second": 57.176, "eval_steps_per_second": 4.514, "step": 114 }, { "epoch": 39.0, "eval_accuracy": 1.0, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 1.0, "eval_f1_lump": 1.0, "eval_f1_macro": 1.0, "eval_f1_moist": 1.0, "eval_f1_rockies": 1.0, "eval_loss": 0.011756044812500477, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 1.0, "eval_precision_lump": 1.0, "eval_precision_macro": 1.0, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 1.0, "eval_recall_moist": 1.0, "eval_recall_rockies": 1.0, "eval_runtime": 0.7478, "eval_samples_per_second": 50.813, "eval_steps_per_second": 4.012, "step": 117 }, { "epoch": 40.0, "grad_norm": 0.016002096235752106, "learning_rate": 1.1481481481481482e-05, "loss": 0.001, "step": 120 }, { "epoch": 40.0, "eval_accuracy": 1.0, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 1.0, "eval_f1_lump": 1.0, "eval_f1_macro": 1.0, "eval_f1_moist": 1.0, "eval_f1_rockies": 1.0, "eval_loss": 0.01096806488931179, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 1.0, "eval_precision_lump": 1.0, "eval_precision_macro": 1.0, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 1.0, "eval_recall_moist": 1.0, "eval_recall_rockies": 1.0, "eval_runtime": 0.663, "eval_samples_per_second": 57.319, "eval_steps_per_second": 4.525, "step": 120 }, { "epoch": 41.0, "eval_accuracy": 1.0, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 1.0, "eval_f1_lump": 1.0, "eval_f1_macro": 1.0, "eval_f1_moist": 1.0, "eval_f1_rockies": 1.0, "eval_loss": 0.010448604822158813, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 1.0, "eval_precision_lump": 1.0, "eval_precision_macro": 1.0, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 1.0, "eval_recall_moist": 1.0, "eval_recall_rockies": 1.0, "eval_runtime": 0.6705, "eval_samples_per_second": 56.673, "eval_steps_per_second": 4.474, "step": 123 }, { "epoch": 42.0, "eval_accuracy": 1.0, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 1.0, "eval_f1_lump": 1.0, "eval_f1_macro": 1.0, "eval_f1_moist": 1.0, "eval_f1_rockies": 1.0, "eval_loss": 0.010021907277405262, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 1.0, "eval_precision_lump": 1.0, "eval_precision_macro": 1.0, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 1.0, "eval_recall_moist": 1.0, "eval_recall_rockies": 1.0, "eval_runtime": 0.6723, "eval_samples_per_second": 56.521, "eval_steps_per_second": 4.462, "step": 126 }, { "epoch": 43.0, "eval_accuracy": 1.0, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 1.0, "eval_f1_lump": 1.0, "eval_f1_macro": 1.0, "eval_f1_moist": 1.0, "eval_f1_rockies": 1.0, "eval_loss": 0.009785743430256844, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 1.0, "eval_precision_lump": 1.0, "eval_precision_macro": 1.0, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 1.0, "eval_recall_moist": 1.0, "eval_recall_rockies": 1.0, "eval_runtime": 0.689, "eval_samples_per_second": 55.148, "eval_steps_per_second": 4.354, "step": 129 }, { "epoch": 43.4, "grad_norm": 0.011299243196845055, "learning_rate": 7.777777777777777e-06, "loss": 0.0009, "step": 130 }, { "epoch": 44.0, "eval_accuracy": 1.0, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 1.0, "eval_f1_lump": 1.0, "eval_f1_macro": 1.0, "eval_f1_moist": 1.0, "eval_f1_rockies": 1.0, "eval_loss": 0.009630183689296246, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 1.0, "eval_precision_lump": 1.0, "eval_precision_macro": 1.0, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 1.0, "eval_recall_moist": 1.0, "eval_recall_rockies": 1.0, "eval_runtime": 0.6698, "eval_samples_per_second": 56.735, "eval_steps_per_second": 4.479, "step": 132 }, { "epoch": 45.0, "eval_accuracy": 1.0, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 1.0, "eval_f1_lump": 1.0, "eval_f1_macro": 1.0, "eval_f1_moist": 1.0, "eval_f1_rockies": 1.0, "eval_loss": 0.009469670243561268, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 1.0, "eval_precision_lump": 1.0, "eval_precision_macro": 1.0, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 1.0, "eval_recall_moist": 1.0, "eval_recall_rockies": 1.0, "eval_runtime": 0.6835, "eval_samples_per_second": 55.592, "eval_steps_per_second": 4.389, "step": 135 }, { "epoch": 46.0, "eval_accuracy": 1.0, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 1.0, "eval_f1_lump": 1.0, "eval_f1_macro": 1.0, "eval_f1_moist": 1.0, "eval_f1_rockies": 1.0, "eval_loss": 0.009332198649644852, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 1.0, "eval_precision_lump": 1.0, "eval_precision_macro": 1.0, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 1.0, "eval_recall_moist": 1.0, "eval_recall_rockies": 1.0, "eval_runtime": 0.672, "eval_samples_per_second": 56.549, "eval_steps_per_second": 4.464, "step": 138 }, { "epoch": 46.8, "grad_norm": 0.011965502053499222, "learning_rate": 4.074074074074075e-06, "loss": 0.0009, "step": 140 }, { "epoch": 47.0, "eval_accuracy": 1.0, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 1.0, "eval_f1_lump": 1.0, "eval_f1_macro": 1.0, "eval_f1_moist": 1.0, "eval_f1_rockies": 1.0, "eval_loss": 0.009224910289049149, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 1.0, "eval_precision_lump": 1.0, "eval_precision_macro": 1.0, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 1.0, "eval_recall_moist": 1.0, "eval_recall_rockies": 1.0, "eval_runtime": 0.6702, "eval_samples_per_second": 56.702, "eval_steps_per_second": 4.476, "step": 141 }, { "epoch": 48.0, "eval_accuracy": 1.0, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 1.0, "eval_f1_lump": 1.0, "eval_f1_macro": 1.0, "eval_f1_moist": 1.0, "eval_f1_rockies": 1.0, "eval_loss": 0.009173477999866009, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 1.0, "eval_precision_lump": 1.0, "eval_precision_macro": 1.0, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 1.0, "eval_recall_moist": 1.0, "eval_recall_rockies": 1.0, "eval_runtime": 0.7274, "eval_samples_per_second": 52.242, "eval_steps_per_second": 4.124, "step": 144 }, { "epoch": 49.0, "eval_accuracy": 1.0, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 1.0, "eval_f1_lump": 1.0, "eval_f1_macro": 1.0, "eval_f1_moist": 1.0, "eval_f1_rockies": 1.0, "eval_loss": 0.009150910191237926, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 1.0, "eval_precision_lump": 1.0, "eval_precision_macro": 1.0, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 1.0, "eval_recall_moist": 1.0, "eval_recall_rockies": 1.0, "eval_runtime": 0.6693, "eval_samples_per_second": 56.778, "eval_steps_per_second": 4.482, "step": 147 }, { "epoch": 50.0, "grad_norm": 0.01177594717592001, "learning_rate": 3.703703703703704e-07, "loss": 0.0009, "step": 150 }, { "epoch": 50.0, "eval_accuracy": 1.0, "eval_f1_dry": 1.0, "eval_f1_firm": 1.0, "eval_f1_humid": 1.0, "eval_f1_lump": 1.0, "eval_f1_macro": 1.0, "eval_f1_moist": 1.0, "eval_f1_rockies": 1.0, "eval_loss": 0.009149772115051746, "eval_precision_dry": 1.0, "eval_precision_firm": 1.0, "eval_precision_humid": 1.0, "eval_precision_lump": 1.0, "eval_precision_macro": 1.0, "eval_precision_moist": 1.0, "eval_precision_rockies": 1.0, "eval_recall_dry": 1.0, "eval_recall_firm": 1.0, "eval_recall_humid": 1.0, "eval_recall_lump": 1.0, "eval_recall_macro": 1.0, "eval_recall_moist": 1.0, "eval_recall_rockies": 1.0, "eval_runtime": 0.6821, "eval_samples_per_second": 55.711, "eval_steps_per_second": 4.398, "step": 150 }, { "epoch": 50.0, "step": 150, "total_flos": 1.74247705460736e+18, "train_loss": 0.16261619688322146, "train_runtime": 336.1639, "train_samples_per_second": 22.311, "train_steps_per_second": 0.446 } ], "logging_steps": 10, "max_steps": 150, "num_input_tokens_seen": 0, "num_train_epochs": 50, "save_steps": 500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 1.74247705460736e+18, "train_batch_size": 16, "trial_name": null, "trial_params": null }