{ "best_metric": 0.9322203066872333, "best_model_checkpoint": "/content/drive/MyDrive/checkpoint_layoutlm2/checkpoint-3500", "epoch": 26.31578947368421, "global_step": 5000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.53, "eval_accuracy": 0.5655867006431259, "eval_f1": 0.49600000000000005, "eval_loss": 1.9622313976287842, "eval_precision": 0.6104310803618946, "eval_recall": 0.41769847050254916, "eval_runtime": 31.7963, "eval_samples_per_second": 5.976, "eval_steps_per_second": 1.51, "step": 100 }, { "epoch": 1.05, "eval_accuracy": 0.7380172309185778, "eval_f1": 0.6739791685869665, "eval_loss": 1.2630114555358887, "eval_precision": 0.682471532574202, "eval_recall": 0.6656955571740714, "eval_runtime": 32.3716, "eval_samples_per_second": 5.869, "eval_steps_per_second": 1.483, "step": 200 }, { "epoch": 1.58, "eval_accuracy": 0.7893459531610242, "eval_f1": 0.7480542986425339, "eval_loss": 0.9176977872848511, "eval_precision": 0.7436128103634401, "eval_recall": 0.7525491624180627, "eval_runtime": 32.1494, "eval_samples_per_second": 5.91, "eval_steps_per_second": 1.493, "step": 300 }, { "epoch": 2.11, "eval_accuracy": 0.8295109816769809, "eval_f1": 0.8007957319830002, "eval_loss": 0.7080672979354858, "eval_precision": 0.7954014729656906, "eval_recall": 0.8062636562272396, "eval_runtime": 32.0545, "eval_samples_per_second": 5.927, "eval_steps_per_second": 1.497, "step": 400 }, { "epoch": 2.63, "learning_rate": 9.666666666666667e-06, "loss": 1.4294, "step": 500 }, { "epoch": 2.63, "eval_accuracy": 0.8411600533915787, "eval_f1": 0.8213092550790069, "eval_loss": 0.6136476397514343, "eval_precision": 0.814615797958087, "eval_recall": 0.8281136198106337, "eval_runtime": 32.0473, "eval_samples_per_second": 5.929, "eval_steps_per_second": 1.498, "step": 500 }, { "epoch": 3.16, "eval_accuracy": 0.8741657565829389, "eval_f1": 0.8656448866182666, "eval_loss": 0.5390823483467102, "eval_precision": 0.8524271844660194, "eval_recall": 0.879278951201748, "eval_runtime": 33.0229, "eval_samples_per_second": 5.754, "eval_steps_per_second": 1.454, "step": 600 }, { "epoch": 3.68, "eval_accuracy": 0.8869069287707803, "eval_f1": 0.878114599262391, "eval_loss": 0.47398096323013306, "eval_precision": 0.8677333333333334, "eval_recall": 0.8887472687545521, "eval_runtime": 32.5116, "eval_samples_per_second": 5.844, "eval_steps_per_second": 1.476, "step": 700 }, { "epoch": 4.21, "eval_accuracy": 0.8989200339764591, "eval_f1": 0.893278463648834, "eval_loss": 0.4286675751209259, "eval_precision": 0.8972992834833732, "eval_recall": 0.8892935178441369, "eval_runtime": 32.15, "eval_samples_per_second": 5.91, "eval_steps_per_second": 1.493, "step": 800 }, { "epoch": 4.74, "eval_accuracy": 0.9040165028515956, "eval_f1": 0.8944705457173835, "eval_loss": 0.40272650122642517, "eval_precision": 0.8877331420373027, "eval_recall": 0.9013109978150037, "eval_runtime": 32.2339, "eval_samples_per_second": 5.894, "eval_steps_per_second": 1.489, "step": 900 }, { "epoch": 5.26, "learning_rate": 9.333333333333334e-06, "loss": 0.455, "step": 1000 }, { "epoch": 5.26, "eval_accuracy": 0.9131173401286252, "eval_f1": 0.9035698147311342, "eval_loss": 0.369215190410614, "eval_precision": 0.8970034092948143, "eval_recall": 0.9102330662782229, "eval_runtime": 32.0091, "eval_samples_per_second": 5.936, "eval_steps_per_second": 1.5, "step": 1000 }, { "epoch": 5.79, "eval_accuracy": 0.9172430530275452, "eval_f1": 0.912167606768735, "eval_loss": 0.36320310831069946, "eval_precision": 0.8973049145675532, "eval_recall": 0.9275309541150765, "eval_runtime": 31.8391, "eval_samples_per_second": 5.968, "eval_steps_per_second": 1.508, "step": 1100 }, { "epoch": 6.32, "eval_accuracy": 0.9166363305424099, "eval_f1": 0.9132502018480307, "eval_loss": 0.34437164664268494, "eval_precision": 0.9000884173297966, "eval_recall": 0.92680262199563, "eval_runtime": 31.688, "eval_samples_per_second": 5.996, "eval_steps_per_second": 1.515, "step": 1200 }, { "epoch": 6.84, "eval_accuracy": 0.924766411843223, "eval_f1": 0.9212297616881936, "eval_loss": 0.327307790517807, "eval_precision": 0.920392584514722, "eval_recall": 0.922068463219228, "eval_runtime": 31.8134, "eval_samples_per_second": 5.972, "eval_steps_per_second": 1.509, "step": 1300 }, { "epoch": 7.37, "eval_accuracy": 0.9242810338551146, "eval_f1": 0.9209428830462375, "eval_loss": 0.32373183965682983, "eval_precision": 0.9171180931744312, "eval_recall": 0.9247997086671522, "eval_runtime": 32.69, "eval_samples_per_second": 5.812, "eval_steps_per_second": 1.468, "step": 1400 }, { "epoch": 7.89, "learning_rate": 9e-06, "loss": 0.2736, "step": 1500 }, { "epoch": 7.89, "eval_accuracy": 0.9282854022570076, "eval_f1": 0.9256823709575714, "eval_loss": 0.31131741404533386, "eval_precision": 0.916027812444286, "eval_recall": 0.9355426074289876, "eval_runtime": 32.0518, "eval_samples_per_second": 5.928, "eval_steps_per_second": 1.498, "step": 1500 }, { "epoch": 8.42, "eval_accuracy": 0.9254944788253853, "eval_f1": 0.9237975139614484, "eval_loss": 0.3146894872188568, "eval_precision": 0.9140819964349376, "eval_recall": 0.9337217771303714, "eval_runtime": 32.0386, "eval_samples_per_second": 5.93, "eval_steps_per_second": 1.498, "step": 1600 }, { "epoch": 8.95, "eval_accuracy": 0.9253731343283582, "eval_f1": 0.9235605856462767, "eval_loss": 0.3176872134208679, "eval_precision": 0.9113632334692431, "eval_recall": 0.9360888565185724, "eval_runtime": 32.1667, "eval_samples_per_second": 5.907, "eval_steps_per_second": 1.492, "step": 1700 }, { "epoch": 9.47, "eval_accuracy": 0.9262225458075476, "eval_f1": 0.9248316120341267, "eval_loss": 0.3194420337677002, "eval_precision": 0.9124579124579124, "eval_recall": 0.9375455207574654, "eval_runtime": 32.186, "eval_samples_per_second": 5.903, "eval_steps_per_second": 1.491, "step": 1800 }, { "epoch": 10.0, "eval_accuracy": 0.9293775027302512, "eval_f1": 0.9273722955381991, "eval_loss": 0.30748510360717773, "eval_precision": 0.9146449442181689, "eval_recall": 0.9404588492352512, "eval_runtime": 31.8871, "eval_samples_per_second": 5.959, "eval_steps_per_second": 1.505, "step": 1900 }, { "epoch": 10.53, "learning_rate": 8.666666666666668e-06, "loss": 0.2045, "step": 2000 }, { "epoch": 10.53, "eval_accuracy": 0.9305909477005218, "eval_f1": 0.928266981046522, "eval_loss": 0.3004026710987091, "eval_precision": 0.9246612466124661, "eval_recall": 0.9319009468317553, "eval_runtime": 32.044, "eval_samples_per_second": 5.929, "eval_steps_per_second": 1.498, "step": 2000 }, { "epoch": 11.05, "eval_accuracy": 0.9284067467540347, "eval_f1": 0.9264534623309147, "eval_loss": 0.3036515414714813, "eval_precision": 0.9118321283724211, "eval_recall": 0.9415513474144209, "eval_runtime": 31.8687, "eval_samples_per_second": 5.962, "eval_steps_per_second": 1.506, "step": 2100 }, { "epoch": 11.58, "eval_accuracy": 0.9307122921975488, "eval_f1": 0.9279507603186097, "eval_loss": 0.30012640357017517, "eval_precision": 0.9226061915046796, "eval_recall": 0.9333576110706482, "eval_runtime": 31.9364, "eval_samples_per_second": 5.949, "eval_steps_per_second": 1.503, "step": 2200 }, { "epoch": 12.11, "eval_accuracy": 0.9318043926707924, "eval_f1": 0.9303956834532375, "eval_loss": 0.3051491975784302, "eval_precision": 0.9191542288557214, "eval_recall": 0.9419155134741443, "eval_runtime": 31.9279, "eval_samples_per_second": 5.951, "eval_steps_per_second": 1.503, "step": 2300 }, { "epoch": 12.63, "eval_accuracy": 0.9299842252153865, "eval_f1": 0.9288619723402333, "eval_loss": 0.31714528799057007, "eval_precision": 0.9222760725183988, "eval_recall": 0.9355426074289876, "eval_runtime": 32.3661, "eval_samples_per_second": 5.87, "eval_steps_per_second": 1.483, "step": 2400 }, { "epoch": 13.16, "learning_rate": 8.333333333333334e-06, "loss": 0.1678, "step": 2500 }, { "epoch": 13.16, "eval_accuracy": 0.9279213687659265, "eval_f1": 0.9271131805157592, "eval_loss": 0.321869432926178, "eval_precision": 0.9120859760394644, "eval_recall": 0.9426438455935907, "eval_runtime": 32.586, "eval_samples_per_second": 5.831, "eval_steps_per_second": 1.473, "step": 2500 }, { "epoch": 13.68, "eval_accuracy": 0.9273146462807912, "eval_f1": 0.9248711689720641, "eval_loss": 0.3112223446369171, "eval_precision": 0.9184772849703717, "eval_recall": 0.9313546977421704, "eval_runtime": 32.4269, "eval_samples_per_second": 5.859, "eval_steps_per_second": 1.48, "step": 2600 }, { "epoch": 14.21, "eval_accuracy": 0.92901346923917, "eval_f1": 0.9273105820584773, "eval_loss": 0.3135831654071808, "eval_precision": 0.922052205220522, "eval_recall": 0.9326292789512017, "eval_runtime": 31.2652, "eval_samples_per_second": 6.077, "eval_steps_per_second": 1.535, "step": 2700 }, { "epoch": 14.74, "eval_accuracy": 0.9296201917243053, "eval_f1": 0.9286809124515373, "eval_loss": 0.3137897551059723, "eval_precision": 0.9198071084122165, "eval_recall": 0.937727603787327, "eval_runtime": 31.2737, "eval_samples_per_second": 6.075, "eval_steps_per_second": 1.535, "step": 2800 }, { "epoch": 15.26, "eval_accuracy": 0.93313918213809, "eval_f1": 0.9307971014492753, "eval_loss": 0.3145933747291565, "eval_precision": 0.9260994953136266, "eval_recall": 0.9355426074289876, "eval_runtime": 32.3029, "eval_samples_per_second": 5.882, "eval_steps_per_second": 1.486, "step": 2900 }, { "epoch": 15.79, "learning_rate": 8.000000000000001e-06, "loss": 0.1404, "step": 3000 }, { "epoch": 15.79, "eval_accuracy": 0.9296201917243053, "eval_f1": 0.9290786516853932, "eval_loss": 0.31863638758659363, "eval_precision": 0.917450736729984, "eval_recall": 0.9410050983248361, "eval_runtime": 31.4449, "eval_samples_per_second": 6.042, "eval_steps_per_second": 1.526, "step": 3000 }, { "epoch": 16.32, "eval_accuracy": 0.9314403591797112, "eval_f1": 0.929384143037746, "eval_loss": 0.3153584599494934, "eval_precision": 0.9218917950555356, "eval_recall": 0.9369992716678806, "eval_runtime": 31.167, "eval_samples_per_second": 6.096, "eval_steps_per_second": 1.54, "step": 3100 }, { "epoch": 16.84, "eval_accuracy": 0.9273146462807912, "eval_f1": 0.926561797752809, "eval_loss": 0.34182220697402954, "eval_precision": 0.9149653825670158, "eval_recall": 0.9384559359067735, "eval_runtime": 31.6096, "eval_samples_per_second": 6.011, "eval_steps_per_second": 1.519, "step": 3200 }, { "epoch": 17.37, "eval_accuracy": 0.925009100837277, "eval_f1": 0.9233380986418871, "eval_loss": 0.35532286763191223, "eval_precision": 0.9064912280701755, "eval_recall": 0.9408230152949745, "eval_runtime": 32.7011, "eval_samples_per_second": 5.81, "eval_steps_per_second": 1.468, "step": 3300 }, { "epoch": 17.89, "eval_accuracy": 0.9294988472272783, "eval_f1": 0.9289882395188078, "eval_loss": 0.339712530374527, "eval_precision": 0.9162387108199044, "eval_recall": 0.9420975965040058, "eval_runtime": 31.1932, "eval_samples_per_second": 6.091, "eval_steps_per_second": 1.539, "step": 3400 }, { "epoch": 18.42, "learning_rate": 7.666666666666667e-06, "loss": 0.1174, "step": 3500 }, { "epoch": 18.42, "eval_accuracy": 0.9322897706589006, "eval_f1": 0.9322203066872333, "eval_loss": 0.32590094208717346, "eval_precision": 0.929101103273648, "eval_recall": 0.935360524399126, "eval_runtime": 31.3047, "eval_samples_per_second": 6.069, "eval_steps_per_second": 1.533, "step": 3500 }, { "epoch": 18.95, "eval_accuracy": 0.9299842252153865, "eval_f1": 0.9293038316243929, "eval_loss": 0.330241322517395, "eval_precision": 0.9182367579097049, "eval_recall": 0.9406409322651129, "eval_runtime": 31.3595, "eval_samples_per_second": 6.059, "eval_steps_per_second": 1.531, "step": 3600 }, { "epoch": 19.47, "eval_accuracy": 0.9303482587064676, "eval_f1": 0.9284752759580005, "eval_loss": 0.33720284700393677, "eval_precision": 0.9154132012033268, "eval_recall": 0.9419155134741443, "eval_runtime": 32.5529, "eval_samples_per_second": 5.837, "eval_steps_per_second": 1.475, "step": 3700 }, { "epoch": 20.0, "eval_accuracy": 0.9305909477005218, "eval_f1": 0.9294531038832327, "eval_loss": 0.33688944578170776, "eval_precision": 0.9199215266630997, "eval_recall": 0.9391842680262199, "eval_runtime": 31.1686, "eval_samples_per_second": 6.096, "eval_steps_per_second": 1.54, "step": 3800 }, { "epoch": 20.53, "eval_accuracy": 0.9302269142094406, "eval_f1": 0.9289775291038715, "eval_loss": 0.33882710337638855, "eval_precision": 0.9209160851672928, "eval_recall": 0.9371813546977422, "eval_runtime": 31.4744, "eval_samples_per_second": 6.037, "eval_steps_per_second": 1.525, "step": 3900 }, { "epoch": 21.05, "learning_rate": 7.333333333333333e-06, "loss": 0.0978, "step": 4000 }, { "epoch": 21.05, "eval_accuracy": 0.9297415362213324, "eval_f1": 0.9305718144979739, "eval_loss": 0.34309884905815125, "eval_precision": 0.9205415998574737, "eval_recall": 0.9408230152949745, "eval_runtime": 31.0896, "eval_samples_per_second": 6.111, "eval_steps_per_second": 1.544, "step": 4000 }, { "epoch": 21.58, "eval_accuracy": 0.9313190146826842, "eval_f1": 0.9312798342790237, "eval_loss": 0.3530495762825012, "eval_precision": 0.9214043842452326, "eval_recall": 0.9413692643845594, "eval_runtime": 32.1875, "eval_samples_per_second": 5.903, "eval_steps_per_second": 1.491, "step": 4100 }, { "epoch": 22.11, "eval_accuracy": 0.9325324596529547, "eval_f1": 0.932169845268082, "eval_loss": 0.34749624133110046, "eval_precision": 0.9212304409672831, "eval_recall": 0.9433721777130372, "eval_runtime": 31.1794, "eval_samples_per_second": 6.094, "eval_steps_per_second": 1.539, "step": 4200 }, { "epoch": 22.63, "eval_accuracy": 0.9302269142094406, "eval_f1": 0.9302577040908272, "eval_loss": 0.35649344325065613, "eval_precision": 0.9207991437745273, "eval_recall": 0.9399126001456665, "eval_runtime": 32.3866, "eval_samples_per_second": 5.867, "eval_steps_per_second": 1.482, "step": 4300 }, { "epoch": 23.16, "eval_accuracy": 0.9326538041499818, "eval_f1": 0.9312274368231047, "eval_loss": 0.35333752632141113, "eval_precision": 0.9232283464566929, "eval_recall": 0.9393663510560816, "eval_runtime": 31.2877, "eval_samples_per_second": 6.073, "eval_steps_per_second": 1.534, "step": 4400 }, { "epoch": 23.68, "learning_rate": 7e-06, "loss": 0.0822, "step": 4500 }, { "epoch": 23.68, "eval_accuracy": 0.9333818711321441, "eval_f1": 0.932110421724665, "eval_loss": 0.3559868335723877, "eval_precision": 0.9207674542547521, "eval_recall": 0.9437363437727604, "eval_runtime": 31.1716, "eval_samples_per_second": 6.095, "eval_steps_per_second": 1.54, "step": 4500 }, { "epoch": 24.21, "eval_accuracy": 0.9337459046232254, "eval_f1": 0.932995750067818, "eval_loss": 0.3473477065563202, "eval_precision": 0.9267109753906951, "eval_recall": 0.9393663510560816, "eval_runtime": 31.2203, "eval_samples_per_second": 6.086, "eval_steps_per_second": 1.537, "step": 4600 }, { "epoch": 24.74, "eval_accuracy": 0.9287707802451158, "eval_f1": 0.9275258194881005, "eval_loss": 0.3723868131637573, "eval_precision": 0.9151160730108099, "eval_recall": 0.9402767662053897, "eval_runtime": 32.4085, "eval_samples_per_second": 5.863, "eval_steps_per_second": 1.481, "step": 4700 }, { "epoch": 25.26, "eval_accuracy": 0.9327751486470088, "eval_f1": 0.9308232750855701, "eval_loss": 0.3668186068534851, "eval_precision": 0.9210338680926916, "eval_recall": 0.9408230152949745, "eval_runtime": 31.1822, "eval_samples_per_second": 6.093, "eval_steps_per_second": 1.539, "step": 4800 }, { "epoch": 25.79, "eval_accuracy": 0.9342312826113336, "eval_f1": 0.932900432900433, "eval_loss": 0.35110706090927124, "eval_precision": 0.9242315939957112, "eval_recall": 0.9417334304442826, "eval_runtime": 31.632, "eval_samples_per_second": 6.007, "eval_steps_per_second": 1.517, "step": 4900 }, { "epoch": 26.32, "learning_rate": 6.666666666666667e-06, "loss": 0.0685, "step": 5000 }, { "epoch": 26.32, "eval_accuracy": 0.9322897706589006, "eval_f1": 0.9301610276822869, "eval_loss": 0.349013090133667, "eval_precision": 0.9243078029485796, "eval_recall": 0.9360888565185724, "eval_runtime": 31.5377, "eval_samples_per_second": 6.025, "eval_steps_per_second": 1.522, "step": 5000 } ], "max_steps": 15000, "num_train_epochs": 79, "total_flos": 5296004751249408.0, "trial_name": null, "trial_params": null }