{"eval_loss":1.1322584152,"eval_rouge":0.7466957847,"eval_tool_call_equivalence":0.0,"eval_binary_tool_call":0.0,"eval_staged_tool_call":0.0,"eval_runtime":10.035,"eval_samples_per_second":11.56,"eval_steps_per_second":11.56,"epoch":0.0,"step":0,"loss":null,"grad_norm":null,"learning_rate":null,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.0248336148,"step":250,"loss":0.6023,"grad_norm":1.859403491,"learning_rate":0.0000061817,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.0496672296,"step":500,"loss":0.1788,"grad_norm":0.4753092825,"learning_rate":0.0000123883,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.0745008443,"step":750,"loss":0.1174,"grad_norm":2.3618509769,"learning_rate":0.0000185948,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.0993344591,"step":1000,"loss":0.1393,"grad_norm":14.4716386795,"learning_rate":0.0000248014,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.1241680739,"step":1250,"loss":0.1266,"grad_norm":2.8318195343,"learning_rate":0.0000310079,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.1490016887,"step":1500,"loss":0.1185,"grad_norm":4.5640730858,"learning_rate":0.0000372145,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.1738353035,"step":1750,"loss":0.0968,"grad_norm":0.7261046171,"learning_rate":0.0000434211,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.1986689182,"step":2000,"loss":0.0878,"grad_norm":0.5482857823,"learning_rate":0.0000496276,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.223502533,"step":2250,"loss":0.0826,"grad_norm":0.0892484263,"learning_rate":0.0000496928,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.2483361478,"step":2500,"loss":0.0881,"grad_norm":3.6561279297,"learning_rate":0.0000493661,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.2731697626,"step":2750,"loss":0.0784,"grad_norm":0.715729475,"learning_rate":0.0000490393,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.2980033774,"step":3000,"loss":0.0841,"grad_norm":0.2599439919,"learning_rate":0.0000487126,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.3228369922,"step":3250,"loss":0.0704,"grad_norm":0.136757344,"learning_rate":0.0000483858,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.3476706069,"step":3500,"loss":0.0627,"grad_norm":0.2034457624,"learning_rate":0.000048059,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.3725042217,"step":3750,"loss":0.0608,"grad_norm":0.1265211999,"learning_rate":0.0000477323,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.3973378365,"step":4000,"loss":0.0823,"grad_norm":0.5200492144,"learning_rate":0.0000474055,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.4221714513,"step":4250,"loss":0.0715,"grad_norm":0.4572677016,"learning_rate":0.0000470787,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.4470050661,"step":4500,"loss":0.0583,"grad_norm":0.261872232,"learning_rate":0.000046752,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.4718386808,"step":4750,"loss":0.0552,"grad_norm":0.803602159,"learning_rate":0.0000464252,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.4966722956,"step":5000,"loss":0.0664,"grad_norm":4.0464506149,"learning_rate":0.0000460984,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.5215059104,"step":5250,"loss":0.0657,"grad_norm":0.2125871032,"learning_rate":0.0000457717,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.5463395252,"step":5500,"loss":0.0613,"grad_norm":0.1216437444,"learning_rate":0.0000454449,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.57117314,"step":5750,"loss":0.0538,"grad_norm":0.156804204,"learning_rate":0.0000451182,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.5960067547,"step":6000,"loss":0.0541,"grad_norm":0.1619042605,"learning_rate":0.0000447914,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.6208403695,"step":6250,"loss":0.071,"grad_norm":0.1102830395,"learning_rate":0.0000444646,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.6456739843,"step":6500,"loss":0.0543,"grad_norm":0.1619913131,"learning_rate":0.0000441379,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.6705075991,"step":6750,"loss":0.0491,"grad_norm":1.8771800995,"learning_rate":0.0000438111,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.6953412139,"step":7000,"loss":0.0629,"grad_norm":0.8181144595,"learning_rate":0.0000434843,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.7201748286,"step":7250,"loss":0.0595,"grad_norm":0.0885839611,"learning_rate":0.0000431576,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.7450084434,"step":7500,"loss":0.0475,"grad_norm":0.0475071594,"learning_rate":0.0000428308,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.7698420582,"step":7750,"loss":0.05,"grad_norm":0.2234110832,"learning_rate":0.0000425041,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.794675673,"step":8000,"loss":0.0628,"grad_norm":0.7562886477,"learning_rate":0.0000421773,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.8195092878,"step":8250,"loss":0.0592,"grad_norm":0.1472263932,"learning_rate":0.0000418505,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.8443429026,"step":8500,"loss":0.0519,"grad_norm":0.8230469227,"learning_rate":0.0000415238,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.8691765173,"step":8750,"loss":0.0573,"grad_norm":0.3549256325,"learning_rate":0.000041197,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.8940101321,"step":9000,"loss":0.0568,"grad_norm":1.0336612463,"learning_rate":0.0000408702,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.9188437469,"step":9250,"loss":0.0584,"grad_norm":0.2352485806,"learning_rate":0.0000405435,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.9436773617,"step":9500,"loss":0.0569,"grad_norm":0.1039064974,"learning_rate":0.0000402167,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.9685109765,"step":9750,"loss":0.0646,"grad_norm":0.587021172,"learning_rate":0.0000398899,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":0.9933445912,"step":10000,"loss":0.0488,"grad_norm":13.2972211838,"learning_rate":0.0000395632,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":0.0643972456,"eval_rouge":0.9763679582,"eval_tool_call_equivalence":0.8103448276,"eval_binary_tool_call":0.8017241379,"eval_staged_tool_call":0.8556034483,"eval_runtime":9.0438,"eval_samples_per_second":12.827,"eval_steps_per_second":12.827,"epoch":1.0,"step":10067,"loss":null,"grad_norm":null,"learning_rate":null,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.018178206,"step":10250,"loss":0.05,"grad_norm":0.0552540123,"learning_rate":0.0000392364,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.0430118208,"step":10500,"loss":0.0395,"grad_norm":0.4703384042,"learning_rate":0.0000389097,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.0678454356,"step":10750,"loss":0.0545,"grad_norm":0.392344743,"learning_rate":0.0000385829,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.0926790504,"step":11000,"loss":0.0473,"grad_norm":0.4328499138,"learning_rate":0.0000382561,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.1175126651,"step":11250,"loss":0.0448,"grad_norm":2.6124651432,"learning_rate":0.0000379294,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.1423462799,"step":11500,"loss":0.047,"grad_norm":0.4061683714,"learning_rate":0.0000376026,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.1671798947,"step":11750,"loss":0.0557,"grad_norm":0.1156855524,"learning_rate":0.0000372758,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.1920135095,"step":12000,"loss":0.0478,"grad_norm":0.1109383553,"learning_rate":0.0000369491,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.2168471243,"step":12250,"loss":0.041,"grad_norm":0.1112424359,"learning_rate":0.0000366223,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.241680739,"step":12500,"loss":0.0447,"grad_norm":0.1579927057,"learning_rate":0.0000362956,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.2665143538,"step":12750,"loss":0.0489,"grad_norm":0.4291910231,"learning_rate":0.0000359688,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.2913479686,"step":13000,"loss":0.0469,"grad_norm":0.6510604024,"learning_rate":0.000035642,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.3161815834,"step":13250,"loss":0.0431,"grad_norm":0.6754758954,"learning_rate":0.0000353153,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.3410151982,"step":13500,"loss":0.0392,"grad_norm":0.3190574646,"learning_rate":0.0000349885,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.365848813,"step":13750,"loss":0.0382,"grad_norm":0.0556767248,"learning_rate":0.0000346617,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.3906824277,"step":14000,"loss":0.0551,"grad_norm":0.1057418212,"learning_rate":0.000034335,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.4155160425,"step":14250,"loss":0.0516,"grad_norm":0.3781132698,"learning_rate":0.0000340082,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.4403496573,"step":14500,"loss":0.0488,"grad_norm":0.0596432909,"learning_rate":0.0000336814,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.4651832721,"step":14750,"loss":0.0444,"grad_norm":1.0107779503,"learning_rate":0.0000333547,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.4900168869,"step":15000,"loss":0.0449,"grad_norm":0.8016837835,"learning_rate":0.0000330279,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.5148505016,"step":15250,"loss":0.045,"grad_norm":0.1110835075,"learning_rate":0.0000327012,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.5396841164,"step":15500,"loss":0.0495,"grad_norm":0.1134795621,"learning_rate":0.0000323744,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.5645177312,"step":15750,"loss":0.0571,"grad_norm":0.0876661763,"learning_rate":0.0000320476,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.589351346,"step":16000,"loss":0.0437,"grad_norm":0.0965368077,"learning_rate":0.0000317209,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.6141849608,"step":16250,"loss":0.0456,"grad_norm":0.6337117553,"learning_rate":0.0000313941,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.6390185755,"step":16500,"loss":0.0449,"grad_norm":0.061980363,"learning_rate":0.0000310673,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.6638521903,"step":16750,"loss":0.0457,"grad_norm":0.0588269979,"learning_rate":0.0000307406,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.6886858051,"step":17000,"loss":0.0468,"grad_norm":0.792786479,"learning_rate":0.0000304138,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.7135194199,"step":17250,"loss":0.0518,"grad_norm":0.0996412411,"learning_rate":0.000030087,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.7383530347,"step":17500,"loss":0.0513,"grad_norm":0.1178871915,"learning_rate":0.0000297603,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.7631866494,"step":17750,"loss":0.0471,"grad_norm":0.1890922785,"learning_rate":0.0000294335,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.7880202642,"step":18000,"loss":0.0399,"grad_norm":0.0514776036,"learning_rate":0.0000291068,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.812853879,"step":18250,"loss":0.0384,"grad_norm":0.095758006,"learning_rate":0.00002878,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.8376874938,"step":18500,"loss":0.0419,"grad_norm":0.6582738757,"learning_rate":0.0000284532,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.8625211086,"step":18750,"loss":0.0435,"grad_norm":2.2903850079,"learning_rate":0.0000281265,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.8873547234,"step":19000,"loss":0.0514,"grad_norm":0.3981194496,"learning_rate":0.0000277997,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.9121883381,"step":19250,"loss":0.0395,"grad_norm":0.2885676026,"learning_rate":0.0000274729,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.9370219529,"step":19500,"loss":0.0389,"grad_norm":0.3023632169,"learning_rate":0.0000271462,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.9618555677,"step":19750,"loss":0.0465,"grad_norm":0.1197957397,"learning_rate":0.0000268194,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":1.9866891825,"step":20000,"loss":0.0513,"grad_norm":4.8108739853,"learning_rate":0.0000264927,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":0.0497446135,"eval_rouge":0.9826921656,"eval_tool_call_equivalence":0.8275862069,"eval_binary_tool_call":0.8189655172,"eval_staged_tool_call":0.8512931034,"eval_runtime":9.0385,"eval_samples_per_second":12.834,"eval_steps_per_second":12.834,"epoch":2.0,"step":20134,"loss":null,"grad_norm":null,"learning_rate":null,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.0115227973,"step":20250,"loss":0.0433,"grad_norm":0.2571648359,"learning_rate":0.0000261659,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.036356412,"step":20500,"loss":0.0319,"grad_norm":0.0797785819,"learning_rate":0.0000258391,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.0611900268,"step":20750,"loss":0.0423,"grad_norm":0.6390244961,"learning_rate":0.0000255124,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.0860236416,"step":21000,"loss":0.0383,"grad_norm":0.0651589334,"learning_rate":0.0000251856,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.1108572564,"step":21250,"loss":0.033,"grad_norm":0.0487190336,"learning_rate":0.0000248588,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.1356908712,"step":21500,"loss":0.0404,"grad_norm":0.1252134293,"learning_rate":0.0000245321,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.1605244859,"step":21750,"loss":0.0337,"grad_norm":0.0602798983,"learning_rate":0.0000242053,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.1853581007,"step":22000,"loss":0.0449,"grad_norm":4.4454398155,"learning_rate":0.0000238785,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.2101917155,"step":22250,"loss":0.0324,"grad_norm":0.0417073779,"learning_rate":0.0000235518,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.2350253303,"step":22500,"loss":0.0401,"grad_norm":0.0848601311,"learning_rate":0.000023225,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.2598589451,"step":22750,"loss":0.0455,"grad_norm":0.046788875,"learning_rate":0.0000228983,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.2846925598,"step":23000,"loss":0.0377,"grad_norm":0.0342435278,"learning_rate":0.0000225715,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.3095261746,"step":23250,"loss":0.0404,"grad_norm":0.0831611156,"learning_rate":0.0000222447,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.3343597894,"step":23500,"loss":0.0373,"grad_norm":0.0233554021,"learning_rate":0.000021918,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.3591934042,"step":23750,"loss":0.0427,"grad_norm":0.3366115689,"learning_rate":0.0000215912,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.384027019,"step":24000,"loss":0.0365,"grad_norm":0.053785488,"learning_rate":0.0000212644,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.4088606338,"step":24250,"loss":0.0434,"grad_norm":1.818696022,"learning_rate":0.0000209377,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.4336942485,"step":24500,"loss":0.034,"grad_norm":0.0581700951,"learning_rate":0.0000206109,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.4585278633,"step":24750,"loss":0.0391,"grad_norm":0.0731598139,"learning_rate":0.0000202842,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.4833614781,"step":25000,"loss":0.0434,"grad_norm":0.0540302061,"learning_rate":0.0000199574,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.5081950929,"step":25250,"loss":0.0412,"grad_norm":0.0796190947,"learning_rate":0.0000196306,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.5330287077,"step":25500,"loss":0.0375,"grad_norm":0.5343271494,"learning_rate":0.0000193039,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.5578623224,"step":25750,"loss":0.0438,"grad_norm":0.5644518137,"learning_rate":0.0000189771,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.5826959372,"step":26000,"loss":0.0421,"grad_norm":0.0622491576,"learning_rate":0.0000186503,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.607529552,"step":26250,"loss":0.0307,"grad_norm":0.0878384858,"learning_rate":0.0000183236,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.6323631668,"step":26500,"loss":0.0432,"grad_norm":0.0275695529,"learning_rate":0.0000179968,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.6571967816,"step":26750,"loss":0.0373,"grad_norm":0.0562305078,"learning_rate":0.00001767,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.6820303963,"step":27000,"loss":0.0415,"grad_norm":0.2438167781,"learning_rate":0.0000173433,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.7068640111,"step":27250,"loss":0.0334,"grad_norm":0.0625845939,"learning_rate":0.0000170165,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.7316976259,"step":27500,"loss":0.0363,"grad_norm":0.4112043977,"learning_rate":0.0000166898,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.7565312407,"step":27750,"loss":0.0462,"grad_norm":0.3606038988,"learning_rate":0.000016363,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.7813648555,"step":28000,"loss":0.0375,"grad_norm":0.077768065,"learning_rate":0.0000160362,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.8061984702,"step":28250,"loss":0.0372,"grad_norm":0.4190590382,"learning_rate":0.0000157095,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.831032085,"step":28500,"loss":0.0422,"grad_norm":0.0445631221,"learning_rate":0.0000153827,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.8558656998,"step":28750,"loss":0.0384,"grad_norm":0.0306271184,"learning_rate":0.0000150559,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.8806993146,"step":29000,"loss":0.0453,"grad_norm":0.0460517853,"learning_rate":0.0000147292,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.9055329294,"step":29250,"loss":0.0391,"grad_norm":0.0651085824,"learning_rate":0.0000144024,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.9303665442,"step":29500,"loss":0.0415,"grad_norm":0.1139728725,"learning_rate":0.0000140757,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.9552001589,"step":29750,"loss":0.0432,"grad_norm":0.0603395328,"learning_rate":0.0000137489,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":2.9800337737,"step":30000,"loss":0.0322,"grad_norm":0.126148507,"learning_rate":0.0000134221,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":0.0569855124,"eval_rouge":0.9837365953,"eval_tool_call_equivalence":0.8448275862,"eval_binary_tool_call":0.8362068966,"eval_staged_tool_call":0.8685344828,"eval_runtime":8.8728,"eval_samples_per_second":13.074,"eval_steps_per_second":13.074,"epoch":3.0,"step":30201,"loss":null,"grad_norm":null,"learning_rate":null,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.0048673885,"step":30250,"loss":0.0384,"grad_norm":0.0759669393,"learning_rate":0.0000130954,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.0297010033,"step":30500,"loss":0.0335,"grad_norm":0.0581116788,"learning_rate":0.0000127686,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.0545346181,"step":30750,"loss":0.0376,"grad_norm":0.2857528627,"learning_rate":0.0000124418,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.0793682328,"step":31000,"loss":0.0425,"grad_norm":0.2913094759,"learning_rate":0.0000121151,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.1042018476,"step":31250,"loss":0.0345,"grad_norm":0.057530582,"learning_rate":0.0000117883,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.1290354624,"step":31500,"loss":0.0363,"grad_norm":0.5920750499,"learning_rate":0.0000114615,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.1538690772,"step":31750,"loss":0.0354,"grad_norm":0.0892687961,"learning_rate":0.0000111348,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.178702692,"step":32000,"loss":0.0271,"grad_norm":0.1276922226,"learning_rate":0.000010808,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.2035363067,"step":32250,"loss":0.0408,"grad_norm":0.1062248275,"learning_rate":0.0000104813,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.2283699215,"step":32500,"loss":0.0365,"grad_norm":0.0449275486,"learning_rate":0.0000101545,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.2532035363,"step":32750,"loss":0.0357,"grad_norm":0.0906295925,"learning_rate":0.0000098277,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.2780371511,"step":33000,"loss":0.037,"grad_norm":0.1071613058,"learning_rate":0.000009501,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.3028707659,"step":33250,"loss":0.0305,"grad_norm":0.0650367439,"learning_rate":0.0000091742,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.3277043806,"step":33500,"loss":0.032,"grad_norm":0.2549956441,"learning_rate":0.0000088474,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.3525379954,"step":33750,"loss":0.0336,"grad_norm":0.0445257016,"learning_rate":0.0000085207,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.3773716102,"step":34000,"loss":0.0367,"grad_norm":0.2905561328,"learning_rate":0.0000081939,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.402205225,"step":34250,"loss":0.0341,"grad_norm":0.067139335,"learning_rate":0.0000078672,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.4270388398,"step":34500,"loss":0.0357,"grad_norm":0.8738816977,"learning_rate":0.0000075404,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.4518724546,"step":34750,"loss":0.0445,"grad_norm":2.5799980164,"learning_rate":0.0000072136,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.4767060693,"step":35000,"loss":0.0338,"grad_norm":0.2384272069,"learning_rate":0.0000068869,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.5015396841,"step":35250,"loss":0.0315,"grad_norm":0.0434488617,"learning_rate":0.0000065601,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.5263732989,"step":35500,"loss":0.0304,"grad_norm":0.6418414712,"learning_rate":0.0000062333,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.5512069137,"step":35750,"loss":0.0323,"grad_norm":0.0552973971,"learning_rate":0.0000059066,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.5760405285,"step":36000,"loss":0.027,"grad_norm":0.0832837448,"learning_rate":0.0000055798,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.6008741432,"step":36250,"loss":0.0309,"grad_norm":0.108182773,"learning_rate":0.000005253,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.625707758,"step":36500,"loss":0.025,"grad_norm":0.1131080538,"learning_rate":0.0000049263,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.6505413728,"step":36750,"loss":0.0401,"grad_norm":0.1196356937,"learning_rate":0.0000045995,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.6753749876,"step":37000,"loss":0.0368,"grad_norm":0.0324246734,"learning_rate":0.0000042728,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.7002086024,"step":37250,"loss":0.0347,"grad_norm":0.7848063707,"learning_rate":0.000003946,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.7250422171,"step":37500,"loss":0.0335,"grad_norm":0.1033596024,"learning_rate":0.0000036192,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.7498758319,"step":37750,"loss":0.0381,"grad_norm":0.440266788,"learning_rate":0.0000032925,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.7747094467,"step":38000,"loss":0.0308,"grad_norm":0.0929857716,"learning_rate":0.0000029657,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.7995430615,"step":38250,"loss":0.029,"grad_norm":0.0891520604,"learning_rate":0.0000026389,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.8243766763,"step":38500,"loss":0.0369,"grad_norm":0.0414980985,"learning_rate":0.0000023122,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.849210291,"step":38750,"loss":0.0329,"grad_norm":0.0405808389,"learning_rate":0.0000019854,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.8740439058,"step":39000,"loss":0.029,"grad_norm":0.2531946599,"learning_rate":0.0000016587,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.8988775206,"step":39250,"loss":0.0336,"grad_norm":0.0816422775,"learning_rate":0.0000013319,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.9237111354,"step":39500,"loss":0.0356,"grad_norm":0.0616473481,"learning_rate":0.0000010051,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.9485447502,"step":39750,"loss":0.0293,"grad_norm":0.0898075104,"learning_rate":0.0000006784,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.973378365,"step":40000,"loss":0.032,"grad_norm":0.1297069192,"learning_rate":0.0000003516,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":3.9982119797,"step":40250,"loss":0.0314,"grad_norm":0.0346293487,"learning_rate":0.0000000248,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":0.0620321706,"eval_rouge":0.9852065334,"eval_tool_call_equivalence":0.8362068966,"eval_binary_tool_call":0.8275862069,"eval_staged_tool_call":0.8556034483,"eval_runtime":9.2427,"eval_samples_per_second":12.55,"eval_steps_per_second":12.55,"epoch":4.0,"step":40268,"loss":null,"grad_norm":null,"learning_rate":null,"train_runtime":null,"train_samples_per_second":null,"train_steps_per_second":null,"total_flos":null,"train_loss":null} {"eval_loss":null,"eval_rouge":null,"eval_tool_call_equivalence":null,"eval_binary_tool_call":null,"eval_staged_tool_call":null,"eval_runtime":null,"eval_samples_per_second":null,"eval_steps_per_second":null,"epoch":4.0,"step":40268,"loss":null,"grad_norm":null,"learning_rate":null,"train_runtime":7224.9579,"train_samples_per_second":5.573,"train_steps_per_second":5.573,"total_flos":6.154596108e+17,"train_loss":0.0515053023}