diff --git "a/train.log" "b/train.log" new file mode 100644--- /dev/null +++ "b/train.log" @@ -0,0 +1,2976 @@ +INFO __main__ Tue, 26 Mar 2024 18:04:12 Writing config to /var/home/nhamad/SharedTask2024/nested-final2/output-nested/args.json +INFO arabiner.utils.data Tue, 26 Mar 2024 18:04:12 2891 batches found +INFO arabiner.utils.data Tue, 26 Mar 2024 18:04:12 413 batches found +INFO arabiner.utils.data Tue, 26 Mar 2024 18:04:12 826 batches found +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:04:19 Epoch 0 | Batch 10/2891 | Timestep 10 | LR 0.0001000000 | Loss 38.036158 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:04:21 Epoch 0 | Batch 20/2891 | Timestep 20 | LR 0.0001000000 | Loss 25.645523 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:04:23 Epoch 0 | Batch 30/2891 | Timestep 30 | LR 0.0001000000 | Loss 17.971964 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:04:25 Epoch 0 | Batch 40/2891 | Timestep 40 | LR 0.0001000000 | Loss 11.638056 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:04:27 Epoch 0 | Batch 50/2891 | Timestep 50 | LR 0.0001000000 | Loss 8.120996 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:04:29 Epoch 0 | Batch 60/2891 | Timestep 60 | LR 0.0001000000 | Loss 5.419473 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:04:31 Epoch 0 | Batch 70/2891 | Timestep 70 | LR 0.0001000000 | Loss 3.742189 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:04:34 Epoch 0 | Batch 80/2891 | Timestep 80 | LR 0.0001000000 | Loss 3.385757 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:04:36 Epoch 0 | Batch 90/2891 | Timestep 90 | LR 0.0001000000 | Loss 2.351185 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:04:38 Epoch 0 | Batch 100/2891 | Timestep 100 | LR 0.0001000000 | Loss 1.491716 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:04:40 Epoch 0 | Batch 110/2891 | Timestep 110 | LR 0.0001000000 | Loss 1.466668 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:04:42 Epoch 0 | Batch 120/2891 | Timestep 120 | LR 0.0001000000 | Loss 1.099143 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:04:44 Epoch 0 | Batch 130/2891 | Timestep 130 | LR 0.0001000000 | Loss 1.170963 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:04:46 Epoch 0 | Batch 140/2891 | Timestep 140 | LR 0.0001000000 | Loss 0.955306 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:04:48 Epoch 0 | Batch 150/2891 | Timestep 150 | LR 0.0001000000 | Loss 1.312362 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:04:51 Epoch 0 | Batch 160/2891 | Timestep 160 | LR 0.0001000000 | Loss 1.095882 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:04:53 Epoch 0 | Batch 170/2891 | Timestep 170 | LR 0.0001000000 | Loss 1.067245 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:04:55 Epoch 0 | Batch 180/2891 | Timestep 180 | LR 0.0001000000 | Loss 0.837340 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:04:57 Epoch 0 | Batch 190/2891 | Timestep 190 | LR 0.0001000000 | Loss 0.829486 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:04:59 Epoch 0 | Batch 200/2891 | Timestep 200 | LR 0.0001000000 | Loss 1.277778 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:05:01 Epoch 0 | Batch 210/2891 | Timestep 210 | LR 0.0001000000 | Loss 0.829878 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:05:03 Epoch 0 | Batch 220/2891 | Timestep 220 | LR 0.0001000000 | Loss 0.686360 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:05:05 Epoch 0 | Batch 230/2891 | Timestep 230 | LR 0.0001000000 | Loss 0.757668 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:05:08 Epoch 0 | Batch 240/2891 | Timestep 240 | LR 0.0001000000 | Loss 0.658734 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:05:10 Epoch 0 | Batch 250/2891 | Timestep 250 | LR 0.0001000000 | Loss 0.926205 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:05:12 Epoch 0 | Batch 260/2891 | Timestep 260 | LR 0.0001000000 | Loss 0.727311 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:05:14 Epoch 0 | Batch 270/2891 | Timestep 270 | LR 0.0001000000 | Loss 0.545389 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:05:16 Epoch 0 | Batch 280/2891 | Timestep 280 | LR 0.0001000000 | Loss 0.539329 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:05:18 Epoch 0 | Batch 290/2891 | Timestep 290 | LR 0.0001000000 | Loss 0.448666 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:05:20 Epoch 0 | Batch 300/2891 | Timestep 300 | LR 0.0001000000 | Loss 0.289943 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:05:22 Epoch 0 | Batch 310/2891 | Timestep 310 | LR 0.0001000000 | Loss 0.338512 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:05:25 Epoch 0 | Batch 320/2891 | Timestep 320 | LR 0.0001000000 | Loss 0.242458 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:05:27 Epoch 0 | Batch 330/2891 | Timestep 330 | LR 0.0001000000 | Loss 0.642745 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:05:29 Epoch 0 | Batch 340/2891 | Timestep 340 | LR 0.0001000000 | Loss 0.327995 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:05:31 Epoch 0 | Batch 350/2891 | Timestep 350 | LR 0.0001000000 | Loss 0.478046 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:05:34 Epoch 0 | Batch 360/2891 | Timestep 360 | LR 0.0001000000 | Loss 0.546312 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:05:36 Epoch 0 | Batch 370/2891 | Timestep 370 | LR 0.0001000000 | Loss 0.518137 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:05:38 Epoch 0 | Batch 380/2891 | Timestep 380 | LR 0.0001000000 | Loss 0.273544 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:05:40 Epoch 0 | Batch 390/2891 | Timestep 390 | LR 0.0001000000 | Loss 0.354831 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:05:42 Epoch 0 | Batch 400/2891 | Timestep 400 | LR 0.0001000000 | Loss 0.336362 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:05:44 Epoch 0 | Batch 410/2891 | Timestep 410 | LR 0.0001000000 | Loss 0.329513 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:05:46 Epoch 0 | Batch 420/2891 | Timestep 420 | LR 0.0001000000 | Loss 0.489221 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:05:48 Epoch 0 | Batch 430/2891 | Timestep 430 | LR 0.0001000000 | Loss 0.223694 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:05:50 Epoch 0 | Batch 440/2891 | Timestep 440 | LR 0.0001000000 | Loss 0.351715 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:05:52 Epoch 0 | Batch 450/2891 | Timestep 450 | LR 0.0001000000 | Loss 0.422495 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:05:54 Epoch 0 | Batch 460/2891 | Timestep 460 | LR 0.0001000000 | Loss 0.374875 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:05:56 Epoch 0 | Batch 470/2891 | Timestep 470 | LR 0.0001000000 | Loss 0.339501 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:05:59 Epoch 0 | Batch 480/2891 | Timestep 480 | LR 0.0001000000 | Loss 0.205166 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:06:01 Epoch 0 | Batch 490/2891 | Timestep 490 | LR 0.0001000000 | Loss 0.528296 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:06:03 Epoch 0 | Batch 500/2891 | Timestep 500 | LR 0.0001000000 | Loss 0.228997 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:06:05 Epoch 0 | Batch 510/2891 | Timestep 510 | LR 0.0001000000 | Loss 0.223643 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:06:07 Epoch 0 | Batch 520/2891 | Timestep 520 | LR 0.0001000000 | Loss 0.367366 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:06:09 Epoch 0 | Batch 530/2891 | Timestep 530 | LR 0.0001000000 | Loss 0.200154 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:06:11 Epoch 0 | Batch 540/2891 | Timestep 540 | LR 0.0001000000 | Loss 0.151578 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:06:13 Epoch 0 | Batch 550/2891 | Timestep 550 | LR 0.0001000000 | Loss 0.186664 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:06:15 Epoch 0 | Batch 560/2891 | Timestep 560 | LR 0.0001000000 | Loss 0.439005 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:06:17 Epoch 0 | Batch 570/2891 | Timestep 570 | LR 0.0001000000 | Loss 0.198570 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:06:20 Epoch 0 | Batch 580/2891 | Timestep 580 | LR 0.0001000000 | Loss 0.728534 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:06:22 Epoch 0 | Batch 590/2891 | Timestep 590 | LR 0.0001000000 | Loss 0.209982 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:06:24 Epoch 0 | Batch 600/2891 | Timestep 600 | LR 0.0001000000 | Loss 0.368997 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:06:27 Epoch 0 | Batch 610/2891 | Timestep 610 | LR 0.0001000000 | Loss 0.206432 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:06:29 Epoch 0 | Batch 620/2891 | Timestep 620 | LR 0.0001000000 | Loss 0.213927 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:06:31 Epoch 0 | Batch 630/2891 | Timestep 630 | LR 0.0001000000 | Loss 0.403147 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:06:33 Epoch 0 | Batch 640/2891 | Timestep 640 | LR 0.0001000000 | Loss 0.387315 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:06:35 Epoch 0 | Batch 650/2891 | Timestep 650 | LR 0.0001000000 | Loss 0.152567 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:06:37 Epoch 0 | Batch 660/2891 | Timestep 660 | LR 0.0001000000 | Loss 0.206928 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:06:40 Epoch 0 | Batch 670/2891 | Timestep 670 | LR 0.0001000000 | Loss 0.218676 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:06:42 Epoch 0 | Batch 680/2891 | Timestep 680 | LR 0.0001000000 | Loss 0.274431 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:06:44 Epoch 0 | Batch 690/2891 | Timestep 690 | LR 0.0001000000 | Loss 0.229575 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:06:46 Epoch 0 | Batch 700/2891 | Timestep 700 | LR 0.0001000000 | Loss 0.312834 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:06:48 Epoch 0 | Batch 710/2891 | Timestep 710 | LR 0.0001000000 | Loss 0.101815 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:06:50 Epoch 0 | Batch 720/2891 | Timestep 720 | LR 0.0001000000 | Loss 0.155199 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:06:52 Epoch 0 | Batch 730/2891 | Timestep 730 | LR 0.0001000000 | Loss 0.321433 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:06:54 Epoch 0 | Batch 740/2891 | Timestep 740 | LR 0.0001000000 | Loss 0.069513 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:06:56 Epoch 0 | Batch 750/2891 | Timestep 750 | LR 0.0001000000 | Loss 0.210138 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:06:59 Epoch 0 | Batch 760/2891 | Timestep 760 | LR 0.0001000000 | Loss 0.214633 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:07:01 Epoch 0 | Batch 770/2891 | Timestep 770 | LR 0.0001000000 | Loss 0.404146 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:07:03 Epoch 0 | Batch 780/2891 | Timestep 780 | LR 0.0001000000 | Loss 0.360442 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:07:05 Epoch 0 | Batch 790/2891 | Timestep 790 | LR 0.0001000000 | Loss 0.171559 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:07:07 Epoch 0 | Batch 800/2891 | Timestep 800 | LR 0.0001000000 | Loss 0.125143 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:07:10 Epoch 0 | Batch 810/2891 | Timestep 810 | LR 0.0001000000 | Loss 0.285947 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:07:12 Epoch 0 | Batch 820/2891 | Timestep 820 | LR 0.0001000000 | Loss 0.168330 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:07:14 Epoch 0 | Batch 830/2891 | Timestep 830 | LR 0.0001000000 | Loss 0.258455 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:07:16 Epoch 0 | Batch 840/2891 | Timestep 840 | LR 0.0001000000 | Loss 0.163380 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:07:18 Epoch 0 | Batch 850/2891 | Timestep 850 | LR 0.0001000000 | Loss 0.219119 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:07:20 Epoch 0 | Batch 860/2891 | Timestep 860 | LR 0.0001000000 | Loss 0.097164 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:07:23 Epoch 0 | Batch 870/2891 | Timestep 870 | LR 0.0001000000 | Loss 0.084793 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:07:25 Epoch 0 | Batch 880/2891 | Timestep 880 | LR 0.0001000000 | Loss 0.041310 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:07:27 Epoch 0 | Batch 890/2891 | Timestep 890 | LR 0.0001000000 | Loss 0.064988 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:07:29 Epoch 0 | Batch 900/2891 | Timestep 900 | LR 0.0001000000 | Loss 0.142357 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:07:32 Epoch 0 | Batch 910/2891 | Timestep 910 | LR 0.0001000000 | Loss 0.148303 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:07:34 Epoch 0 | Batch 920/2891 | Timestep 920 | LR 0.0001000000 | Loss 0.250433 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:07:36 Epoch 0 | Batch 930/2891 | Timestep 930 | LR 0.0001000000 | Loss 0.080530 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:07:38 Epoch 0 | Batch 940/2891 | Timestep 940 | LR 0.0001000000 | Loss 0.150245 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:07:41 Epoch 0 | Batch 950/2891 | Timestep 950 | LR 0.0001000000 | Loss 0.089438 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:07:43 Epoch 0 | Batch 960/2891 | Timestep 960 | LR 0.0001000000 | Loss 0.152052 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:07:45 Epoch 0 | Batch 970/2891 | Timestep 970 | LR 0.0001000000 | Loss 0.213498 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:07:47 Epoch 0 | Batch 980/2891 | Timestep 980 | LR 0.0001000000 | Loss 0.280220 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:07:49 Epoch 0 | Batch 990/2891 | Timestep 990 | LR 0.0001000000 | Loss 0.142902 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:07:51 Epoch 0 | Batch 1000/2891 | Timestep 1000 | LR 0.0001000000 | Loss 0.231281 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:07:53 Epoch 0 | Batch 1010/2891 | Timestep 1010 | LR 0.0001000000 | Loss 0.078217 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:07:56 Epoch 0 | Batch 1020/2891 | Timestep 1020 | LR 0.0001000000 | Loss 0.338229 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:07:58 Epoch 0 | Batch 1030/2891 | Timestep 1030 | LR 0.0001000000 | Loss 0.139895 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:08:00 Epoch 0 | Batch 1040/2891 | Timestep 1040 | LR 0.0001000000 | Loss 0.234752 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:08:03 Epoch 0 | Batch 1050/2891 | Timestep 1050 | LR 0.0001000000 | Loss 0.218742 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:08:05 Epoch 0 | Batch 1060/2891 | Timestep 1060 | LR 0.0001000000 | Loss 0.242511 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:08:07 Epoch 0 | Batch 1070/2891 | Timestep 1070 | LR 0.0001000000 | Loss 0.170266 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:08:09 Epoch 0 | Batch 1080/2891 | Timestep 1080 | LR 0.0001000000 | Loss 0.085050 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:08:12 Epoch 0 | Batch 1090/2891 | Timestep 1090 | LR 0.0001000000 | Loss 0.217037 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:08:14 Epoch 0 | Batch 1100/2891 | Timestep 1100 | LR 0.0001000000 | Loss 0.145804 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:08:16 Epoch 0 | Batch 1110/2891 | Timestep 1110 | LR 0.0001000000 | Loss 0.169740 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:08:18 Epoch 0 | Batch 1120/2891 | Timestep 1120 | LR 0.0001000000 | Loss 0.189899 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:08:21 Epoch 0 | Batch 1130/2891 | Timestep 1130 | LR 0.0001000000 | Loss 0.071118 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:08:23 Epoch 0 | Batch 1140/2891 | Timestep 1140 | LR 0.0001000000 | Loss 0.270059 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:08:25 Epoch 0 | Batch 1150/2891 | Timestep 1150 | LR 0.0001000000 | Loss 0.140489 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:08:27 Epoch 0 | Batch 1160/2891 | Timestep 1160 | LR 0.0001000000 | Loss 0.051336 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:08:29 Epoch 0 | Batch 1170/2891 | Timestep 1170 | LR 0.0001000000 | Loss 0.209964 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:08:31 Epoch 0 | Batch 1180/2891 | Timestep 1180 | LR 0.0001000000 | Loss 0.048169 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:08:33 Epoch 0 | Batch 1190/2891 | Timestep 1190 | LR 0.0001000000 | Loss 0.205923 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:08:36 Epoch 0 | Batch 1200/2891 | Timestep 1200 | LR 0.0001000000 | Loss 0.136726 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:08:38 Epoch 0 | Batch 1210/2891 | Timestep 1210 | LR 0.0001000000 | Loss 0.388298 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:08:40 Epoch 0 | Batch 1220/2891 | Timestep 1220 | LR 0.0001000000 | Loss 0.114231 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:08:42 Epoch 0 | Batch 1230/2891 | Timestep 1230 | LR 0.0001000000 | Loss 0.080937 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:08:44 Epoch 0 | Batch 1240/2891 | Timestep 1240 | LR 0.0001000000 | Loss 0.091161 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:08:46 Epoch 0 | Batch 1250/2891 | Timestep 1250 | LR 0.0001000000 | Loss 0.068882 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:08:48 Epoch 0 | Batch 1260/2891 | Timestep 1260 | LR 0.0001000000 | Loss 0.123062 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:08:51 Epoch 0 | Batch 1270/2891 | Timestep 1270 | LR 0.0001000000 | Loss 0.062683 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:08:54 Epoch 0 | Batch 1280/2891 | Timestep 1280 | LR 0.0001000000 | Loss 0.124934 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:08:56 Epoch 0 | Batch 1290/2891 | Timestep 1290 | LR 0.0001000000 | Loss 0.182164 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:08:58 Epoch 0 | Batch 1300/2891 | Timestep 1300 | LR 0.0001000000 | Loss 0.190824 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:09:00 Epoch 0 | Batch 1310/2891 | Timestep 1310 | LR 0.0001000000 | Loss 0.240509 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:09:02 Epoch 0 | Batch 1320/2891 | Timestep 1320 | LR 0.0001000000 | Loss 0.108103 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:09:04 Epoch 0 | Batch 1330/2891 | Timestep 1330 | LR 0.0001000000 | Loss 0.097160 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:09:07 Epoch 0 | Batch 1340/2891 | Timestep 1340 | LR 0.0001000000 | Loss 0.070232 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:09:09 Epoch 0 | Batch 1350/2891 | Timestep 1350 | LR 0.0001000000 | Loss 0.097085 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:09:11 Epoch 0 | Batch 1360/2891 | Timestep 1360 | LR 0.0001000000 | Loss 0.143309 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:09:13 Epoch 0 | Batch 1370/2891 | Timestep 1370 | LR 0.0001000000 | Loss 0.161536 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:09:15 Epoch 0 | Batch 1380/2891 | Timestep 1380 | LR 0.0001000000 | Loss 2.402255 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:09:17 Epoch 0 | Batch 1390/2891 | Timestep 1390 | LR 0.0001000000 | Loss 0.018577 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:09:19 Epoch 0 | Batch 1400/2891 | Timestep 1400 | LR 0.0001000000 | Loss 0.405250 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:09:21 Epoch 0 | Batch 1410/2891 | Timestep 1410 | LR 0.0001000000 | Loss 0.075027 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:09:23 Epoch 0 | Batch 1420/2891 | Timestep 1420 | LR 0.0001000000 | Loss 0.074512 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:09:26 Epoch 0 | Batch 1430/2891 | Timestep 1430 | LR 0.0001000000 | Loss 0.281151 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:09:28 Epoch 0 | Batch 1440/2891 | Timestep 1440 | LR 0.0001000000 | Loss 0.145040 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:09:30 Epoch 0 | Batch 1450/2891 | Timestep 1450 | LR 0.0001000000 | Loss 0.061768 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:09:32 Epoch 0 | Batch 1460/2891 | Timestep 1460 | LR 0.0001000000 | Loss 0.139366 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:09:34 Epoch 0 | Batch 1470/2891 | Timestep 1470 | LR 0.0001000000 | Loss 0.201618 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:09:36 Epoch 0 | Batch 1480/2891 | Timestep 1480 | LR 0.0001000000 | Loss 0.160580 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:09:39 Epoch 0 | Batch 1490/2891 | Timestep 1490 | LR 0.0001000000 | Loss 0.214628 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:09:41 Epoch 0 | Batch 1500/2891 | Timestep 1500 | LR 0.0001000000 | Loss 0.036200 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:09:43 Epoch 0 | Batch 1510/2891 | Timestep 1510 | LR 0.0001000000 | Loss 0.107052 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:09:45 Epoch 0 | Batch 1520/2891 | Timestep 1520 | LR 0.0001000000 | Loss 0.235792 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:09:47 Epoch 0 | Batch 1530/2891 | Timestep 1530 | LR 0.0001000000 | Loss 0.098257 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:09:50 Epoch 0 | Batch 1540/2891 | Timestep 1540 | LR 0.0001000000 | Loss 0.067000 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:09:52 Epoch 0 | Batch 1550/2891 | Timestep 1550 | LR 0.0001000000 | Loss 0.075793 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:09:54 Epoch 0 | Batch 1560/2891 | Timestep 1560 | LR 0.0001000000 | Loss 0.222283 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:09:56 Epoch 0 | Batch 1570/2891 | Timestep 1570 | LR 0.0001000000 | Loss 0.108725 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:09:58 Epoch 0 | Batch 1580/2891 | Timestep 1580 | LR 0.0001000000 | Loss 2.400777 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:10:00 Epoch 0 | Batch 1590/2891 | Timestep 1590 | LR 0.0001000000 | Loss 0.392568 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:10:03 Epoch 0 | Batch 1600/2891 | Timestep 1600 | LR 0.0001000000 | Loss 0.066770 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:10:05 Epoch 0 | Batch 1610/2891 | Timestep 1610 | LR 0.0001000000 | Loss 0.116131 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:10:07 Epoch 0 | Batch 1620/2891 | Timestep 1620 | LR 0.0001000000 | Loss 0.089215 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:10:09 Epoch 0 | Batch 1630/2891 | Timestep 1630 | LR 0.0001000000 | Loss 0.071570 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:10:12 Epoch 0 | Batch 1640/2891 | Timestep 1640 | LR 0.0001000000 | Loss 0.188713 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:10:14 Epoch 0 | Batch 1650/2891 | Timestep 1650 | LR 0.0001000000 | Loss 0.174718 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:10:15 Epoch 0 | Batch 1660/2891 | Timestep 1660 | LR 0.0001000000 | Loss 0.199684 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:10:18 Epoch 0 | Batch 1670/2891 | Timestep 1670 | LR 0.0001000000 | Loss 0.131753 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:10:20 Epoch 0 | Batch 1680/2891 | Timestep 1680 | LR 0.0001000000 | Loss 0.319422 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:10:22 Epoch 0 | Batch 1690/2891 | Timestep 1690 | LR 0.0001000000 | Loss 0.130359 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:10:24 Epoch 0 | Batch 1700/2891 | Timestep 1700 | LR 0.0001000000 | Loss 0.126259 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:10:26 Epoch 0 | Batch 1710/2891 | Timestep 1710 | LR 0.0001000000 | Loss 0.118343 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:10:28 Epoch 0 | Batch 1720/2891 | Timestep 1720 | LR 0.0001000000 | Loss 0.113537 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:10:30 Epoch 0 | Batch 1730/2891 | Timestep 1730 | LR 0.0001000000 | Loss 0.346829 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:10:33 Epoch 0 | Batch 1740/2891 | Timestep 1740 | LR 0.0001000000 | Loss 0.108238 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:10:35 Epoch 0 | Batch 1750/2891 | Timestep 1750 | LR 0.0001000000 | Loss 0.229124 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:10:36 Epoch 0 | Batch 1760/2891 | Timestep 1760 | LR 0.0001000000 | Loss 0.045372 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:10:38 Epoch 0 | Batch 1770/2891 | Timestep 1770 | LR 0.0001000000 | Loss 0.087299 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:10:40 Epoch 0 | Batch 1780/2891 | Timestep 1780 | LR 0.0001000000 | Loss 0.242042 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:10:42 Epoch 0 | Batch 1790/2891 | Timestep 1790 | LR 0.0001000000 | Loss 0.054807 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:10:45 Epoch 0 | Batch 1800/2891 | Timestep 1800 | LR 0.0001000000 | Loss 0.082385 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:10:47 Epoch 0 | Batch 1810/2891 | Timestep 1810 | LR 0.0001000000 | Loss 0.089785 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:10:49 Epoch 0 | Batch 1820/2891 | Timestep 1820 | LR 0.0001000000 | Loss 0.055780 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:10:51 Epoch 0 | Batch 1830/2891 | Timestep 1830 | LR 0.0001000000 | Loss 0.125304 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:10:53 Epoch 0 | Batch 1840/2891 | Timestep 1840 | LR 0.0001000000 | Loss 0.131452 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:10:56 Epoch 0 | Batch 1850/2891 | Timestep 1850 | LR 0.0001000000 | Loss 1.413234 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:10:58 Epoch 0 | Batch 1860/2891 | Timestep 1860 | LR 0.0001000000 | Loss 0.071829 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:11:00 Epoch 0 | Batch 1870/2891 | Timestep 1870 | LR 0.0001000000 | Loss 0.092023 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:11:02 Epoch 0 | Batch 1880/2891 | Timestep 1880 | LR 0.0001000000 | Loss 0.143633 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:11:04 Epoch 0 | Batch 1890/2891 | Timestep 1890 | LR 0.0001000000 | Loss 0.078741 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:11:06 Epoch 0 | Batch 1900/2891 | Timestep 1900 | LR 0.0001000000 | Loss 0.045697 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:11:09 Epoch 0 | Batch 1910/2891 | Timestep 1910 | LR 0.0001000000 | Loss 0.151132 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:11:11 Epoch 0 | Batch 1920/2891 | Timestep 1920 | LR 0.0001000000 | Loss 0.340675 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:11:13 Epoch 0 | Batch 1930/2891 | Timestep 1930 | LR 0.0001000000 | Loss 0.141658 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:11:15 Epoch 0 | Batch 1940/2891 | Timestep 1940 | LR 0.0001000000 | Loss 0.070979 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:11:18 Epoch 0 | Batch 1950/2891 | Timestep 1950 | LR 0.0001000000 | Loss 0.038535 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:11:20 Epoch 0 | Batch 1960/2891 | Timestep 1960 | LR 0.0001000000 | Loss 0.221200 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:11:22 Epoch 0 | Batch 1970/2891 | Timestep 1970 | LR 0.0001000000 | Loss 0.539450 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:11:24 Epoch 0 | Batch 1980/2891 | Timestep 1980 | LR 0.0001000000 | Loss 0.129464 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:11:26 Epoch 0 | Batch 1990/2891 | Timestep 1990 | LR 0.0001000000 | Loss 0.076359 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:11:29 Epoch 0 | Batch 2000/2891 | Timestep 2000 | LR 0.0001000000 | Loss 0.062693 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:11:31 Epoch 0 | Batch 2010/2891 | Timestep 2010 | LR 0.0001000000 | Loss 0.248758 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:11:33 Epoch 0 | Batch 2020/2891 | Timestep 2020 | LR 0.0001000000 | Loss 0.063458 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:11:35 Epoch 0 | Batch 2030/2891 | Timestep 2030 | LR 0.0001000000 | Loss 0.090609 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:11:38 Epoch 0 | Batch 2040/2891 | Timestep 2040 | LR 0.0001000000 | Loss 0.102017 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:11:40 Epoch 0 | Batch 2050/2891 | Timestep 2050 | LR 0.0001000000 | Loss 0.115016 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:11:42 Epoch 0 | Batch 2060/2891 | Timestep 2060 | LR 0.0001000000 | Loss 0.134237 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:11:44 Epoch 0 | Batch 2070/2891 | Timestep 2070 | LR 0.0001000000 | Loss 0.075582 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:11:46 Epoch 0 | Batch 2080/2891 | Timestep 2080 | LR 0.0001000000 | Loss 0.392927 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:11:48 Epoch 0 | Batch 2090/2891 | Timestep 2090 | LR 0.0001000000 | Loss 0.121893 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:11:50 Epoch 0 | Batch 2100/2891 | Timestep 2100 | LR 0.0001000000 | Loss 0.045164 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:11:53 Epoch 0 | Batch 2110/2891 | Timestep 2110 | LR 0.0001000000 | Loss 0.131909 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:11:55 Epoch 0 | Batch 2120/2891 | Timestep 2120 | LR 0.0001000000 | Loss 0.094819 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:11:57 Epoch 0 | Batch 2130/2891 | Timestep 2130 | LR 0.0001000000 | Loss 0.065168 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:11:59 Epoch 0 | Batch 2140/2891 | Timestep 2140 | LR 0.0001000000 | Loss 0.094622 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:12:01 Epoch 0 | Batch 2150/2891 | Timestep 2150 | LR 0.0001000000 | Loss 0.150454 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:12:03 Epoch 0 | Batch 2160/2891 | Timestep 2160 | LR 0.0001000000 | Loss 0.068766 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:12:06 Epoch 0 | Batch 2170/2891 | Timestep 2170 | LR 0.0001000000 | Loss 0.119149 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:12:08 Epoch 0 | Batch 2180/2891 | Timestep 2180 | LR 0.0001000000 | Loss 0.172453 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:12:10 Epoch 0 | Batch 2190/2891 | Timestep 2190 | LR 0.0001000000 | Loss 0.242479 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:12:12 Epoch 0 | Batch 2200/2891 | Timestep 2200 | LR 0.0001000000 | Loss 0.045533 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:12:14 Epoch 0 | Batch 2210/2891 | Timestep 2210 | LR 0.0001000000 | Loss 0.053062 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:12:17 Epoch 0 | Batch 2220/2891 | Timestep 2220 | LR 0.0001000000 | Loss 0.081152 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:12:19 Epoch 0 | Batch 2230/2891 | Timestep 2230 | LR 0.0001000000 | Loss 0.062796 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:12:21 Epoch 0 | Batch 2240/2891 | Timestep 2240 | LR 0.0001000000 | Loss 0.068186 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:12:23 Epoch 0 | Batch 2250/2891 | Timestep 2250 | LR 0.0001000000 | Loss 0.051518 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:12:26 Epoch 0 | Batch 2260/2891 | Timestep 2260 | LR 0.0001000000 | Loss 0.051302 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:12:28 Epoch 0 | Batch 2270/2891 | Timestep 2270 | LR 0.0001000000 | Loss 0.019261 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:12:30 Epoch 0 | Batch 2280/2891 | Timestep 2280 | LR 0.0001000000 | Loss 0.119711 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:12:32 Epoch 0 | Batch 2290/2891 | Timestep 2290 | LR 0.0001000000 | Loss 0.032510 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:12:34 Epoch 0 | Batch 2300/2891 | Timestep 2300 | LR 0.0001000000 | Loss 0.096505 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:12:37 Epoch 0 | Batch 2310/2891 | Timestep 2310 | LR 0.0001000000 | Loss 0.160650 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:12:39 Epoch 0 | Batch 2320/2891 | Timestep 2320 | LR 0.0001000000 | Loss 0.091075 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:12:41 Epoch 0 | Batch 2330/2891 | Timestep 2330 | LR 0.0001000000 | Loss 0.051210 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:12:44 Epoch 0 | Batch 2340/2891 | Timestep 2340 | LR 0.0001000000 | Loss 0.024374 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:12:46 Epoch 0 | Batch 2350/2891 | Timestep 2350 | LR 0.0001000000 | Loss 0.038941 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:12:48 Epoch 0 | Batch 2360/2891 | Timestep 2360 | LR 0.0001000000 | Loss 0.123574 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:12:50 Epoch 0 | Batch 2370/2891 | Timestep 2370 | LR 0.0001000000 | Loss 0.081040 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:12:52 Epoch 0 | Batch 2380/2891 | Timestep 2380 | LR 0.0001000000 | Loss 0.316491 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:12:55 Epoch 0 | Batch 2390/2891 | Timestep 2390 | LR 0.0001000000 | Loss 0.058047 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:12:57 Epoch 0 | Batch 2400/2891 | Timestep 2400 | LR 0.0001000000 | Loss 0.142260 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:12:59 Epoch 0 | Batch 2410/2891 | Timestep 2410 | LR 0.0001000000 | Loss 0.130568 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:13:01 Epoch 0 | Batch 2420/2891 | Timestep 2420 | LR 0.0001000000 | Loss 0.082073 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:13:03 Epoch 0 | Batch 2430/2891 | Timestep 2430 | LR 0.0001000000 | Loss 0.281979 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:13:06 Epoch 0 | Batch 2440/2891 | Timestep 2440 | LR 0.0001000000 | Loss 0.049312 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:13:08 Epoch 0 | Batch 2450/2891 | Timestep 2450 | LR 0.0001000000 | Loss 0.069954 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:13:10 Epoch 0 | Batch 2460/2891 | Timestep 2460 | LR 0.0001000000 | Loss 0.019294 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:13:12 Epoch 0 | Batch 2470/2891 | Timestep 2470 | LR 0.0001000000 | Loss 0.092072 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:13:14 Epoch 0 | Batch 2480/2891 | Timestep 2480 | LR 0.0001000000 | Loss 0.063099 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:13:17 Epoch 0 | Batch 2490/2891 | Timestep 2490 | LR 0.0001000000 | Loss 0.124255 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:13:20 Epoch 0 | Batch 2500/2891 | Timestep 2500 | LR 0.0001000000 | Loss 0.122109 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:13:22 Epoch 0 | Batch 2510/2891 | Timestep 2510 | LR 0.0001000000 | Loss 0.052508 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:13:24 Epoch 0 | Batch 2520/2891 | Timestep 2520 | LR 0.0001000000 | Loss 0.300385 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:13:26 Epoch 0 | Batch 2530/2891 | Timestep 2530 | LR 0.0001000000 | Loss 0.161048 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:13:28 Epoch 0 | Batch 2540/2891 | Timestep 2540 | LR 0.0001000000 | Loss 0.053075 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:13:30 Epoch 0 | Batch 2550/2891 | Timestep 2550 | LR 0.0001000000 | Loss 0.048079 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:13:32 Epoch 0 | Batch 2560/2891 | Timestep 2560 | LR 0.0001000000 | Loss 0.237811 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:13:35 Epoch 0 | Batch 2570/2891 | Timestep 2570 | LR 0.0001000000 | Loss 0.034755 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:13:37 Epoch 0 | Batch 2580/2891 | Timestep 2580 | LR 0.0001000000 | Loss 0.127875 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:13:39 Epoch 0 | Batch 2590/2891 | Timestep 2590 | LR 0.0001000000 | Loss 0.088385 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:13:41 Epoch 0 | Batch 2600/2891 | Timestep 2600 | LR 0.0001000000 | Loss 0.155962 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:13:43 Epoch 0 | Batch 2610/2891 | Timestep 2610 | LR 0.0001000000 | Loss 0.285760 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:13:45 Epoch 0 | Batch 2620/2891 | Timestep 2620 | LR 0.0001000000 | Loss 0.028074 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:13:47 Epoch 0 | Batch 2630/2891 | Timestep 2630 | LR 0.0001000000 | Loss 0.166776 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:13:50 Epoch 0 | Batch 2640/2891 | Timestep 2640 | LR 0.0001000000 | Loss 0.151262 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:13:52 Epoch 0 | Batch 2650/2891 | Timestep 2650 | LR 0.0001000000 | Loss 0.318415 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:13:54 Epoch 0 | Batch 2660/2891 | Timestep 2660 | LR 0.0001000000 | Loss 0.066462 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:13:56 Epoch 0 | Batch 2670/2891 | Timestep 2670 | LR 0.0001000000 | Loss 0.124701 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:13:58 Epoch 0 | Batch 2680/2891 | Timestep 2680 | LR 0.0001000000 | Loss 0.222369 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:14:00 Epoch 0 | Batch 2690/2891 | Timestep 2690 | LR 0.0001000000 | Loss 0.144442 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:14:02 Epoch 0 | Batch 2700/2891 | Timestep 2700 | LR 0.0001000000 | Loss 0.133213 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:14:05 Epoch 0 | Batch 2710/2891 | Timestep 2710 | LR 0.0001000000 | Loss 0.147225 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:14:07 Epoch 0 | Batch 2720/2891 | Timestep 2720 | LR 0.0001000000 | Loss 0.094077 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:14:09 Epoch 0 | Batch 2730/2891 | Timestep 2730 | LR 0.0001000000 | Loss 0.172758 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:14:11 Epoch 0 | Batch 2740/2891 | Timestep 2740 | LR 0.0001000000 | Loss 0.108803 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:14:13 Epoch 0 | Batch 2750/2891 | Timestep 2750 | LR 0.0001000000 | Loss 0.133038 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:14:15 Epoch 0 | Batch 2760/2891 | Timestep 2760 | LR 0.0001000000 | Loss 0.088861 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:14:17 Epoch 0 | Batch 2770/2891 | Timestep 2770 | LR 0.0001000000 | Loss 0.163889 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:14:20 Epoch 0 | Batch 2780/2891 | Timestep 2780 | LR 0.0001000000 | Loss 0.127627 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:14:22 Epoch 0 | Batch 2790/2891 | Timestep 2790 | LR 0.0001000000 | Loss 0.048946 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:14:24 Epoch 0 | Batch 2800/2891 | Timestep 2800 | LR 0.0001000000 | Loss 0.082211 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:14:26 Epoch 0 | Batch 2810/2891 | Timestep 2810 | LR 0.0001000000 | Loss 0.043212 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:14:28 Epoch 0 | Batch 2820/2891 | Timestep 2820 | LR 0.0001000000 | Loss 0.149125 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:14:30 Epoch 0 | Batch 2830/2891 | Timestep 2830 | LR 0.0001000000 | Loss 0.150169 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:14:32 Epoch 0 | Batch 2840/2891 | Timestep 2840 | LR 0.0001000000 | Loss 0.097861 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:14:34 Epoch 0 | Batch 2850/2891 | Timestep 2850 | LR 0.0001000000 | Loss 0.116762 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:14:37 Epoch 0 | Batch 2860/2891 | Timestep 2860 | LR 0.0001000000 | Loss 0.078736 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:14:40 Epoch 0 | Batch 2870/2891 | Timestep 2870 | LR 0.0001000000 | Loss 0.037493 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:14:42 Epoch 0 | Batch 2880/2891 | Timestep 2880 | LR 0.0001000000 | Loss 0.081365 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:14:44 Epoch 0 | Batch 2890/2891 | Timestep 2890 | LR 0.0001000000 | Loss 0.086169 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:14:44 ** Evaluating on validation dataset ** +INFO root Tue, 26 Mar 2024 18:16:04 + precision recall f1-score support + + BOUNDARY 0.0000 0.0000 0.0000 4 + BUILDING-OR-GROUNDS 0.5214 0.7019 0.5984 104 + CAMP 0.8732 0.8732 0.8732 71 + CARDINAL 0.8288 0.5412 0.6548 170 + CLUSTER 0.3158 0.2308 0.2667 26 + COM 0.7059 0.6154 0.6575 39 + CONTINENT 1.0000 0.6087 0.7568 23 + COUNTRY 0.9561 0.9641 0.9600 835 + CURR 0.6667 0.6667 0.6667 24 + DATE 0.9215 0.9237 0.9226 1691 + EDU 0.8349 0.8349 0.8349 109 + ENT 0.0000 0.0000 0.0000 1 + EVENT 0.6513 0.5822 0.6148 292 + FAC 0.5130 0.7117 0.5962 111 + GOV 0.8367 0.8105 0.8234 860 + GPE 0.9571 0.9571 0.9571 2261 + GPE_ORG 0.8176 0.8323 0.8249 167 + LAND-REGION-NATURAL 0.0000 0.0000 0.0000 52 + LANGUAGE 1.0000 0.6250 0.7692 16 + LAW 0.5741 0.6596 0.6139 47 + LOC 0.5912 0.7402 0.6573 127 + MED 0.9610 0.9403 0.9505 419 + MONEY 0.6957 0.7273 0.7111 22 + NEIGHBORHOOD 0.0000 0.0000 0.0000 5 + NONGOV 0.8140 0.8581 0.8355 571 + NORP 0.6063 0.5590 0.5817 551 + OCC 0.7953 0.7739 0.7845 522 + ORDINAL 0.8712 0.9449 0.9065 544 + ORG 0.8900 0.8905 0.8903 1790 + ORG_FAC 0.0000 0.0000 0.0000 7 + PATH 0.0000 0.0000 0.0000 6 + PERCENT 0.0762 0.6667 0.1368 12 + PERS 0.9185 0.8630 0.8899 679 + PRODUCT 0.0000 0.0000 0.0000 8 + QUANTITY 0.0000 0.0000 0.0000 3 + REGION-GENERAL 0.9000 0.7297 0.8060 37 +REGION-INTERNATIONAL 0.0000 0.0000 0.0000 12 + REL 0.0000 0.0000 0.0000 10 + SCI 0.0000 0.0000 0.0000 13 + SPO 0.0000 0.0000 0.0000 2 + SPORT 0.0000 0.0000 0.0000 4 + STATE-OR-PROVINCE 0.8556 0.8603 0.8579 179 + SUBAREA-FACILITY 0.0000 0.0000 0.0000 16 + TIME 0.7419 0.6970 0.7188 33 + TOWN 0.9629 0.9392 0.9509 1217 + UNIT 0.0000 0.0000 0.0000 4 + WATER-BODY 0.4167 0.3571 0.3846 14 + WEBSITE 0.4348 0.5000 0.4651 80 + pad> 0.0000 0.0000 0.0000 0 + + micro avg 0.8615 0.8582 0.8599 13790 + macro avg 0.5001 0.4936 0.4881 13790 + weighted avg 0.8638 0.8582 0.8597 13790 + +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:16:46 Epoch 0 | Timestep 2891 | Train Loss 0.804567 | Val Loss 0.121967 | F1 0.859852 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:16:46 ** Validation improved, evaluating test data ** +INFO arabiner.data.transforms Tue, 26 Mar 2024 18:16:50 Truncating the sequence لكن صوت جوالي مزعج ما دفعني للنهوض وبعصبية وارتباك من هذا الاتصال وخصوصا أن الساعة الواحدة والنصف يعنى عز دين النوم فأمسكت الجوال وقمت بالضغط على زر الرد . فقلت الو مين معي فقال معك الرئيس فقلت رئيس مين بالضبط فقال جورج بوش رئيس الولايات المتحدة الأمريكية فقلت اهلا أهلا يا سيادة الرئيس , بس أنا على حد علمي انه الرئيس جورج بوش بتكلم اللغة الانجليزية فكيف أنت بتحكي عربي بوش انأ بتكلم اللغة العربية جيدا حتى أنى ممكن أحكى باللهجة الغزواية . فقلت عليك اه خير شو مالك متصل فيا وكيف عرفت رقمي بوش ما في شي قلت أسال كيف أهل غزة بجو الحصار أما كيف عرفت رقمك فقلت لمديرة مكتبي أعطيني اتصال مباشر مع اى شخص من غزة فقلت غزة ااه بدك تعرف أخبار غزة صامدين صامدين ومش راح نتخلى عن الثوابت الفلسطينية لو شو ما تعملوا بوش يعنى بدك تقنعني انه ما فى نتيجة من الحصار فقلت لا ما في نتيجة لأنه إحنا بنخاف على بعض وبنحب بعض حتى رغيف الخبز مرات بنتقاسموا بوش اه واضح حتى التعذيب بتتقاسموه بالضفة وغزة فقلت يا عمى هيك عارف كل شى , شو بدك من الأخر لأني بدى أنام بوش شو رأيك تحضر مؤتمر انابولس فقلت احضر شو , شمعنا أنا يعني بوش هيك اجت فى بالى الفكرة فقلت لا لا مش فاضى , ميش مستعد اضيع وقتي في شي عارف نهايته بوش طيب تابعنا على التلفزيون منه بتعرف شو صار قلت صدقني وقتي فل , بكون بقرا بكتاب الجنة لا تبعد كثيرا بوش غريبة أول إنسان عربي ادعوه على المؤتمر ويكون وقته مشغول قلت شكلوا الكل مضيوف بالبيت الأبيض بوش اه مليان مش عارف أتحرك براحتي مخنوق فقلت اذا انت مخنوق شو نقول احنا بوش عارف بحاول معهم لكن لا حياة لمن تنادى من الطرفين وحابب اخذ رايك بالموضوع هل فى امل ? فقلت : رأي انك تستقيل قبل مؤتمر انابولس واكسب بياض الوجه وسيبك من الشرق الأوسط صدقني ما بتستاهلوا شي بوش : لا وحياتك راح يستقيل اولمرت وعباس اذا صار شي فقلت : اسمحي بدى أنام نعسان , بس دير بالك على العراق وأفغانستان اصلو بسمع انه في قتلي بشكل غريب بوش : وما تقلق راح أتوصي بإيران كويس وراح نعمل الوطن العربي كله سلطة قلت : طيب يالله سلام بوش : بس ما تنسانى قلت : له / هو فى حدا راح ينساك وانقطع حلمي برنه جوال حقيقة شرذمت ما تبقى من الحلم , فاعذروني فما هذه المكالمة إلا من عتمة أفكاري فأتمنى للرئيس عباس كل التوفيق وأرجو الا يكون هذا المؤتمر هو رحلة حب قصيرة الأمد . to 510 +INFO root Tue, 26 Mar 2024 18:17:54 Predictions written to /var/home/nhamad/SharedTask2024/nested-final2/output-nested/predictions.txt +INFO root Tue, 26 Mar 2024 18:19:25 + precision recall f1-score support + + AIRPORT 0.0000 0.0000 0.0000 1 + BOUNDARY 0.0000 0.0000 0.0000 3 + BUILDING-OR-GROUNDS 0.4963 0.6618 0.5672 204 + CAMP 0.9146 0.8929 0.9036 168 + CARDINAL 0.8190 0.5556 0.6620 342 + CELESTIAL 0.0000 0.0000 0.0000 2 + CLUSTER 0.3261 0.1948 0.2439 77 + COM 0.6413 0.5315 0.5813 111 + CONTINENT 0.9688 0.5439 0.6966 57 + COUNTRY 0.9429 0.9458 0.9444 1625 + CURR 0.5238 0.5366 0.5301 41 + DATE 0.9302 0.9357 0.9330 3206 + EDU 0.6929 0.7719 0.7303 228 + ENT 0.0000 0.0000 0.0000 1 + EVENT 0.6862 0.6368 0.6606 570 + FAC 0.4968 0.6996 0.5810 223 + GOV 0.8271 0.7954 0.8109 1696 + GPE 0.9484 0.9488 0.9486 4554 + GPE_ORG 0.8493 0.7631 0.8039 325 + LAND-REGION-NATURAL 0.0000 0.0000 0.0000 118 + LANGUAGE 0.9500 0.4419 0.6032 43 + LAW 0.6200 0.6889 0.6526 90 + LOC 0.6285 0.7224 0.6722 281 + MED 0.9599 0.9492 0.9545 807 + MONEY 0.5897 0.6970 0.6389 33 + NEIGHBORHOOD 0.0000 0.0000 0.0000 30 + NONGOV 0.8036 0.8175 0.8105 1151 + NORP 0.6539 0.5934 0.6222 1092 + OCC 0.7816 0.7688 0.7751 1103 + ORDINAL 0.8628 0.9409 0.9002 1083 + ORG 0.8582 0.8648 0.8615 3618 + ORG_FAC 0.0000 0.0000 0.0000 19 + PATH 0.0000 0.0000 0.0000 18 + PERCENT 0.0909 0.7273 0.1616 33 + PERS 0.9059 0.8661 0.8856 1568 + PRODUCT 0.0000 0.0000 0.0000 19 + QUANTITY 0.0000 0.0000 0.0000 9 + REGION-GENERAL 0.7458 0.6377 0.6875 69 +REGION-INTERNATIONAL 0.0000 0.0000 0.0000 29 + REL 0.0000 0.0000 0.0000 25 + SCI 0.0000 0.0000 0.0000 29 + SPO 0.0000 0.0000 0.0000 8 + SPORT 0.0000 0.0000 0.0000 1 + STATE-OR-PROVINCE 0.8379 0.8717 0.8545 421 + SUBAREA-FACILITY 0.0000 0.0000 0.0000 23 + TIME 0.6438 0.5595 0.5987 84 + TOWN 0.9527 0.9354 0.9440 2431 + UNIT 0.0000 0.0000 0.0000 11 + WATER-BODY 0.6154 0.3810 0.4706 21 + WEBSITE 0.4069 0.5086 0.4521 116 + pad> 0.0000 0.0000 0.0000 0 + + micro avg 0.8465 0.8481 0.8473 27817 + macro avg 0.4700 0.4586 0.4538 27817 + weighted avg 0.8537 0.8481 0.8493 27817 + +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:20:48 Epoch 0 | Timestep 2891 | Test Loss 0.117114 | F1 0.847271 +INFO arabiner.trainers.BaseTrainer Tue, 26 Mar 2024 18:20:48 Saving checkpoint to /var/home/nhamad/SharedTask2024/nested-final2/output-nested/checkpoints/checkpoint_0.pt +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:20:53 Epoch 1 | Batch 9/2891 | Timestep 2900 | LR 0.0001000000 | Loss 0.011508 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:20:55 Epoch 1 | Batch 19/2891 | Timestep 2910 | LR 0.0001000000 | Loss 0.148410 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:20:57 Epoch 1 | Batch 29/2891 | Timestep 2920 | LR 0.0001000000 | Loss 0.056251 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:20:59 Epoch 1 | Batch 39/2891 | Timestep 2930 | LR 0.0001000000 | Loss 0.060255 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:21:01 Epoch 1 | Batch 49/2891 | Timestep 2940 | LR 0.0001000000 | Loss 0.183412 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:21:03 Epoch 1 | Batch 59/2891 | Timestep 2950 | LR 0.0001000000 | Loss 0.089176 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:21:05 Epoch 1 | Batch 69/2891 | Timestep 2960 | LR 0.0001000000 | Loss 0.051244 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:21:07 Epoch 1 | Batch 79/2891 | Timestep 2970 | LR 0.0001000000 | Loss 0.049468 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:21:10 Epoch 1 | Batch 89/2891 | Timestep 2980 | LR 0.0001000000 | Loss 0.100368 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:21:12 Epoch 1 | Batch 99/2891 | Timestep 2990 | LR 0.0001000000 | Loss 0.056090 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:21:14 Epoch 1 | Batch 109/2891 | Timestep 3000 | LR 0.0001000000 | Loss 0.157459 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:21:17 Epoch 1 | Batch 119/2891 | Timestep 3010 | LR 0.0001000000 | Loss 0.037233 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:21:19 Epoch 1 | Batch 129/2891 | Timestep 3020 | LR 0.0001000000 | Loss 0.084574 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:21:21 Epoch 1 | Batch 139/2891 | Timestep 3030 | LR 0.0001000000 | Loss 0.062934 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:21:23 Epoch 1 | Batch 149/2891 | Timestep 3040 | LR 0.0001000000 | Loss 0.086093 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:21:25 Epoch 1 | Batch 159/2891 | Timestep 3050 | LR 0.0001000000 | Loss 0.147056 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:21:27 Epoch 1 | Batch 169/2891 | Timestep 3060 | LR 0.0001000000 | Loss 0.057333 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:21:30 Epoch 1 | Batch 179/2891 | Timestep 3070 | LR 0.0001000000 | Loss 0.073360 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:21:32 Epoch 1 | Batch 189/2891 | Timestep 3080 | LR 0.0001000000 | Loss 0.095250 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:21:34 Epoch 1 | Batch 199/2891 | Timestep 3090 | LR 0.0001000000 | Loss 0.306531 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:21:36 Epoch 1 | Batch 209/2891 | Timestep 3100 | LR 0.0001000000 | Loss 0.345306 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:21:39 Epoch 1 | Batch 219/2891 | Timestep 3110 | LR 0.0001000000 | Loss 0.065048 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:21:41 Epoch 1 | Batch 229/2891 | Timestep 3120 | LR 0.0001000000 | Loss 0.110486 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:21:43 Epoch 1 | Batch 239/2891 | Timestep 3130 | LR 0.0001000000 | Loss 0.130801 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:21:45 Epoch 1 | Batch 249/2891 | Timestep 3140 | LR 0.0001000000 | Loss 0.168276 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:21:48 Epoch 1 | Batch 259/2891 | Timestep 3150 | LR 0.0001000000 | Loss 0.016620 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:21:50 Epoch 1 | Batch 269/2891 | Timestep 3160 | LR 0.0001000000 | Loss 0.045944 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:21:52 Epoch 1 | Batch 279/2891 | Timestep 3170 | LR 0.0001000000 | Loss 0.176559 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:21:54 Epoch 1 | Batch 289/2891 | Timestep 3180 | LR 0.0001000000 | Loss 0.016953 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:21:56 Epoch 1 | Batch 299/2891 | Timestep 3190 | LR 0.0001000000 | Loss 0.080666 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:21:58 Epoch 1 | Batch 309/2891 | Timestep 3200 | LR 0.0001000000 | Loss 0.055798 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:22:00 Epoch 1 | Batch 319/2891 | Timestep 3210 | LR 0.0001000000 | Loss 0.075815 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:22:03 Epoch 1 | Batch 329/2891 | Timestep 3220 | LR 0.0001000000 | Loss 0.101039 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:22:05 Epoch 1 | Batch 339/2891 | Timestep 3230 | LR 0.0001000000 | Loss 0.137810 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:22:07 Epoch 1 | Batch 349/2891 | Timestep 3240 | LR 0.0001000000 | Loss 0.241686 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:22:09 Epoch 1 | Batch 359/2891 | Timestep 3250 | LR 0.0001000000 | Loss 0.155758 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:22:12 Epoch 1 | Batch 369/2891 | Timestep 3260 | LR 0.0001000000 | Loss 0.203108 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:22:14 Epoch 1 | Batch 379/2891 | Timestep 3270 | LR 0.0001000000 | Loss 0.134978 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:22:17 Epoch 1 | Batch 389/2891 | Timestep 3280 | LR 0.0001000000 | Loss 0.089875 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:22:19 Epoch 1 | Batch 399/2891 | Timestep 3290 | LR 0.0001000000 | Loss 0.188214 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:22:21 Epoch 1 | Batch 409/2891 | Timestep 3300 | LR 0.0001000000 | Loss 0.195090 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:22:23 Epoch 1 | Batch 419/2891 | Timestep 3310 | LR 0.0001000000 | Loss 0.057749 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:22:26 Epoch 1 | Batch 429/2891 | Timestep 3320 | LR 0.0001000000 | Loss 0.211290 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:22:28 Epoch 1 | Batch 439/2891 | Timestep 3330 | LR 0.0001000000 | Loss 0.099411 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:22:30 Epoch 1 | Batch 449/2891 | Timestep 3340 | LR 0.0001000000 | Loss 0.067226 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:22:33 Epoch 1 | Batch 459/2891 | Timestep 3350 | LR 0.0001000000 | Loss 0.050273 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:22:35 Epoch 1 | Batch 469/2891 | Timestep 3360 | LR 0.0001000000 | Loss 0.152941 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:22:37 Epoch 1 | Batch 479/2891 | Timestep 3370 | LR 0.0001000000 | Loss 0.160365 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:22:40 Epoch 1 | Batch 489/2891 | Timestep 3380 | LR 0.0001000000 | Loss 0.052229 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:22:42 Epoch 1 | Batch 499/2891 | Timestep 3390 | LR 0.0001000000 | Loss 0.087779 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:22:44 Epoch 1 | Batch 509/2891 | Timestep 3400 | LR 0.0001000000 | Loss 0.014699 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:22:46 Epoch 1 | Batch 519/2891 | Timestep 3410 | LR 0.0001000000 | Loss 0.047481 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:22:49 Epoch 1 | Batch 529/2891 | Timestep 3420 | LR 0.0001000000 | Loss 0.078227 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:22:51 Epoch 1 | Batch 539/2891 | Timestep 3430 | LR 0.0001000000 | Loss 0.056593 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:22:53 Epoch 1 | Batch 549/2891 | Timestep 3440 | LR 0.0001000000 | Loss 0.059117 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:22:56 Epoch 1 | Batch 559/2891 | Timestep 3450 | LR 0.0001000000 | Loss 0.022666 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:22:58 Epoch 1 | Batch 569/2891 | Timestep 3460 | LR 0.0001000000 | Loss 0.047447 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:23:00 Epoch 1 | Batch 579/2891 | Timestep 3470 | LR 0.0001000000 | Loss 0.037826 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:23:02 Epoch 1 | Batch 589/2891 | Timestep 3480 | LR 0.0001000000 | Loss 0.176514 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:23:04 Epoch 1 | Batch 599/2891 | Timestep 3490 | LR 0.0001000000 | Loss 0.024708 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:23:06 Epoch 1 | Batch 609/2891 | Timestep 3500 | LR 0.0001000000 | Loss 0.088415 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:23:09 Epoch 1 | Batch 619/2891 | Timestep 3510 | LR 0.0001000000 | Loss 0.074109 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:23:11 Epoch 1 | Batch 629/2891 | Timestep 3520 | LR 0.0001000000 | Loss 0.138585 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:23:13 Epoch 1 | Batch 639/2891 | Timestep 3530 | LR 0.0001000000 | Loss 0.092852 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:23:15 Epoch 1 | Batch 649/2891 | Timestep 3540 | LR 0.0001000000 | Loss 0.067874 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:23:17 Epoch 1 | Batch 659/2891 | Timestep 3550 | LR 0.0001000000 | Loss 0.126758 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:23:20 Epoch 1 | Batch 669/2891 | Timestep 3560 | LR 0.0001000000 | Loss 0.016934 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:23:22 Epoch 1 | Batch 679/2891 | Timestep 3570 | LR 0.0001000000 | Loss 0.080008 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:23:24 Epoch 1 | Batch 689/2891 | Timestep 3580 | LR 0.0001000000 | Loss 0.150466 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:23:26 Epoch 1 | Batch 699/2891 | Timestep 3590 | LR 0.0001000000 | Loss 0.040716 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:23:28 Epoch 1 | Batch 709/2891 | Timestep 3600 | LR 0.0001000000 | Loss 0.041923 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:23:30 Epoch 1 | Batch 719/2891 | Timestep 3610 | LR 0.0001000000 | Loss 0.065143 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:23:32 Epoch 1 | Batch 729/2891 | Timestep 3620 | LR 0.0001000000 | Loss 0.044304 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:23:34 Epoch 1 | Batch 739/2891 | Timestep 3630 | LR 0.0001000000 | Loss 0.045590 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:23:37 Epoch 1 | Batch 749/2891 | Timestep 3640 | LR 0.0001000000 | Loss 0.410057 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:23:39 Epoch 1 | Batch 759/2891 | Timestep 3650 | LR 0.0001000000 | Loss 0.093449 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:23:41 Epoch 1 | Batch 769/2891 | Timestep 3660 | LR 0.0001000000 | Loss 0.144033 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:23:43 Epoch 1 | Batch 779/2891 | Timestep 3670 | LR 0.0001000000 | Loss 0.309833 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:23:45 Epoch 1 | Batch 789/2891 | Timestep 3680 | LR 0.0001000000 | Loss 0.070359 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:23:47 Epoch 1 | Batch 799/2891 | Timestep 3690 | LR 0.0001000000 | Loss 0.193460 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:23:49 Epoch 1 | Batch 809/2891 | Timestep 3700 | LR 0.0001000000 | Loss 0.046506 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:23:51 Epoch 1 | Batch 819/2891 | Timestep 3710 | LR 0.0001000000 | Loss 0.131574 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:23:53 Epoch 1 | Batch 829/2891 | Timestep 3720 | LR 0.0001000000 | Loss 0.122867 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:23:56 Epoch 1 | Batch 839/2891 | Timestep 3730 | LR 0.0001000000 | Loss 0.063806 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:23:58 Epoch 1 | Batch 849/2891 | Timestep 3740 | LR 0.0001000000 | Loss 0.060902 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:24:00 Epoch 1 | Batch 859/2891 | Timestep 3750 | LR 0.0001000000 | Loss 0.084618 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:24:02 Epoch 1 | Batch 869/2891 | Timestep 3760 | LR 0.0001000000 | Loss 0.082519 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:24:04 Epoch 1 | Batch 879/2891 | Timestep 3770 | LR 0.0001000000 | Loss 0.049387 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:24:06 Epoch 1 | Batch 889/2891 | Timestep 3780 | LR 0.0001000000 | Loss 0.015429 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:24:08 Epoch 1 | Batch 899/2891 | Timestep 3790 | LR 0.0001000000 | Loss 0.251805 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:24:10 Epoch 1 | Batch 909/2891 | Timestep 3800 | LR 0.0001000000 | Loss 0.043591 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:24:13 Epoch 1 | Batch 919/2891 | Timestep 3810 | LR 0.0001000000 | Loss 0.058976 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:24:15 Epoch 1 | Batch 929/2891 | Timestep 3820 | LR 0.0001000000 | Loss 0.043413 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:24:17 Epoch 1 | Batch 939/2891 | Timestep 3830 | LR 0.0001000000 | Loss 0.065555 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:24:20 Epoch 1 | Batch 949/2891 | Timestep 3840 | LR 0.0001000000 | Loss 0.106713 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:24:22 Epoch 1 | Batch 959/2891 | Timestep 3850 | LR 0.0001000000 | Loss 0.095943 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:24:24 Epoch 1 | Batch 969/2891 | Timestep 3860 | LR 0.0001000000 | Loss 0.066703 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:24:26 Epoch 1 | Batch 979/2891 | Timestep 3870 | LR 0.0001000000 | Loss 0.202804 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:24:29 Epoch 1 | Batch 989/2891 | Timestep 3880 | LR 0.0001000000 | Loss 0.085232 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:24:31 Epoch 1 | Batch 999/2891 | Timestep 3890 | LR 0.0001000000 | Loss 0.056393 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:24:33 Epoch 1 | Batch 1009/2891 | Timestep 3900 | LR 0.0001000000 | Loss 0.050035 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:24:36 Epoch 1 | Batch 1019/2891 | Timestep 3910 | LR 0.0001000000 | Loss 0.076341 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:24:38 Epoch 1 | Batch 1029/2891 | Timestep 3920 | LR 0.0001000000 | Loss 0.251378 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:24:40 Epoch 1 | Batch 1039/2891 | Timestep 3930 | LR 0.0001000000 | Loss 67.409796 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:24:43 Epoch 1 | Batch 1049/2891 | Timestep 3940 | LR 0.0001000000 | Loss 0.077842 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:24:45 Epoch 1 | Batch 1059/2891 | Timestep 3950 | LR 0.0001000000 | Loss 0.086828 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:24:47 Epoch 1 | Batch 1069/2891 | Timestep 3960 | LR 0.0001000000 | Loss 0.052048 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:24:49 Epoch 1 | Batch 1079/2891 | Timestep 3970 | LR 0.0001000000 | Loss 0.044656 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:24:51 Epoch 1 | Batch 1089/2891 | Timestep 3980 | LR 0.0001000000 | Loss 0.024491 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:24:53 Epoch 1 | Batch 1099/2891 | Timestep 3990 | LR 0.0001000000 | Loss 0.129334 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:24:55 Epoch 1 | Batch 1109/2891 | Timestep 4000 | LR 0.0001000000 | Loss 0.035419 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:24:58 Epoch 1 | Batch 1119/2891 | Timestep 4010 | LR 0.0001000000 | Loss 0.054381 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:25:00 Epoch 1 | Batch 1129/2891 | Timestep 4020 | LR 0.0001000000 | Loss 0.082329 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:25:02 Epoch 1 | Batch 1139/2891 | Timestep 4030 | LR 0.0001000000 | Loss 0.071322 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:25:04 Epoch 1 | Batch 1149/2891 | Timestep 4040 | LR 0.0001000000 | Loss 0.073513 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:25:07 Epoch 1 | Batch 1159/2891 | Timestep 4050 | LR 0.0001000000 | Loss 0.016943 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:25:09 Epoch 1 | Batch 1169/2891 | Timestep 4060 | LR 0.0001000000 | Loss 0.030966 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:25:11 Epoch 1 | Batch 1179/2891 | Timestep 4070 | LR 0.0001000000 | Loss 0.124376 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:25:13 Epoch 1 | Batch 1189/2891 | Timestep 4080 | LR 0.0001000000 | Loss 0.019648 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:25:15 Epoch 1 | Batch 1199/2891 | Timestep 4090 | LR 0.0001000000 | Loss 0.225541 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:25:17 Epoch 1 | Batch 1209/2891 | Timestep 4100 | LR 0.0001000000 | Loss 0.074614 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:25:19 Epoch 1 | Batch 1219/2891 | Timestep 4110 | LR 0.0001000000 | Loss 0.036873 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:25:22 Epoch 1 | Batch 1229/2891 | Timestep 4120 | LR 0.0001000000 | Loss 0.053285 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:25:24 Epoch 1 | Batch 1239/2891 | Timestep 4130 | LR 0.0001000000 | Loss 0.159765 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:25:26 Epoch 1 | Batch 1249/2891 | Timestep 4140 | LR 0.0001000000 | Loss 0.066283 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:25:28 Epoch 1 | Batch 1259/2891 | Timestep 4150 | LR 0.0001000000 | Loss 0.075840 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:25:30 Epoch 1 | Batch 1269/2891 | Timestep 4160 | LR 0.0001000000 | Loss 0.072868 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:25:32 Epoch 1 | Batch 1279/2891 | Timestep 4170 | LR 0.0001000000 | Loss 0.283907 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:25:35 Epoch 1 | Batch 1289/2891 | Timestep 4180 | LR 0.0001000000 | Loss 0.021497 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:25:37 Epoch 1 | Batch 1299/2891 | Timestep 4190 | LR 0.0001000000 | Loss 0.037187 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:25:39 Epoch 1 | Batch 1309/2891 | Timestep 4200 | LR 0.0001000000 | Loss 0.095742 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:25:42 Epoch 1 | Batch 1319/2891 | Timestep 4210 | LR 0.0001000000 | Loss 0.045021 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:25:44 Epoch 1 | Batch 1329/2891 | Timestep 4220 | LR 0.0001000000 | Loss 0.125412 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:25:46 Epoch 1 | Batch 1339/2891 | Timestep 4230 | LR 0.0001000000 | Loss 0.143270 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:25:48 Epoch 1 | Batch 1349/2891 | Timestep 4240 | LR 0.0001000000 | Loss 0.035980 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:25:50 Epoch 1 | Batch 1359/2891 | Timestep 4250 | LR 0.0001000000 | Loss 0.052895 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:25:52 Epoch 1 | Batch 1369/2891 | Timestep 4260 | LR 0.0001000000 | Loss 0.206348 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:25:54 Epoch 1 | Batch 1379/2891 | Timestep 4270 | LR 0.0001000000 | Loss 0.106020 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:25:56 Epoch 1 | Batch 1389/2891 | Timestep 4280 | LR 0.0001000000 | Loss 0.213676 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:25:58 Epoch 1 | Batch 1399/2891 | Timestep 4290 | LR 0.0001000000 | Loss 0.043017 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:26:01 Epoch 1 | Batch 1409/2891 | Timestep 4300 | LR 0.0001000000 | Loss 0.043267 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:26:03 Epoch 1 | Batch 1419/2891 | Timestep 4310 | LR 0.0001000000 | Loss 0.080159 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:26:05 Epoch 1 | Batch 1429/2891 | Timestep 4320 | LR 0.0001000000 | Loss 0.154820 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:26:07 Epoch 1 | Batch 1439/2891 | Timestep 4330 | LR 0.0001000000 | Loss 0.367323 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:26:09 Epoch 1 | Batch 1449/2891 | Timestep 4340 | LR 0.0001000000 | Loss 0.150009 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:26:11 Epoch 1 | Batch 1459/2891 | Timestep 4350 | LR 0.0001000000 | Loss 0.178443 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:26:14 Epoch 1 | Batch 1469/2891 | Timestep 4360 | LR 0.0001000000 | Loss 0.025685 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:26:16 Epoch 1 | Batch 1479/2891 | Timestep 4370 | LR 0.0001000000 | Loss 0.122365 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:26:18 Epoch 1 | Batch 1489/2891 | Timestep 4380 | LR 0.0001000000 | Loss 0.279992 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:26:20 Epoch 1 | Batch 1499/2891 | Timestep 4390 | LR 0.0001000000 | Loss 0.142531 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:26:22 Epoch 1 | Batch 1509/2891 | Timestep 4400 | LR 0.0001000000 | Loss 0.107420 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:26:24 Epoch 1 | Batch 1519/2891 | Timestep 4410 | LR 0.0001000000 | Loss 0.030031 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:26:26 Epoch 1 | Batch 1529/2891 | Timestep 4420 | LR 0.0001000000 | Loss 0.098229 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:26:28 Epoch 1 | Batch 1539/2891 | Timestep 4430 | LR 0.0001000000 | Loss 0.032560 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:26:30 Epoch 1 | Batch 1549/2891 | Timestep 4440 | LR 0.0001000000 | Loss 0.109510 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:26:32 Epoch 1 | Batch 1559/2891 | Timestep 4450 | LR 0.0001000000 | Loss 0.127337 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:26:35 Epoch 1 | Batch 1569/2891 | Timestep 4460 | LR 0.0001000000 | Loss 0.038975 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:26:37 Epoch 1 | Batch 1579/2891 | Timestep 4470 | LR 0.0001000000 | Loss 0.047590 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:26:39 Epoch 1 | Batch 1589/2891 | Timestep 4480 | LR 0.0001000000 | Loss 0.152673 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:26:41 Epoch 1 | Batch 1599/2891 | Timestep 4490 | LR 0.0001000000 | Loss 0.036382 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:26:43 Epoch 1 | Batch 1609/2891 | Timestep 4500 | LR 0.0001000000 | Loss 0.032007 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:26:45 Epoch 1 | Batch 1619/2891 | Timestep 4510 | LR 0.0001000000 | Loss 0.055843 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:26:47 Epoch 1 | Batch 1629/2891 | Timestep 4520 | LR 0.0001000000 | Loss 0.124311 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:26:49 Epoch 1 | Batch 1639/2891 | Timestep 4530 | LR 0.0001000000 | Loss 0.079950 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:26:51 Epoch 1 | Batch 1649/2891 | Timestep 4540 | LR 0.0001000000 | Loss 0.123941 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:26:54 Epoch 1 | Batch 1659/2891 | Timestep 4550 | LR 0.0001000000 | Loss 0.033654 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:26:56 Epoch 1 | Batch 1669/2891 | Timestep 4560 | LR 0.0001000000 | Loss 0.039894 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:26:58 Epoch 1 | Batch 1679/2891 | Timestep 4570 | LR 0.0001000000 | Loss 0.125537 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:27:01 Epoch 1 | Batch 1689/2891 | Timestep 4580 | LR 0.0001000000 | Loss 0.092813 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:27:03 Epoch 1 | Batch 1699/2891 | Timestep 4590 | LR 0.0001000000 | Loss 0.035405 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:27:06 Epoch 1 | Batch 1709/2891 | Timestep 4600 | LR 0.0001000000 | Loss 0.059089 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:27:08 Epoch 1 | Batch 1719/2891 | Timestep 4610 | LR 0.0001000000 | Loss 0.036137 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:27:10 Epoch 1 | Batch 1729/2891 | Timestep 4620 | LR 0.0001000000 | Loss 0.139567 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:27:12 Epoch 1 | Batch 1739/2891 | Timestep 4630 | LR 0.0001000000 | Loss 0.255654 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:27:14 Epoch 1 | Batch 1749/2891 | Timestep 4640 | LR 0.0001000000 | Loss 0.210296 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:27:16 Epoch 1 | Batch 1759/2891 | Timestep 4650 | LR 0.0001000000 | Loss 0.034763 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:27:18 Epoch 1 | Batch 1769/2891 | Timestep 4660 | LR 0.0001000000 | Loss 0.094820 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:27:20 Epoch 1 | Batch 1779/2891 | Timestep 4670 | LR 0.0001000000 | Loss 0.031951 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:27:22 Epoch 1 | Batch 1789/2891 | Timestep 4680 | LR 0.0001000000 | Loss 0.078896 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:27:24 Epoch 1 | Batch 1799/2891 | Timestep 4690 | LR 0.0001000000 | Loss 0.132561 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:27:26 Epoch 1 | Batch 1809/2891 | Timestep 4700 | LR 0.0001000000 | Loss 0.098079 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:27:29 Epoch 1 | Batch 1819/2891 | Timestep 4710 | LR 0.0001000000 | Loss 0.043283 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:27:31 Epoch 1 | Batch 1829/2891 | Timestep 4720 | LR 0.0001000000 | Loss 0.034138 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:27:33 Epoch 1 | Batch 1839/2891 | Timestep 4730 | LR 0.0001000000 | Loss 0.222602 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:27:35 Epoch 1 | Batch 1849/2891 | Timestep 4740 | LR 0.0001000000 | Loss 0.034799 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:27:37 Epoch 1 | Batch 1859/2891 | Timestep 4750 | LR 0.0001000000 | Loss 0.065892 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:27:39 Epoch 1 | Batch 1869/2891 | Timestep 4760 | LR 0.0001000000 | Loss 0.018785 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:27:41 Epoch 1 | Batch 1879/2891 | Timestep 4770 | LR 0.0001000000 | Loss 0.175595 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:27:44 Epoch 1 | Batch 1889/2891 | Timestep 4780 | LR 0.0001000000 | Loss 0.049051 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:27:46 Epoch 1 | Batch 1899/2891 | Timestep 4790 | LR 0.0001000000 | Loss 0.217213 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:27:48 Epoch 1 | Batch 1909/2891 | Timestep 4800 | LR 0.0001000000 | Loss 0.073151 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:27:51 Epoch 1 | Batch 1919/2891 | Timestep 4810 | LR 0.0001000000 | Loss 0.007193 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:27:53 Epoch 1 | Batch 1929/2891 | Timestep 4820 | LR 0.0001000000 | Loss 0.006786 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:27:55 Epoch 1 | Batch 1939/2891 | Timestep 4830 | LR 0.0001000000 | Loss 0.013931 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:27:57 Epoch 1 | Batch 1949/2891 | Timestep 4840 | LR 0.0001000000 | Loss 0.087274 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:27:59 Epoch 1 | Batch 1959/2891 | Timestep 4850 | LR 0.0001000000 | Loss 0.126400 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:28:01 Epoch 1 | Batch 1969/2891 | Timestep 4860 | LR 0.0001000000 | Loss 0.140515 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:28:04 Epoch 1 | Batch 1979/2891 | Timestep 4870 | LR 0.0001000000 | Loss 0.320507 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:28:06 Epoch 1 | Batch 1989/2891 | Timestep 4880 | LR 0.0001000000 | Loss 0.078709 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:28:08 Epoch 1 | Batch 1999/2891 | Timestep 4890 | LR 0.0001000000 | Loss 0.030040 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:28:10 Epoch 1 | Batch 2009/2891 | Timestep 4900 | LR 0.0001000000 | Loss 0.052227 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:28:12 Epoch 1 | Batch 2019/2891 | Timestep 4910 | LR 0.0001000000 | Loss 0.137730 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:28:14 Epoch 1 | Batch 2029/2891 | Timestep 4920 | LR 0.0001000000 | Loss 0.041783 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:28:16 Epoch 1 | Batch 2039/2891 | Timestep 4930 | LR 0.0001000000 | Loss 0.008487 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:28:19 Epoch 1 | Batch 2049/2891 | Timestep 4940 | LR 0.0001000000 | Loss 0.040532 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:28:21 Epoch 1 | Batch 2059/2891 | Timestep 4950 | LR 0.0001000000 | Loss 0.109585 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:28:23 Epoch 1 | Batch 2069/2891 | Timestep 4960 | LR 0.0001000000 | Loss 0.033018 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:28:25 Epoch 1 | Batch 2079/2891 | Timestep 4970 | LR 0.0001000000 | Loss 0.026058 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:28:27 Epoch 1 | Batch 2089/2891 | Timestep 4980 | LR 0.0001000000 | Loss 0.106670 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:28:29 Epoch 1 | Batch 2099/2891 | Timestep 4990 | LR 0.0001000000 | Loss 0.024720 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:28:31 Epoch 1 | Batch 2109/2891 | Timestep 5000 | LR 0.0001000000 | Loss 0.047378 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:28:33 Epoch 1 | Batch 2119/2891 | Timestep 5010 | LR 0.0001000000 | Loss 0.023874 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:28:35 Epoch 1 | Batch 2129/2891 | Timestep 5020 | LR 0.0001000000 | Loss 0.028326 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:28:38 Epoch 1 | Batch 2139/2891 | Timestep 5030 | LR 0.0001000000 | Loss 0.109096 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:28:40 Epoch 1 | Batch 2149/2891 | Timestep 5040 | LR 0.0001000000 | Loss 0.097805 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:28:42 Epoch 1 | Batch 2159/2891 | Timestep 5050 | LR 0.0001000000 | Loss 0.334257 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:28:44 Epoch 1 | Batch 2169/2891 | Timestep 5060 | LR 0.0001000000 | Loss 0.139660 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:28:46 Epoch 1 | Batch 2179/2891 | Timestep 5070 | LR 0.0001000000 | Loss 0.052987 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:28:48 Epoch 1 | Batch 2189/2891 | Timestep 5080 | LR 0.0001000000 | Loss 0.034421 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:28:50 Epoch 1 | Batch 2199/2891 | Timestep 5090 | LR 0.0001000000 | Loss 0.112319 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:28:52 Epoch 1 | Batch 2209/2891 | Timestep 5100 | LR 0.0001000000 | Loss 0.103895 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:28:54 Epoch 1 | Batch 2219/2891 | Timestep 5110 | LR 0.0001000000 | Loss 0.031326 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:28:57 Epoch 1 | Batch 2229/2891 | Timestep 5120 | LR 0.0001000000 | Loss 0.125075 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:28:59 Epoch 1 | Batch 2239/2891 | Timestep 5130 | LR 0.0001000000 | Loss 0.211002 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:29:01 Epoch 1 | Batch 2249/2891 | Timestep 5140 | LR 0.0001000000 | Loss 0.102973 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:29:04 Epoch 1 | Batch 2259/2891 | Timestep 5150 | LR 0.0001000000 | Loss 0.033817 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:29:06 Epoch 1 | Batch 2269/2891 | Timestep 5160 | LR 0.0001000000 | Loss 0.028272 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:29:08 Epoch 1 | Batch 2279/2891 | Timestep 5170 | LR 0.0001000000 | Loss 0.067428 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:29:10 Epoch 1 | Batch 2289/2891 | Timestep 5180 | LR 0.0001000000 | Loss 0.113936 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:29:12 Epoch 1 | Batch 2299/2891 | Timestep 5190 | LR 0.0001000000 | Loss 0.090977 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:29:14 Epoch 1 | Batch 2309/2891 | Timestep 5200 | LR 0.0001000000 | Loss 0.083165 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:29:17 Epoch 1 | Batch 2319/2891 | Timestep 5210 | LR 0.0001000000 | Loss 0.028863 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:29:19 Epoch 1 | Batch 2329/2891 | Timestep 5220 | LR 0.0001000000 | Loss 0.028800 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:29:21 Epoch 1 | Batch 2339/2891 | Timestep 5230 | LR 0.0001000000 | Loss 0.049550 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:29:23 Epoch 1 | Batch 2349/2891 | Timestep 5240 | LR 0.0001000000 | Loss 0.068504 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:29:25 Epoch 1 | Batch 2359/2891 | Timestep 5250 | LR 0.0001000000 | Loss 0.110953 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:29:27 Epoch 1 | Batch 2369/2891 | Timestep 5260 | LR 0.0001000000 | Loss 0.038624 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:29:30 Epoch 1 | Batch 2379/2891 | Timestep 5270 | LR 0.0001000000 | Loss 0.163701 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:29:32 Epoch 1 | Batch 2389/2891 | Timestep 5280 | LR 0.0001000000 | Loss 0.017049 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:29:35 Epoch 1 | Batch 2399/2891 | Timestep 5290 | LR 0.0001000000 | Loss 0.038065 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:29:37 Epoch 1 | Batch 2409/2891 | Timestep 5300 | LR 0.0001000000 | Loss 0.064216 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:29:39 Epoch 1 | Batch 2419/2891 | Timestep 5310 | LR 0.0001000000 | Loss 0.081940 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:29:41 Epoch 1 | Batch 2429/2891 | Timestep 5320 | LR 0.0001000000 | Loss 0.079505 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:29:44 Epoch 1 | Batch 2439/2891 | Timestep 5330 | LR 0.0001000000 | Loss 0.012274 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:29:46 Epoch 1 | Batch 2449/2891 | Timestep 5340 | LR 0.0001000000 | Loss 0.036414 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:29:48 Epoch 1 | Batch 2459/2891 | Timestep 5350 | LR 0.0001000000 | Loss 0.085186 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:29:50 Epoch 1 | Batch 2469/2891 | Timestep 5360 | LR 0.0001000000 | Loss 0.011095 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:29:52 Epoch 1 | Batch 2479/2891 | Timestep 5370 | LR 0.0001000000 | Loss 0.125796 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:29:54 Epoch 1 | Batch 2489/2891 | Timestep 5380 | LR 0.0001000000 | Loss 0.046424 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:29:56 Epoch 1 | Batch 2499/2891 | Timestep 5390 | LR 0.0001000000 | Loss 0.041577 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:29:58 Epoch 1 | Batch 2509/2891 | Timestep 5400 | LR 0.0001000000 | Loss 0.114531 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:30:01 Epoch 1 | Batch 2519/2891 | Timestep 5410 | LR 0.0001000000 | Loss 0.052067 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:30:03 Epoch 1 | Batch 2529/2891 | Timestep 5420 | LR 0.0001000000 | Loss 0.013347 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:30:05 Epoch 1 | Batch 2539/2891 | Timestep 5430 | LR 0.0001000000 | Loss 0.007116 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:30:07 Epoch 1 | Batch 2549/2891 | Timestep 5440 | LR 0.0001000000 | Loss 0.015797 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:30:10 Epoch 1 | Batch 2559/2891 | Timestep 5450 | LR 0.0001000000 | Loss 0.025582 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:30:12 Epoch 1 | Batch 2569/2891 | Timestep 5460 | LR 0.0001000000 | Loss 0.090455 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:30:14 Epoch 1 | Batch 2579/2891 | Timestep 5470 | LR 0.0001000000 | Loss 0.079720 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:30:16 Epoch 1 | Batch 2589/2891 | Timestep 5480 | LR 0.0001000000 | Loss 0.096370 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:30:18 Epoch 1 | Batch 2599/2891 | Timestep 5490 | LR 0.0001000000 | Loss 0.153541 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:30:20 Epoch 1 | Batch 2609/2891 | Timestep 5500 | LR 0.0001000000 | Loss 0.128111 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:30:22 Epoch 1 | Batch 2619/2891 | Timestep 5510 | LR 0.0001000000 | Loss 0.029471 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:30:24 Epoch 1 | Batch 2629/2891 | Timestep 5520 | LR 0.0001000000 | Loss 0.040927 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:30:26 Epoch 1 | Batch 2639/2891 | Timestep 5530 | LR 0.0001000000 | Loss 0.069531 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:30:28 Epoch 1 | Batch 2649/2891 | Timestep 5540 | LR 0.0001000000 | Loss 0.015692 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:30:30 Epoch 1 | Batch 2659/2891 | Timestep 5550 | LR 0.0001000000 | Loss 0.119628 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:30:32 Epoch 1 | Batch 2669/2891 | Timestep 5560 | LR 0.0001000000 | Loss 0.622219 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:30:35 Epoch 1 | Batch 2679/2891 | Timestep 5570 | LR 0.0001000000 | Loss 0.072905 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:30:37 Epoch 1 | Batch 2689/2891 | Timestep 5580 | LR 0.0001000000 | Loss 0.122728 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:30:39 Epoch 1 | Batch 2699/2891 | Timestep 5590 | LR 0.0001000000 | Loss 0.024105 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:30:41 Epoch 1 | Batch 2709/2891 | Timestep 5600 | LR 0.0001000000 | Loss 0.051693 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:30:43 Epoch 1 | Batch 2719/2891 | Timestep 5610 | LR 0.0001000000 | Loss 0.061380 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:30:45 Epoch 1 | Batch 2729/2891 | Timestep 5620 | LR 0.0001000000 | Loss 0.072375 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:30:47 Epoch 1 | Batch 2739/2891 | Timestep 5630 | LR 0.0001000000 | Loss 0.017230 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:30:50 Epoch 1 | Batch 2749/2891 | Timestep 5640 | LR 0.0001000000 | Loss 0.123618 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:30:52 Epoch 1 | Batch 2759/2891 | Timestep 5650 | LR 0.0001000000 | Loss 0.045696 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:30:54 Epoch 1 | Batch 2769/2891 | Timestep 5660 | LR 0.0001000000 | Loss 0.101566 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:30:56 Epoch 1 | Batch 2779/2891 | Timestep 5670 | LR 0.0001000000 | Loss 0.053790 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:30:58 Epoch 1 | Batch 2789/2891 | Timestep 5680 | LR 0.0001000000 | Loss 0.093806 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:31:00 Epoch 1 | Batch 2799/2891 | Timestep 5690 | LR 0.0001000000 | Loss 0.012404 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:31:02 Epoch 1 | Batch 2809/2891 | Timestep 5700 | LR 0.0001000000 | Loss 0.062456 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:31:04 Epoch 1 | Batch 2819/2891 | Timestep 5710 | LR 0.0001000000 | Loss 0.067261 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:31:06 Epoch 1 | Batch 2829/2891 | Timestep 5720 | LR 0.0001000000 | Loss 0.022286 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:31:08 Epoch 1 | Batch 2839/2891 | Timestep 5730 | LR 0.0001000000 | Loss 0.062633 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:31:11 Epoch 1 | Batch 2849/2891 | Timestep 5740 | LR 0.0001000000 | Loss 0.042128 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:31:14 Epoch 1 | Batch 2859/2891 | Timestep 5750 | LR 0.0001000000 | Loss 0.144254 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:31:16 Epoch 1 | Batch 2869/2891 | Timestep 5760 | LR 0.0001000000 | Loss 0.002541 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:31:19 Epoch 1 | Batch 2879/2891 | Timestep 5770 | LR 0.0001000000 | Loss 0.057364 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:31:21 Epoch 1 | Batch 2889/2891 | Timestep 5780 | LR 0.0001000000 | Loss 0.063289 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:31:22 ** Evaluating on validation dataset ** +INFO root Tue, 26 Mar 2024 18:32:42 + precision recall f1-score support + + BOUNDARY 0.0000 0.0000 0.0000 4 + BUILDING-OR-GROUNDS 0.7379 0.7308 0.7343 104 + CAMP 0.9552 0.9014 0.9275 71 + CARDINAL 0.7633 0.7588 0.7611 170 + CLUSTER 0.3846 0.1923 0.2564 26 + COM 0.1726 0.7436 0.2802 39 + CONTINENT 0.9565 0.9565 0.9565 23 + COUNTRY 0.9782 0.9653 0.9717 835 + CURR 0.8571 0.7500 0.8000 24 + DATE 0.9194 0.9308 0.9251 1691 + EDU 0.8584 0.8899 0.8739 109 + ENT 0.0000 0.0000 0.0000 1 + EVENT 0.5783 0.6575 0.6154 292 + FAC 0.8113 0.7748 0.7926 111 + GOV 0.7920 0.8942 0.8400 860 + GPE 0.9588 0.9469 0.9528 2261 + GPE_ORG 0.6937 0.9222 0.7918 167 + LAND-REGION-NATURAL 0.0000 0.0000 0.0000 52 + LANGUAGE 0.7692 0.6250 0.6897 16 + LAW 0.6032 0.8085 0.6909 47 + LOC 0.5447 0.5276 0.5360 127 + MED 0.9904 0.9833 0.9868 419 + MONEY 0.4828 0.6364 0.5490 22 + NEIGHBORHOOD 0.0000 0.0000 0.0000 5 + NONGOV 0.8479 0.7811 0.8131 571 + NORP 0.5906 0.5681 0.5791 551 + OCC 0.7613 0.8065 0.7833 522 + ORDINAL 0.9675 0.8750 0.9189 544 + ORG 0.8692 0.9207 0.8942 1790 + ORG_FAC 0.2308 0.4286 0.3000 7 + PATH 0.3333 0.1667 0.2222 6 + PERCENT 0.9231 1.0000 0.9600 12 + PERS 0.8990 0.9175 0.9082 679 + PRODUCT 0.0000 0.0000 0.0000 8 + QUANTITY 0.3333 0.6667 0.4444 3 + REGION-GENERAL 0.3590 0.3784 0.3684 37 +REGION-INTERNATIONAL 0.0000 0.0000 0.0000 12 + REL 0.4000 0.6000 0.4800 10 + SCI 0.2222 0.1538 0.1818 13 + SPO 0.0000 0.0000 0.0000 2 + SPORT 0.0000 0.0000 0.0000 4 + STATE-OR-PROVINCE 0.5714 0.4916 0.5285 179 + SUBAREA-FACILITY 0.0000 0.0000 0.0000 16 + TIME 0.6571 0.6970 0.6765 33 + TOWN 0.9335 0.9458 0.9396 1217 + UNIT 0.5000 0.7500 0.6000 4 + WATER-BODY 0.3684 0.5000 0.4242 14 + WEBSITE 0.4881 0.5125 0.5000 80 + + micro avg 0.8520 0.8690 0.8604 13790 + macro avg 0.5430 0.5782 0.5511 13790 + weighted avg 0.8557 0.8690 0.8608 13790 + +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:33:24 Epoch 1 | Timestep 5782 | Train Loss 0.156982 | Val Loss 0.096819 | F1 0.860415 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:33:24 ** Validation improved, evaluating test data ** +INFO arabiner.data.transforms Tue, 26 Mar 2024 18:33:28 Truncating the sequence لكن صوت جوالي مزعج ما دفعني للنهوض وبعصبية وارتباك من هذا الاتصال وخصوصا أن الساعة الواحدة والنصف يعنى عز دين النوم فأمسكت الجوال وقمت بالضغط على زر الرد . فقلت الو مين معي فقال معك الرئيس فقلت رئيس مين بالضبط فقال جورج بوش رئيس الولايات المتحدة الأمريكية فقلت اهلا أهلا يا سيادة الرئيس , بس أنا على حد علمي انه الرئيس جورج بوش بتكلم اللغة الانجليزية فكيف أنت بتحكي عربي بوش انأ بتكلم اللغة العربية جيدا حتى أنى ممكن أحكى باللهجة الغزواية . فقلت عليك اه خير شو مالك متصل فيا وكيف عرفت رقمي بوش ما في شي قلت أسال كيف أهل غزة بجو الحصار أما كيف عرفت رقمك فقلت لمديرة مكتبي أعطيني اتصال مباشر مع اى شخص من غزة فقلت غزة ااه بدك تعرف أخبار غزة صامدين صامدين ومش راح نتخلى عن الثوابت الفلسطينية لو شو ما تعملوا بوش يعنى بدك تقنعني انه ما فى نتيجة من الحصار فقلت لا ما في نتيجة لأنه إحنا بنخاف على بعض وبنحب بعض حتى رغيف الخبز مرات بنتقاسموا بوش اه واضح حتى التعذيب بتتقاسموه بالضفة وغزة فقلت يا عمى هيك عارف كل شى , شو بدك من الأخر لأني بدى أنام بوش شو رأيك تحضر مؤتمر انابولس فقلت احضر شو , شمعنا أنا يعني بوش هيك اجت فى بالى الفكرة فقلت لا لا مش فاضى , ميش مستعد اضيع وقتي في شي عارف نهايته بوش طيب تابعنا على التلفزيون منه بتعرف شو صار قلت صدقني وقتي فل , بكون بقرا بكتاب الجنة لا تبعد كثيرا بوش غريبة أول إنسان عربي ادعوه على المؤتمر ويكون وقته مشغول قلت شكلوا الكل مضيوف بالبيت الأبيض بوش اه مليان مش عارف أتحرك براحتي مخنوق فقلت اذا انت مخنوق شو نقول احنا بوش عارف بحاول معهم لكن لا حياة لمن تنادى من الطرفين وحابب اخذ رايك بالموضوع هل فى امل ? فقلت : رأي انك تستقيل قبل مؤتمر انابولس واكسب بياض الوجه وسيبك من الشرق الأوسط صدقني ما بتستاهلوا شي بوش : لا وحياتك راح يستقيل اولمرت وعباس اذا صار شي فقلت : اسمحي بدى أنام نعسان , بس دير بالك على العراق وأفغانستان اصلو بسمع انه في قتلي بشكل غريب بوش : وما تقلق راح أتوصي بإيران كويس وراح نعمل الوطن العربي كله سلطة قلت : طيب يالله سلام بوش : بس ما تنسانى قلت : له / هو فى حدا راح ينساك وانقطع حلمي برنه جوال حقيقة شرذمت ما تبقى من الحلم , فاعذروني فما هذه المكالمة إلا من عتمة أفكاري فأتمنى للرئيس عباس كل التوفيق وأرجو الا يكون هذا المؤتمر هو رحلة حب قصيرة الأمد . to 510 +INFO root Tue, 26 Mar 2024 18:34:31 Predictions written to /var/home/nhamad/SharedTask2024/nested-final2/output-nested/predictions.txt +INFO root Tue, 26 Mar 2024 18:36:03 + precision recall f1-score support + + AIRPORT 0.0000 0.0000 0.0000 1 + BOUNDARY 0.0000 0.0000 0.0000 3 + BUILDING-OR-GROUNDS 0.6207 0.6176 0.6192 204 + CAMP 0.9441 0.9048 0.9240 168 + CARDINAL 0.7937 0.8099 0.8017 342 + CELESTIAL 0.0000 0.0000 0.0000 2 + CLUSTER 0.4138 0.1558 0.2264 77 + COM 0.2139 0.7748 0.3353 111 + CONTINENT 0.9565 0.7719 0.8544 57 + COUNTRY 0.9665 0.9588 0.9626 1625 + CURR 0.8000 0.6829 0.7368 41 + DATE 0.9202 0.9357 0.9279 3206 + EDU 0.8095 0.8202 0.8148 228 + ENT 0.0000 0.0000 0.0000 1 + EVENT 0.5991 0.6947 0.6434 570 + FAC 0.7374 0.6547 0.6936 223 + GOV 0.7894 0.8886 0.8361 1696 + GPE 0.9512 0.9407 0.9459 4554 + GPE_ORG 0.7644 0.8985 0.8260 325 + LAND-REGION-NATURAL 0.0000 0.0000 0.0000 118 + LANGUAGE 0.9286 0.6047 0.7324 43 + LAW 0.6518 0.8111 0.7228 90 + LOC 0.5437 0.5089 0.5257 281 + MED 0.9839 0.9814 0.9826 807 + MONEY 0.4792 0.6970 0.5679 33 + NEIGHBORHOOD 0.0000 0.0000 0.0000 30 + NONGOV 0.8192 0.7480 0.7820 1151 + NORP 0.6413 0.6108 0.6257 1092 + OCC 0.7771 0.7933 0.7851 1103 + ORDINAL 0.9646 0.8800 0.9203 1083 + ORG 0.8423 0.9093 0.8745 3618 + ORG_FAC 0.3333 0.5789 0.4231 19 + PATH 0.3750 0.1667 0.2308 18 + PERCENT 0.8621 0.7576 0.8065 33 + PERS 0.8874 0.9050 0.8961 1568 + PRODUCT 0.0000 0.0000 0.0000 19 + QUANTITY 0.1429 0.3333 0.2000 9 + REGION-GENERAL 0.2381 0.2174 0.2273 69 +REGION-INTERNATIONAL 0.0870 0.0690 0.0769 29 + REL 0.6250 0.6000 0.6122 25 + SCI 0.3214 0.3103 0.3158 29 + SPO 0.0000 0.0000 0.0000 8 + SPORT 0.0000 0.0000 0.0000 1 + STATE-OR-PROVINCE 0.6464 0.5297 0.5822 421 + SUBAREA-FACILITY 0.0000 0.0000 0.0000 23 + TIME 0.6753 0.6190 0.6460 84 + TOWN 0.9209 0.9432 0.9319 2431 + UNIT 0.3478 0.7273 0.4706 11 + WATER-BODY 0.3000 0.5714 0.3934 21 + WEBSITE 0.3741 0.4741 0.4183 116 + + micro avg 0.8454 0.8607 0.8530 27817 + macro avg 0.5210 0.5371 0.5180 27817 + weighted avg 0.8478 0.8607 0.8524 27817 + +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:37:27 Epoch 1 | Timestep 5782 | Test Loss 0.105160 | F1 0.852975 +INFO arabiner.trainers.BaseTrainer Tue, 26 Mar 2024 18:37:27 Saving checkpoint to /var/home/nhamad/SharedTask2024/nested-final2/output-nested/checkpoints/checkpoint_1.pt +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:37:32 Epoch 2 | Batch 8/2891 | Timestep 5790 | LR 0.0001000000 | Loss 0.043201 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:37:34 Epoch 2 | Batch 18/2891 | Timestep 5800 | LR 0.0001000000 | Loss 0.038592 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:37:36 Epoch 2 | Batch 28/2891 | Timestep 5810 | LR 0.0001000000 | Loss 0.043278 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:37:38 Epoch 2 | Batch 38/2891 | Timestep 5820 | LR 0.0001000000 | Loss 0.012632 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:37:40 Epoch 2 | Batch 48/2891 | Timestep 5830 | LR 0.0001000000 | Loss 0.085904 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:37:42 Epoch 2 | Batch 58/2891 | Timestep 5840 | LR 0.0001000000 | Loss 0.015090 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:37:45 Epoch 2 | Batch 68/2891 | Timestep 5850 | LR 0.0001000000 | Loss 0.024394 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:37:47 Epoch 2 | Batch 78/2891 | Timestep 5860 | LR 0.0001000000 | Loss 0.059680 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:37:49 Epoch 2 | Batch 88/2891 | Timestep 5870 | LR 0.0001000000 | Loss 0.025954 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:37:51 Epoch 2 | Batch 98/2891 | Timestep 5880 | LR 0.0001000000 | Loss 0.016685 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:37:53 Epoch 2 | Batch 108/2891 | Timestep 5890 | LR 0.0001000000 | Loss 0.033743 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:37:55 Epoch 2 | Batch 118/2891 | Timestep 5900 | LR 0.0001000000 | Loss 0.031726 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:37:57 Epoch 2 | Batch 128/2891 | Timestep 5910 | LR 0.0001000000 | Loss 0.141045 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:38:00 Epoch 2 | Batch 138/2891 | Timestep 5920 | LR 0.0001000000 | Loss 0.117357 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:38:02 Epoch 2 | Batch 148/2891 | Timestep 5930 | LR 0.0001000000 | Loss 0.004273 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:38:04 Epoch 2 | Batch 158/2891 | Timestep 5940 | LR 0.0001000000 | Loss 0.044286 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:38:06 Epoch 2 | Batch 168/2891 | Timestep 5950 | LR 0.0001000000 | Loss 0.015636 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:38:08 Epoch 2 | Batch 178/2891 | Timestep 5960 | LR 0.0001000000 | Loss 0.033089 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:38:10 Epoch 2 | Batch 188/2891 | Timestep 5970 | LR 0.0001000000 | Loss 0.024998 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:38:13 Epoch 2 | Batch 198/2891 | Timestep 5980 | LR 0.0001000000 | Loss 0.122456 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:38:15 Epoch 2 | Batch 208/2891 | Timestep 5990 | LR 0.0001000000 | Loss 0.042996 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:38:17 Epoch 2 | Batch 218/2891 | Timestep 6000 | LR 0.0001000000 | Loss 0.062963 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:38:19 Epoch 2 | Batch 228/2891 | Timestep 6010 | LR 0.0001000000 | Loss 0.182980 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:38:21 Epoch 2 | Batch 238/2891 | Timestep 6020 | LR 0.0001000000 | Loss 0.165977 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:38:24 Epoch 2 | Batch 248/2891 | Timestep 6030 | LR 0.0001000000 | Loss 0.096724 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:38:26 Epoch 2 | Batch 258/2891 | Timestep 6040 | LR 0.0001000000 | Loss 0.009109 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:38:28 Epoch 2 | Batch 268/2891 | Timestep 6050 | LR 0.0001000000 | Loss 0.053594 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:38:30 Epoch 2 | Batch 278/2891 | Timestep 6060 | LR 0.0001000000 | Loss 0.053958 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:38:32 Epoch 2 | Batch 288/2891 | Timestep 6070 | LR 0.0001000000 | Loss 0.182725 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:38:34 Epoch 2 | Batch 298/2891 | Timestep 6080 | LR 0.0001000000 | Loss 0.020082 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:38:36 Epoch 2 | Batch 308/2891 | Timestep 6090 | LR 0.0001000000 | Loss 0.045052 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:38:39 Epoch 2 | Batch 318/2891 | Timestep 6100 | LR 0.0001000000 | Loss 0.025577 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:38:41 Epoch 2 | Batch 328/2891 | Timestep 6110 | LR 0.0001000000 | Loss 0.088650 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:38:43 Epoch 2 | Batch 338/2891 | Timestep 6120 | LR 0.0001000000 | Loss 0.009536 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:38:45 Epoch 2 | Batch 348/2891 | Timestep 6130 | LR 0.0001000000 | Loss 0.018005 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:38:47 Epoch 2 | Batch 358/2891 | Timestep 6140 | LR 0.0001000000 | Loss 0.007728 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:38:50 Epoch 2 | Batch 368/2891 | Timestep 6150 | LR 0.0001000000 | Loss 0.060174 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:38:52 Epoch 2 | Batch 378/2891 | Timestep 6160 | LR 0.0001000000 | Loss 0.013156 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:38:54 Epoch 2 | Batch 388/2891 | Timestep 6170 | LR 0.0001000000 | Loss 0.003222 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:38:56 Epoch 2 | Batch 398/2891 | Timestep 6180 | LR 0.0001000000 | Loss 0.056121 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:38:58 Epoch 2 | Batch 408/2891 | Timestep 6190 | LR 0.0001000000 | Loss 0.002475 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:39:00 Epoch 2 | Batch 418/2891 | Timestep 6200 | LR 0.0001000000 | Loss 0.082068 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:39:02 Epoch 2 | Batch 428/2891 | Timestep 6210 | LR 0.0001000000 | Loss 0.132854 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:39:04 Epoch 2 | Batch 438/2891 | Timestep 6220 | LR 0.0001000000 | Loss 0.008778 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:39:07 Epoch 2 | Batch 448/2891 | Timestep 6230 | LR 0.0001000000 | Loss 0.037329 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:39:09 Epoch 2 | Batch 458/2891 | Timestep 6240 | LR 0.0001000000 | Loss 0.005260 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:39:11 Epoch 2 | Batch 468/2891 | Timestep 6250 | LR 0.0001000000 | Loss 0.020666 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:39:13 Epoch 2 | Batch 478/2891 | Timestep 6260 | LR 0.0001000000 | Loss 0.038144 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:39:16 Epoch 2 | Batch 488/2891 | Timestep 6270 | LR 0.0001000000 | Loss 0.080087 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:39:18 Epoch 2 | Batch 498/2891 | Timestep 6280 | LR 0.0001000000 | Loss 0.005841 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:39:20 Epoch 2 | Batch 508/2891 | Timestep 6290 | LR 0.0001000000 | Loss 0.036911 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:39:22 Epoch 2 | Batch 518/2891 | Timestep 6300 | LR 0.0001000000 | Loss 0.079322 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:39:24 Epoch 2 | Batch 528/2891 | Timestep 6310 | LR 0.0001000000 | Loss 0.084704 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:39:27 Epoch 2 | Batch 538/2891 | Timestep 6320 | LR 0.0001000000 | Loss 0.082603 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:39:29 Epoch 2 | Batch 548/2891 | Timestep 6330 | LR 0.0001000000 | Loss 0.051540 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:39:32 Epoch 2 | Batch 558/2891 | Timestep 6340 | LR 0.0001000000 | Loss 0.082706 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:39:34 Epoch 2 | Batch 568/2891 | Timestep 6350 | LR 0.0001000000 | Loss 0.030020 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:39:36 Epoch 2 | Batch 578/2891 | Timestep 6360 | LR 0.0001000000 | Loss 0.030235 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:39:38 Epoch 2 | Batch 588/2891 | Timestep 6370 | LR 0.0001000000 | Loss 0.058641 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:39:41 Epoch 2 | Batch 598/2891 | Timestep 6380 | LR 0.0001000000 | Loss 0.071559 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:39:43 Epoch 2 | Batch 608/2891 | Timestep 6390 | LR 0.0001000000 | Loss 0.084203 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:39:45 Epoch 2 | Batch 618/2891 | Timestep 6400 | LR 0.0001000000 | Loss 0.120401 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:39:47 Epoch 2 | Batch 628/2891 | Timestep 6410 | LR 0.0001000000 | Loss 0.021170 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:39:49 Epoch 2 | Batch 638/2891 | Timestep 6420 | LR 0.0001000000 | Loss 0.005764 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:39:51 Epoch 2 | Batch 648/2891 | Timestep 6430 | LR 0.0001000000 | Loss 0.068861 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:39:53 Epoch 2 | Batch 658/2891 | Timestep 6440 | LR 0.0001000000 | Loss 0.075080 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:39:55 Epoch 2 | Batch 668/2891 | Timestep 6450 | LR 0.0001000000 | Loss 0.023798 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:39:58 Epoch 2 | Batch 678/2891 | Timestep 6460 | LR 0.0001000000 | Loss 0.071979 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:40:00 Epoch 2 | Batch 688/2891 | Timestep 6470 | LR 0.0001000000 | Loss 0.080267 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:40:02 Epoch 2 | Batch 698/2891 | Timestep 6480 | LR 0.0001000000 | Loss 0.029244 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:40:04 Epoch 2 | Batch 708/2891 | Timestep 6490 | LR 0.0001000000 | Loss 0.067473 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:40:07 Epoch 2 | Batch 718/2891 | Timestep 6500 | LR 0.0001000000 | Loss 0.018694 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:40:09 Epoch 2 | Batch 728/2891 | Timestep 6510 | LR 0.0001000000 | Loss 0.018783 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:40:11 Epoch 2 | Batch 738/2891 | Timestep 6520 | LR 0.0001000000 | Loss 0.057583 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:40:13 Epoch 2 | Batch 748/2891 | Timestep 6530 | LR 0.0001000000 | Loss 0.025600 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:40:15 Epoch 2 | Batch 758/2891 | Timestep 6540 | LR 0.0001000000 | Loss 0.026151 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:40:17 Epoch 2 | Batch 768/2891 | Timestep 6550 | LR 0.0001000000 | Loss 0.060107 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:40:20 Epoch 2 | Batch 778/2891 | Timestep 6560 | LR 0.0001000000 | Loss 0.020011 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:40:22 Epoch 2 | Batch 788/2891 | Timestep 6570 | LR 0.0001000000 | Loss 0.063073 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:40:24 Epoch 2 | Batch 798/2891 | Timestep 6580 | LR 0.0001000000 | Loss 0.123383 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:40:26 Epoch 2 | Batch 808/2891 | Timestep 6590 | LR 0.0001000000 | Loss 0.108568 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:40:29 Epoch 2 | Batch 818/2891 | Timestep 6600 | LR 0.0001000000 | Loss 0.027607 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:40:31 Epoch 2 | Batch 828/2891 | Timestep 6610 | LR 0.0001000000 | Loss 0.036116 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:40:33 Epoch 2 | Batch 838/2891 | Timestep 6620 | LR 0.0001000000 | Loss 0.174772 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:40:36 Epoch 2 | Batch 848/2891 | Timestep 6630 | LR 0.0001000000 | Loss 0.071491 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:40:38 Epoch 2 | Batch 858/2891 | Timestep 6640 | LR 0.0001000000 | Loss 0.062629 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:40:40 Epoch 2 | Batch 868/2891 | Timestep 6650 | LR 0.0001000000 | Loss 0.034993 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:40:43 Epoch 2 | Batch 878/2891 | Timestep 6660 | LR 0.0001000000 | Loss 0.092563 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:40:44 Epoch 2 | Batch 888/2891 | Timestep 6670 | LR 0.0001000000 | Loss 0.052118 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:40:47 Epoch 2 | Batch 898/2891 | Timestep 6680 | LR 0.0001000000 | Loss 0.054803 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:40:49 Epoch 2 | Batch 908/2891 | Timestep 6690 | LR 0.0001000000 | Loss 0.013118 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:40:51 Epoch 2 | Batch 918/2891 | Timestep 6700 | LR 0.0001000000 | Loss 0.037047 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:40:53 Epoch 2 | Batch 928/2891 | Timestep 6710 | LR 0.0001000000 | Loss 0.228605 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:40:56 Epoch 2 | Batch 938/2891 | Timestep 6720 | LR 0.0001000000 | Loss 0.010286 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:40:58 Epoch 2 | Batch 948/2891 | Timestep 6730 | LR 0.0001000000 | Loss 0.067900 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:41:00 Epoch 2 | Batch 958/2891 | Timestep 6740 | LR 0.0001000000 | Loss 0.034599 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:41:02 Epoch 2 | Batch 968/2891 | Timestep 6750 | LR 0.0001000000 | Loss 0.058182 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:41:04 Epoch 2 | Batch 978/2891 | Timestep 6760 | LR 0.0001000000 | Loss 0.024057 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:41:06 Epoch 2 | Batch 988/2891 | Timestep 6770 | LR 0.0001000000 | Loss 0.009735 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:41:08 Epoch 2 | Batch 998/2891 | Timestep 6780 | LR 0.0001000000 | Loss 0.043674 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:41:11 Epoch 2 | Batch 1008/2891 | Timestep 6790 | LR 0.0001000000 | Loss 0.034678 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:41:13 Epoch 2 | Batch 1018/2891 | Timestep 6800 | LR 0.0001000000 | Loss 0.015630 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:41:15 Epoch 2 | Batch 1028/2891 | Timestep 6810 | LR 0.0001000000 | Loss 0.056287 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:41:17 Epoch 2 | Batch 1038/2891 | Timestep 6820 | LR 0.0001000000 | Loss 0.087857 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:41:20 Epoch 2 | Batch 1048/2891 | Timestep 6830 | LR 0.0001000000 | Loss 0.066154 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:41:22 Epoch 2 | Batch 1058/2891 | Timestep 6840 | LR 0.0001000000 | Loss 0.007577 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:41:24 Epoch 2 | Batch 1068/2891 | Timestep 6850 | LR 0.0001000000 | Loss 0.017081 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:41:26 Epoch 2 | Batch 1078/2891 | Timestep 6860 | LR 0.0001000000 | Loss 0.160445 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:41:29 Epoch 2 | Batch 1088/2891 | Timestep 6870 | LR 0.0001000000 | Loss 0.019105 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:41:31 Epoch 2 | Batch 1098/2891 | Timestep 6880 | LR 0.0001000000 | Loss 0.008051 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:41:33 Epoch 2 | Batch 1108/2891 | Timestep 6890 | LR 0.0001000000 | Loss 0.118993 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:41:35 Epoch 2 | Batch 1118/2891 | Timestep 6900 | LR 0.0001000000 | Loss 0.022946 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:41:37 Epoch 2 | Batch 1128/2891 | Timestep 6910 | LR 0.0001000000 | Loss 0.040865 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:41:39 Epoch 2 | Batch 1138/2891 | Timestep 6920 | LR 0.0001000000 | Loss 0.030336 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:41:41 Epoch 2 | Batch 1148/2891 | Timestep 6930 | LR 0.0001000000 | Loss 0.066639 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:41:44 Epoch 2 | Batch 1158/2891 | Timestep 6940 | LR 0.0001000000 | Loss 0.028034 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:41:46 Epoch 2 | Batch 1168/2891 | Timestep 6950 | LR 0.0001000000 | Loss 0.049963 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:41:48 Epoch 2 | Batch 1178/2891 | Timestep 6960 | LR 0.0001000000 | Loss 0.088921 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:41:50 Epoch 2 | Batch 1188/2891 | Timestep 6970 | LR 0.0001000000 | Loss 0.017663 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:41:52 Epoch 2 | Batch 1198/2891 | Timestep 6980 | LR 0.0001000000 | Loss 0.207712 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:41:55 Epoch 2 | Batch 1208/2891 | Timestep 6990 | LR 0.0001000000 | Loss 0.015034 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:41:57 Epoch 2 | Batch 1218/2891 | Timestep 7000 | LR 0.0001000000 | Loss 0.015604 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:41:59 Epoch 2 | Batch 1228/2891 | Timestep 7010 | LR 0.0001000000 | Loss 0.106924 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:42:01 Epoch 2 | Batch 1238/2891 | Timestep 7020 | LR 0.0001000000 | Loss 0.047885 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:42:03 Epoch 2 | Batch 1248/2891 | Timestep 7030 | LR 0.0001000000 | Loss 0.084388 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:42:05 Epoch 2 | Batch 1258/2891 | Timestep 7040 | LR 0.0001000000 | Loss 0.277071 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:42:07 Epoch 2 | Batch 1268/2891 | Timestep 7050 | LR 0.0001000000 | Loss 0.057222 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:42:09 Epoch 2 | Batch 1278/2891 | Timestep 7060 | LR 0.0001000000 | Loss 0.253687 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:42:11 Epoch 2 | Batch 1288/2891 | Timestep 7070 | LR 0.0001000000 | Loss 0.042174 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:42:13 Epoch 2 | Batch 1298/2891 | Timestep 7080 | LR 0.0001000000 | Loss 0.019723 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:42:15 Epoch 2 | Batch 1308/2891 | Timestep 7090 | LR 0.0001000000 | Loss 0.024288 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:42:18 Epoch 2 | Batch 1318/2891 | Timestep 7100 | LR 0.0001000000 | Loss 2.681532 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:42:20 Epoch 2 | Batch 1328/2891 | Timestep 7110 | LR 0.0001000000 | Loss 0.160813 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:42:22 Epoch 2 | Batch 1338/2891 | Timestep 7120 | LR 0.0001000000 | Loss 0.045212 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:42:24 Epoch 2 | Batch 1348/2891 | Timestep 7130 | LR 0.0001000000 | Loss 0.203057 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:42:26 Epoch 2 | Batch 1358/2891 | Timestep 7140 | LR 0.0001000000 | Loss 1.871201 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:42:28 Epoch 2 | Batch 1368/2891 | Timestep 7150 | LR 0.0001000000 | Loss 0.084230 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:42:30 Epoch 2 | Batch 1378/2891 | Timestep 7160 | LR 0.0001000000 | Loss 0.047372 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:42:32 Epoch 2 | Batch 1388/2891 | Timestep 7170 | LR 0.0001000000 | Loss 0.068959 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:42:34 Epoch 2 | Batch 1398/2891 | Timestep 7180 | LR 0.0001000000 | Loss 0.022324 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:42:37 Epoch 2 | Batch 1408/2891 | Timestep 7190 | LR 0.0001000000 | Loss 0.051699 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:42:39 Epoch 2 | Batch 1418/2891 | Timestep 7200 | LR 0.0001000000 | Loss 0.054036 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:42:41 Epoch 2 | Batch 1428/2891 | Timestep 7210 | LR 0.0001000000 | Loss 0.054635 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:42:43 Epoch 2 | Batch 1438/2891 | Timestep 7220 | LR 0.0001000000 | Loss 0.033887 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:42:45 Epoch 2 | Batch 1448/2891 | Timestep 7230 | LR 0.0001000000 | Loss 0.064133 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:42:47 Epoch 2 | Batch 1458/2891 | Timestep 7240 | LR 0.0001000000 | Loss 0.070174 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:42:49 Epoch 2 | Batch 1468/2891 | Timestep 7250 | LR 0.0001000000 | Loss 0.079678 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:42:51 Epoch 2 | Batch 1478/2891 | Timestep 7260 | LR 0.0001000000 | Loss 0.011933 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:42:53 Epoch 2 | Batch 1488/2891 | Timestep 7270 | LR 0.0001000000 | Loss 0.038188 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:42:56 Epoch 2 | Batch 1498/2891 | Timestep 7280 | LR 0.0001000000 | Loss 0.038575 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:42:58 Epoch 2 | Batch 1508/2891 | Timestep 7290 | LR 0.0001000000 | Loss 0.053411 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:43:00 Epoch 2 | Batch 1518/2891 | Timestep 7300 | LR 0.0001000000 | Loss 0.029196 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:43:02 Epoch 2 | Batch 1528/2891 | Timestep 7310 | LR 0.0001000000 | Loss 0.096897 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:43:04 Epoch 2 | Batch 1538/2891 | Timestep 7320 | LR 0.0001000000 | Loss 0.075534 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:43:06 Epoch 2 | Batch 1548/2891 | Timestep 7330 | LR 0.0001000000 | Loss 0.074868 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:43:09 Epoch 2 | Batch 1558/2891 | Timestep 7340 | LR 0.0001000000 | Loss 0.059152 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:43:11 Epoch 2 | Batch 1568/2891 | Timestep 7350 | LR 0.0001000000 | Loss 0.026888 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:43:13 Epoch 2 | Batch 1578/2891 | Timestep 7360 | LR 0.0001000000 | Loss 0.060182 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:43:15 Epoch 2 | Batch 1588/2891 | Timestep 7370 | LR 0.0001000000 | Loss 0.016610 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:43:18 Epoch 2 | Batch 1598/2891 | Timestep 7380 | LR 0.0001000000 | Loss 0.026846 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:43:20 Epoch 2 | Batch 1608/2891 | Timestep 7390 | LR 0.0001000000 | Loss 0.138872 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:43:22 Epoch 2 | Batch 1618/2891 | Timestep 7400 | LR 0.0001000000 | Loss 0.017165 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:43:24 Epoch 2 | Batch 1628/2891 | Timestep 7410 | LR 0.0001000000 | Loss 0.038768 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:43:26 Epoch 2 | Batch 1638/2891 | Timestep 7420 | LR 0.0001000000 | Loss 0.037094 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:43:29 Epoch 2 | Batch 1648/2891 | Timestep 7430 | LR 0.0001000000 | Loss 0.027986 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:43:31 Epoch 2 | Batch 1658/2891 | Timestep 7440 | LR 0.0001000000 | Loss 0.017891 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:43:33 Epoch 2 | Batch 1668/2891 | Timestep 7450 | LR 0.0001000000 | Loss 0.029219 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:43:35 Epoch 2 | Batch 1678/2891 | Timestep 7460 | LR 0.0001000000 | Loss 0.033660 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:43:38 Epoch 2 | Batch 1688/2891 | Timestep 7470 | LR 0.0001000000 | Loss 0.143307 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:43:39 Epoch 2 | Batch 1698/2891 | Timestep 7480 | LR 0.0001000000 | Loss 0.010062 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:43:42 Epoch 2 | Batch 1708/2891 | Timestep 7490 | LR 0.0001000000 | Loss 0.085199 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:43:44 Epoch 2 | Batch 1718/2891 | Timestep 7500 | LR 0.0001000000 | Loss 0.063226 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:43:46 Epoch 2 | Batch 1728/2891 | Timestep 7510 | LR 0.0001000000 | Loss 0.036135 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:43:48 Epoch 2 | Batch 1738/2891 | Timestep 7520 | LR 0.0001000000 | Loss 0.048134 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:43:51 Epoch 2 | Batch 1748/2891 | Timestep 7530 | LR 0.0001000000 | Loss 0.007800 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:43:52 Epoch 2 | Batch 1758/2891 | Timestep 7540 | LR 0.0001000000 | Loss 0.172429 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:43:54 Epoch 2 | Batch 1768/2891 | Timestep 7550 | LR 0.0001000000 | Loss 0.031158 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:43:57 Epoch 2 | Batch 1778/2891 | Timestep 7560 | LR 0.0001000000 | Loss 0.017500 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:43:59 Epoch 2 | Batch 1788/2891 | Timestep 7570 | LR 0.0001000000 | Loss 0.027404 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:44:01 Epoch 2 | Batch 1798/2891 | Timestep 7580 | LR 0.0001000000 | Loss 0.132223 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:44:03 Epoch 2 | Batch 1808/2891 | Timestep 7590 | LR 0.0001000000 | Loss 0.242064 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:44:06 Epoch 2 | Batch 1818/2891 | Timestep 7600 | LR 0.0001000000 | Loss 0.137956 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:44:08 Epoch 2 | Batch 1828/2891 | Timestep 7610 | LR 0.0001000000 | Loss 0.178223 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:44:10 Epoch 2 | Batch 1838/2891 | Timestep 7620 | LR 0.0001000000 | Loss 0.184309 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:44:12 Epoch 2 | Batch 1848/2891 | Timestep 7630 | LR 0.0001000000 | Loss 0.128382 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:44:15 Epoch 2 | Batch 1858/2891 | Timestep 7640 | LR 0.0001000000 | Loss 0.019296 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:44:17 Epoch 2 | Batch 1868/2891 | Timestep 7650 | LR 0.0001000000 | Loss 0.127945 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:44:19 Epoch 2 | Batch 1878/2891 | Timestep 7660 | LR 0.0001000000 | Loss 0.026972 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:44:21 Epoch 2 | Batch 1888/2891 | Timestep 7670 | LR 0.0001000000 | Loss 0.040871 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:44:23 Epoch 2 | Batch 1898/2891 | Timestep 7680 | LR 0.0001000000 | Loss 0.444625 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:44:25 Epoch 2 | Batch 1908/2891 | Timestep 7690 | LR 0.0001000000 | Loss 0.091180 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:44:28 Epoch 2 | Batch 1918/2891 | Timestep 7700 | LR 0.0001000000 | Loss 0.031019 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:44:30 Epoch 2 | Batch 1928/2891 | Timestep 7710 | LR 0.0001000000 | Loss 0.083719 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:44:32 Epoch 2 | Batch 1938/2891 | Timestep 7720 | LR 0.0001000000 | Loss 0.018870 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:44:34 Epoch 2 | Batch 1948/2891 | Timestep 7730 | LR 0.0001000000 | Loss 0.027253 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:44:36 Epoch 2 | Batch 1958/2891 | Timestep 7740 | LR 0.0001000000 | Loss 0.033875 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:44:38 Epoch 2 | Batch 1968/2891 | Timestep 7750 | LR 0.0001000000 | Loss 0.088596 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:44:40 Epoch 2 | Batch 1978/2891 | Timestep 7760 | LR 0.0001000000 | Loss 0.009131 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:44:42 Epoch 2 | Batch 1988/2891 | Timestep 7770 | LR 0.0001000000 | Loss 0.058000 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:44:45 Epoch 2 | Batch 1998/2891 | Timestep 7780 | LR 0.0001000000 | Loss 0.023226 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:44:48 Epoch 2 | Batch 2008/2891 | Timestep 7790 | LR 0.0001000000 | Loss 0.138828 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:44:49 Epoch 2 | Batch 2018/2891 | Timestep 7800 | LR 0.0001000000 | Loss 0.029868 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:44:52 Epoch 2 | Batch 2028/2891 | Timestep 7810 | LR 0.0001000000 | Loss 0.144663 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:44:54 Epoch 2 | Batch 2038/2891 | Timestep 7820 | LR 0.0001000000 | Loss 0.019030 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:44:56 Epoch 2 | Batch 2048/2891 | Timestep 7830 | LR 0.0001000000 | Loss 0.020645 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:44:59 Epoch 2 | Batch 2058/2891 | Timestep 7840 | LR 0.0001000000 | Loss 0.058452 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:45:01 Epoch 2 | Batch 2068/2891 | Timestep 7850 | LR 0.0001000000 | Loss 0.078382 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:45:04 Epoch 2 | Batch 2078/2891 | Timestep 7860 | LR 0.0001000000 | Loss 0.204983 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:45:06 Epoch 2 | Batch 2088/2891 | Timestep 7870 | LR 0.0001000000 | Loss 0.017475 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:45:08 Epoch 2 | Batch 2098/2891 | Timestep 7880 | LR 0.0001000000 | Loss 0.046326 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:45:11 Epoch 2 | Batch 2108/2891 | Timestep 7890 | LR 0.0001000000 | Loss 0.015354 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:45:14 Epoch 2 | Batch 2118/2891 | Timestep 7900 | LR 0.0001000000 | Loss 0.070028 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:45:16 Epoch 2 | Batch 2128/2891 | Timestep 7910 | LR 0.0001000000 | Loss 0.089433 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:45:18 Epoch 2 | Batch 2138/2891 | Timestep 7920 | LR 0.0001000000 | Loss 0.048420 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:45:21 Epoch 2 | Batch 2148/2891 | Timestep 7930 | LR 0.0001000000 | Loss 0.117035 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:45:23 Epoch 2 | Batch 2158/2891 | Timestep 7940 | LR 0.0001000000 | Loss 0.077718 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:45:25 Epoch 2 | Batch 2168/2891 | Timestep 7950 | LR 0.0001000000 | Loss 0.107945 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:45:27 Epoch 2 | Batch 2178/2891 | Timestep 7960 | LR 0.0001000000 | Loss 0.064827 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:45:30 Epoch 2 | Batch 2188/2891 | Timestep 7970 | LR 0.0001000000 | Loss 0.045221 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:45:32 Epoch 2 | Batch 2198/2891 | Timestep 7980 | LR 0.0001000000 | Loss 0.103743 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:45:34 Epoch 2 | Batch 2208/2891 | Timestep 7990 | LR 0.0001000000 | Loss 0.014394 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:45:36 Epoch 2 | Batch 2218/2891 | Timestep 8000 | LR 0.0001000000 | Loss 0.113828 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:45:38 Epoch 2 | Batch 2228/2891 | Timestep 8010 | LR 0.0001000000 | Loss 0.093827 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:45:40 Epoch 2 | Batch 2238/2891 | Timestep 8020 | LR 0.0001000000 | Loss 0.035340 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:45:42 Epoch 2 | Batch 2248/2891 | Timestep 8030 | LR 0.0001000000 | Loss 0.024066 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:45:45 Epoch 2 | Batch 2258/2891 | Timestep 8040 | LR 0.0001000000 | Loss 0.018893 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:45:47 Epoch 2 | Batch 2268/2891 | Timestep 8050 | LR 0.0001000000 | Loss 0.109604 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:45:49 Epoch 2 | Batch 2278/2891 | Timestep 8060 | LR 0.0001000000 | Loss 0.145936 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:45:52 Epoch 2 | Batch 2288/2891 | Timestep 8070 | LR 0.0001000000 | Loss 0.030518 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:45:54 Epoch 2 | Batch 2298/2891 | Timestep 8080 | LR 0.0001000000 | Loss 0.028626 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:45:56 Epoch 2 | Batch 2308/2891 | Timestep 8090 | LR 0.0001000000 | Loss 0.121032 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:45:58 Epoch 2 | Batch 2318/2891 | Timestep 8100 | LR 0.0001000000 | Loss 0.058451 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:46:00 Epoch 2 | Batch 2328/2891 | Timestep 8110 | LR 0.0001000000 | Loss 0.014991 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:46:02 Epoch 2 | Batch 2338/2891 | Timestep 8120 | LR 0.0001000000 | Loss 0.024297 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:46:04 Epoch 2 | Batch 2348/2891 | Timestep 8130 | LR 0.0001000000 | Loss 0.070937 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:46:06 Epoch 2 | Batch 2358/2891 | Timestep 8140 | LR 0.0001000000 | Loss 0.039426 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:46:08 Epoch 2 | Batch 2368/2891 | Timestep 8150 | LR 0.0001000000 | Loss 0.040665 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:46:11 Epoch 2 | Batch 2378/2891 | Timestep 8160 | LR 0.0001000000 | Loss 0.126794 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:46:12 Epoch 2 | Batch 2388/2891 | Timestep 8170 | LR 0.0001000000 | Loss 0.046740 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:46:15 Epoch 2 | Batch 2398/2891 | Timestep 8180 | LR 0.0001000000 | Loss 0.051701 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:46:17 Epoch 2 | Batch 2408/2891 | Timestep 8190 | LR 0.0001000000 | Loss 0.017596 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:46:19 Epoch 2 | Batch 2418/2891 | Timestep 8200 | LR 0.0001000000 | Loss 0.021376 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:46:21 Epoch 2 | Batch 2428/2891 | Timestep 8210 | LR 0.0001000000 | Loss 0.051713 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:46:23 Epoch 2 | Batch 2438/2891 | Timestep 8220 | LR 0.0001000000 | Loss 0.057072 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:46:25 Epoch 2 | Batch 2448/2891 | Timestep 8230 | LR 0.0001000000 | Loss 0.094931 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:46:28 Epoch 2 | Batch 2458/2891 | Timestep 8240 | LR 0.0001000000 | Loss 0.038530 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:46:30 Epoch 2 | Batch 2468/2891 | Timestep 8250 | LR 0.0001000000 | Loss 0.082270 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:46:32 Epoch 2 | Batch 2478/2891 | Timestep 8260 | LR 0.0001000000 | Loss 0.030557 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:46:34 Epoch 2 | Batch 2488/2891 | Timestep 8270 | LR 0.0001000000 | Loss 0.150966 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:46:37 Epoch 2 | Batch 2498/2891 | Timestep 8280 | LR 0.0001000000 | Loss 0.007534 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:46:39 Epoch 2 | Batch 2508/2891 | Timestep 8290 | LR 0.0001000000 | Loss 0.121672 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:46:41 Epoch 2 | Batch 2518/2891 | Timestep 8300 | LR 0.0001000000 | Loss 0.097070 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:46:43 Epoch 2 | Batch 2528/2891 | Timestep 8310 | LR 0.0001000000 | Loss 0.048639 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:46:46 Epoch 2 | Batch 2538/2891 | Timestep 8320 | LR 0.0001000000 | Loss 0.029463 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:46:48 Epoch 2 | Batch 2548/2891 | Timestep 8330 | LR 0.0001000000 | Loss 0.007944 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:46:50 Epoch 2 | Batch 2558/2891 | Timestep 8340 | LR 0.0001000000 | Loss 0.010268 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:46:52 Epoch 2 | Batch 2568/2891 | Timestep 8350 | LR 0.0001000000 | Loss 0.012203 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:46:55 Epoch 2 | Batch 2578/2891 | Timestep 8360 | LR 0.0001000000 | Loss 0.073465 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:46:57 Epoch 2 | Batch 2588/2891 | Timestep 8370 | LR 0.0001000000 | Loss 0.022780 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:46:59 Epoch 2 | Batch 2598/2891 | Timestep 8380 | LR 0.0001000000 | Loss 0.034272 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:47:01 Epoch 2 | Batch 2608/2891 | Timestep 8390 | LR 0.0001000000 | Loss 0.314180 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:47:03 Epoch 2 | Batch 2618/2891 | Timestep 8400 | LR 0.0001000000 | Loss 0.015608 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:47:06 Epoch 2 | Batch 2628/2891 | Timestep 8410 | LR 0.0001000000 | Loss 0.015830 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:47:08 Epoch 2 | Batch 2638/2891 | Timestep 8420 | LR 0.0001000000 | Loss 0.040386 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:47:10 Epoch 2 | Batch 2648/2891 | Timestep 8430 | LR 0.0001000000 | Loss 0.070202 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:47:12 Epoch 2 | Batch 2658/2891 | Timestep 8440 | LR 0.0001000000 | Loss 0.035550 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:47:14 Epoch 2 | Batch 2668/2891 | Timestep 8450 | LR 0.0001000000 | Loss 0.067636 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:47:17 Epoch 2 | Batch 2678/2891 | Timestep 8460 | LR 0.0001000000 | Loss 0.100428 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:47:18 Epoch 2 | Batch 2688/2891 | Timestep 8470 | LR 0.0001000000 | Loss 0.075809 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:47:20 Epoch 2 | Batch 2698/2891 | Timestep 8480 | LR 0.0001000000 | Loss 0.009862 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:47:23 Epoch 2 | Batch 2708/2891 | Timestep 8490 | LR 0.0001000000 | Loss 0.054308 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:47:25 Epoch 2 | Batch 2718/2891 | Timestep 8500 | LR 0.0001000000 | Loss 0.029840 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:47:27 Epoch 2 | Batch 2728/2891 | Timestep 8510 | LR 0.0001000000 | Loss 0.072844 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:47:29 Epoch 2 | Batch 2738/2891 | Timestep 8520 | LR 0.0001000000 | Loss 0.060537 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:47:31 Epoch 2 | Batch 2748/2891 | Timestep 8530 | LR 0.0001000000 | Loss 0.056881 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:47:33 Epoch 2 | Batch 2758/2891 | Timestep 8540 | LR 0.0001000000 | Loss 0.065981 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:47:35 Epoch 2 | Batch 2768/2891 | Timestep 8550 | LR 0.0001000000 | Loss 0.064355 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:47:37 Epoch 2 | Batch 2778/2891 | Timestep 8560 | LR 0.0001000000 | Loss 0.056600 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:47:39 Epoch 2 | Batch 2788/2891 | Timestep 8570 | LR 0.0001000000 | Loss 0.044637 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:47:41 Epoch 2 | Batch 2798/2891 | Timestep 8580 | LR 0.0001000000 | Loss 0.044019 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:47:44 Epoch 2 | Batch 2808/2891 | Timestep 8590 | LR 0.0001000000 | Loss 0.049000 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:47:46 Epoch 2 | Batch 2818/2891 | Timestep 8600 | LR 0.0001000000 | Loss 0.061683 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:47:48 Epoch 2 | Batch 2828/2891 | Timestep 8610 | LR 0.0001000000 | Loss 0.016867 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:47:50 Epoch 2 | Batch 2838/2891 | Timestep 8620 | LR 0.0001000000 | Loss 0.006245 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:47:52 Epoch 2 | Batch 2848/2891 | Timestep 8630 | LR 0.0001000000 | Loss 0.013429 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:47:55 Epoch 2 | Batch 2858/2891 | Timestep 8640 | LR 0.0001000000 | Loss 0.034790 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:47:57 Epoch 2 | Batch 2868/2891 | Timestep 8650 | LR 0.0001000000 | Loss 0.106114 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:47:59 Epoch 2 | Batch 2878/2891 | Timestep 8660 | LR 0.0001000000 | Loss 0.229911 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:48:01 Epoch 2 | Batch 2888/2891 | Timestep 8670 | LR 0.0001000000 | Loss 0.037440 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:48:02 ** Evaluating on validation dataset ** +INFO root Tue, 26 Mar 2024 18:49:22 + precision recall f1-score support + + BOUNDARY 0.0000 0.0000 0.0000 4 + BUILDING-OR-GROUNDS 0.5984 0.7019 0.6460 104 + CAMP 0.9571 0.9437 0.9504 71 + CARDINAL 0.8768 0.7118 0.7857 170 + CLUSTER 0.7273 0.6154 0.6667 26 + COM 0.3803 0.6923 0.4909 39 + CONTINENT 0.9583 1.0000 0.9787 23 + COUNTRY 0.9690 0.9737 0.9713 835 + CURR 0.9545 0.8750 0.9130 24 + DATE 0.9270 0.9243 0.9257 1691 + EDU 0.9159 0.8991 0.9074 109 + ENT 0.0000 0.0000 0.0000 1 + EVENT 0.6570 0.6233 0.6397 292 + FAC 0.6000 0.7838 0.6797 111 + GOV 0.8161 0.9081 0.8597 860 + GPE 0.9661 0.9695 0.9678 2261 + GPE_ORG 0.7923 0.8683 0.8286 167 + LAND-REGION-NATURAL 0.5000 0.1731 0.2571 52 + LANGUAGE 0.7059 0.7500 0.7273 16 + LAW 0.4773 0.8936 0.6222 47 + LOC 0.7227 0.6772 0.6992 127 + MED 0.9881 0.9881 0.9881 419 + MONEY 0.6800 0.7727 0.7234 22 + NEIGHBORHOOD 0.0000 0.0000 0.0000 5 + NONGOV 0.8581 0.8687 0.8634 571 + NORP 0.5997 0.6715 0.6336 551 + OCC 0.7570 0.8295 0.7916 522 + ORDINAL 0.8881 0.9485 0.9173 544 + ORG 0.8579 0.9274 0.8913 1790 + ORG_FAC 0.0000 0.0000 0.0000 7 + PATH 0.1538 0.3333 0.2105 6 + PERCENT 0.7143 0.8333 0.7692 12 + PERS 0.9262 0.9057 0.9159 679 + PRODUCT 0.4000 0.2500 0.3077 8 + QUANTITY 0.2222 0.6667 0.3333 3 + REGION-GENERAL 0.7941 0.7297 0.7606 37 +REGION-INTERNATIONAL 0.4444 0.6667 0.5333 12 + REL 0.5455 0.6000 0.5714 10 + SCI 0.1111 0.0769 0.0909 13 + SPO 0.0000 0.0000 0.0000 2 + SPORT 0.0000 0.0000 0.0000 4 + STATE-OR-PROVINCE 0.9277 0.8603 0.8928 179 + SUBAREA-FACILITY 0.4286 0.1875 0.2609 16 + TIME 0.6176 0.6364 0.6269 33 + TOWN 0.9652 0.9573 0.9612 1217 + UNIT 0.3750 0.7500 0.5000 4 + WATER-BODY 0.2692 0.5000 0.3500 14 + WEBSITE 0.3471 0.5250 0.4179 80 + + micro avg 0.8653 0.8943 0.8796 13790 + macro avg 0.5911 0.6348 0.6006 13790 + weighted avg 0.8710 0.8943 0.8809 13790 + +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:50:04 Epoch 2 | Timestep 8673 | Train Loss 0.097704 | Val Loss 0.084552 | F1 0.879569 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:50:04 ** Validation improved, evaluating test data ** +INFO arabiner.data.transforms Tue, 26 Mar 2024 18:50:08 Truncating the sequence لكن صوت جوالي مزعج ما دفعني للنهوض وبعصبية وارتباك من هذا الاتصال وخصوصا أن الساعة الواحدة والنصف يعنى عز دين النوم فأمسكت الجوال وقمت بالضغط على زر الرد . فقلت الو مين معي فقال معك الرئيس فقلت رئيس مين بالضبط فقال جورج بوش رئيس الولايات المتحدة الأمريكية فقلت اهلا أهلا يا سيادة الرئيس , بس أنا على حد علمي انه الرئيس جورج بوش بتكلم اللغة الانجليزية فكيف أنت بتحكي عربي بوش انأ بتكلم اللغة العربية جيدا حتى أنى ممكن أحكى باللهجة الغزواية . فقلت عليك اه خير شو مالك متصل فيا وكيف عرفت رقمي بوش ما في شي قلت أسال كيف أهل غزة بجو الحصار أما كيف عرفت رقمك فقلت لمديرة مكتبي أعطيني اتصال مباشر مع اى شخص من غزة فقلت غزة ااه بدك تعرف أخبار غزة صامدين صامدين ومش راح نتخلى عن الثوابت الفلسطينية لو شو ما تعملوا بوش يعنى بدك تقنعني انه ما فى نتيجة من الحصار فقلت لا ما في نتيجة لأنه إحنا بنخاف على بعض وبنحب بعض حتى رغيف الخبز مرات بنتقاسموا بوش اه واضح حتى التعذيب بتتقاسموه بالضفة وغزة فقلت يا عمى هيك عارف كل شى , شو بدك من الأخر لأني بدى أنام بوش شو رأيك تحضر مؤتمر انابولس فقلت احضر شو , شمعنا أنا يعني بوش هيك اجت فى بالى الفكرة فقلت لا لا مش فاضى , ميش مستعد اضيع وقتي في شي عارف نهايته بوش طيب تابعنا على التلفزيون منه بتعرف شو صار قلت صدقني وقتي فل , بكون بقرا بكتاب الجنة لا تبعد كثيرا بوش غريبة أول إنسان عربي ادعوه على المؤتمر ويكون وقته مشغول قلت شكلوا الكل مضيوف بالبيت الأبيض بوش اه مليان مش عارف أتحرك براحتي مخنوق فقلت اذا انت مخنوق شو نقول احنا بوش عارف بحاول معهم لكن لا حياة لمن تنادى من الطرفين وحابب اخذ رايك بالموضوع هل فى امل ? فقلت : رأي انك تستقيل قبل مؤتمر انابولس واكسب بياض الوجه وسيبك من الشرق الأوسط صدقني ما بتستاهلوا شي بوش : لا وحياتك راح يستقيل اولمرت وعباس اذا صار شي فقلت : اسمحي بدى أنام نعسان , بس دير بالك على العراق وأفغانستان اصلو بسمع انه في قتلي بشكل غريب بوش : وما تقلق راح أتوصي بإيران كويس وراح نعمل الوطن العربي كله سلطة قلت : طيب يالله سلام بوش : بس ما تنسانى قلت : له / هو فى حدا راح ينساك وانقطع حلمي برنه جوال حقيقة شرذمت ما تبقى من الحلم , فاعذروني فما هذه المكالمة إلا من عتمة أفكاري فأتمنى للرئيس عباس كل التوفيق وأرجو الا يكون هذا المؤتمر هو رحلة حب قصيرة الأمد . to 510 +INFO root Tue, 26 Mar 2024 18:51:11 Predictions written to /var/home/nhamad/SharedTask2024/nested-final2/output-nested/predictions.txt +INFO root Tue, 26 Mar 2024 18:52:44 + precision recall f1-score support + + AIRPORT 0.0000 0.0000 0.0000 1 + BOUNDARY 0.0000 0.0000 0.0000 3 + BUILDING-OR-GROUNDS 0.5980 0.5980 0.5980 204 + CAMP 0.8851 0.9167 0.9006 168 + CARDINAL 0.8940 0.7398 0.8096 342 + CELESTIAL 0.0000 0.0000 0.0000 2 + CLUSTER 0.6912 0.6104 0.6483 77 + COM 0.4494 0.7207 0.5536 111 + CONTINENT 0.9792 0.8246 0.8952 57 + COUNTRY 0.9645 0.9686 0.9665 1625 + CURR 1.0000 0.8537 0.9211 41 + DATE 0.9291 0.9361 0.9326 3206 + EDU 0.7731 0.8070 0.7897 228 + ENT 0.0000 0.0000 0.0000 1 + EVENT 0.6299 0.6421 0.6360 570 + FAC 0.6129 0.6816 0.6454 223 + GOV 0.8077 0.8992 0.8510 1696 + GPE 0.9531 0.9646 0.9589 4554 + GPE_ORG 0.8483 0.8431 0.8457 325 + LAND-REGION-NATURAL 0.5429 0.1610 0.2484 118 + LANGUAGE 0.7027 0.6047 0.6500 43 + LAW 0.5241 0.8444 0.6468 90 + LOC 0.7276 0.6655 0.6952 281 + MED 0.9864 0.9888 0.9876 807 + MONEY 0.6098 0.7576 0.6757 33 + NEIGHBORHOOD 0.1667 0.1000 0.1250 30 + NONGOV 0.8383 0.8514 0.8448 1151 + NORP 0.6272 0.7134 0.6675 1092 + OCC 0.7406 0.8178 0.7773 1103 + ORDINAL 0.8942 0.9603 0.9261 1083 + ORG 0.8442 0.9198 0.8804 3618 + ORG_FAC 0.0000 0.0000 0.0000 19 + PATH 0.3913 0.5000 0.4390 18 + PERCENT 0.6410 0.7576 0.6944 33 + PERS 0.8968 0.8814 0.8890 1568 + PRODUCT 0.4000 0.2105 0.2759 19 + QUANTITY 0.3529 0.6667 0.4615 9 + REGION-GENERAL 0.7407 0.5797 0.6504 69 +REGION-INTERNATIONAL 0.5000 0.6552 0.5672 29 + REL 0.8333 0.6000 0.6977 25 + SCI 0.1852 0.1724 0.1786 29 + SPO 0.0000 0.0000 0.0000 8 + SPORT 0.0000 0.0000 0.0000 1 + STATE-OR-PROVINCE 0.9062 0.8266 0.8646 421 + SUBAREA-FACILITY 0.1818 0.0870 0.1176 23 + TIME 0.5765 0.5833 0.5799 84 + TOWN 0.9559 0.9543 0.9551 2431 + UNIT 0.4000 0.7273 0.5161 11 + WATER-BODY 0.3243 0.5714 0.4138 21 + WEBSITE 0.3575 0.5948 0.4466 116 + + micro avg 0.8589 0.8873 0.8729 27817 + macro avg 0.5773 0.5952 0.5765 27817 + weighted avg 0.8622 0.8873 0.8730 27817 + +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:54:07 Epoch 2 | Timestep 8673 | Test Loss 0.092734 | F1 0.872869 +INFO arabiner.trainers.BaseTrainer Tue, 26 Mar 2024 18:54:07 Saving checkpoint to /var/home/nhamad/SharedTask2024/nested-final2/output-nested/checkpoints/checkpoint_2.pt +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:54:11 Epoch 3 | Batch 7/2891 | Timestep 8680 | LR 0.0001000000 | Loss 0.015435 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:54:13 Epoch 3 | Batch 17/2891 | Timestep 8690 | LR 0.0001000000 | Loss 0.014185 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:54:16 Epoch 3 | Batch 27/2891 | Timestep 8700 | LR 0.0001000000 | Loss 0.019916 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:54:18 Epoch 3 | Batch 37/2891 | Timestep 8710 | LR 0.0001000000 | Loss 0.020335 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:54:20 Epoch 3 | Batch 47/2891 | Timestep 8720 | LR 0.0001000000 | Loss 0.050067 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:54:22 Epoch 3 | Batch 57/2891 | Timestep 8730 | LR 0.0001000000 | Loss 0.047244 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:54:24 Epoch 3 | Batch 67/2891 | Timestep 8740 | LR 0.0001000000 | Loss 0.011177 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:54:27 Epoch 3 | Batch 77/2891 | Timestep 8750 | LR 0.0001000000 | Loss 0.055859 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:54:29 Epoch 3 | Batch 87/2891 | Timestep 8760 | LR 0.0001000000 | Loss 0.020530 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:54:31 Epoch 3 | Batch 97/2891 | Timestep 8770 | LR 0.0001000000 | Loss 0.046536 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:54:33 Epoch 3 | Batch 107/2891 | Timestep 8780 | LR 0.0001000000 | Loss 0.034109 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:54:35 Epoch 3 | Batch 117/2891 | Timestep 8790 | LR 0.0001000000 | Loss 0.021251 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:54:37 Epoch 3 | Batch 127/2891 | Timestep 8800 | LR 0.0001000000 | Loss 0.045419 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:54:39 Epoch 3 | Batch 137/2891 | Timestep 8810 | LR 0.0001000000 | Loss 0.074090 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:54:41 Epoch 3 | Batch 147/2891 | Timestep 8820 | LR 0.0001000000 | Loss 0.050367 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:54:43 Epoch 3 | Batch 157/2891 | Timestep 8830 | LR 0.0001000000 | Loss 0.094764 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:54:46 Epoch 3 | Batch 167/2891 | Timestep 8840 | LR 0.0001000000 | Loss 0.013827 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:54:48 Epoch 3 | Batch 177/2891 | Timestep 8850 | LR 0.0001000000 | Loss 0.020639 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:54:50 Epoch 3 | Batch 187/2891 | Timestep 8860 | LR 0.0001000000 | Loss 0.074818 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:54:52 Epoch 3 | Batch 197/2891 | Timestep 8870 | LR 0.0001000000 | Loss 0.042717 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:54:54 Epoch 3 | Batch 207/2891 | Timestep 8880 | LR 0.0001000000 | Loss 0.010379 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:54:57 Epoch 3 | Batch 217/2891 | Timestep 8890 | LR 0.0001000000 | Loss 0.012217 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:54:59 Epoch 3 | Batch 227/2891 | Timestep 8900 | LR 0.0001000000 | Loss 0.037466 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:55:01 Epoch 3 | Batch 237/2891 | Timestep 8910 | LR 0.0001000000 | Loss 0.045814 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:55:03 Epoch 3 | Batch 247/2891 | Timestep 8920 | LR 0.0001000000 | Loss 0.014828 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:55:05 Epoch 3 | Batch 257/2891 | Timestep 8930 | LR 0.0001000000 | Loss 0.003199 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:55:07 Epoch 3 | Batch 267/2891 | Timestep 8940 | LR 0.0001000000 | Loss 0.007863 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:55:09 Epoch 3 | Batch 277/2891 | Timestep 8950 | LR 0.0001000000 | Loss 0.027158 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:55:11 Epoch 3 | Batch 287/2891 | Timestep 8960 | LR 0.0001000000 | Loss 0.037230 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:55:14 Epoch 3 | Batch 297/2891 | Timestep 8970 | LR 0.0001000000 | Loss 0.008622 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:55:16 Epoch 3 | Batch 307/2891 | Timestep 8980 | LR 0.0001000000 | Loss 0.013949 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:55:18 Epoch 3 | Batch 317/2891 | Timestep 8990 | LR 0.0001000000 | Loss 0.007317 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:55:20 Epoch 3 | Batch 327/2891 | Timestep 9000 | LR 0.0001000000 | Loss 0.041702 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:55:22 Epoch 3 | Batch 337/2891 | Timestep 9010 | LR 0.0001000000 | Loss 0.011045 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:55:24 Epoch 3 | Batch 347/2891 | Timestep 9020 | LR 0.0001000000 | Loss 0.073986 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:55:26 Epoch 3 | Batch 357/2891 | Timestep 9030 | LR 0.0001000000 | Loss 0.005800 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:55:29 Epoch 3 | Batch 367/2891 | Timestep 9040 | LR 0.0001000000 | Loss 0.044957 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:55:31 Epoch 3 | Batch 377/2891 | Timestep 9050 | LR 0.0001000000 | Loss 0.092569 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:55:33 Epoch 3 | Batch 387/2891 | Timestep 9060 | LR 0.0001000000 | Loss 0.030828 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:55:35 Epoch 3 | Batch 397/2891 | Timestep 9070 | LR 0.0001000000 | Loss 0.025631 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:55:37 Epoch 3 | Batch 407/2891 | Timestep 9080 | LR 0.0001000000 | Loss 0.090209 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:55:40 Epoch 3 | Batch 417/2891 | Timestep 9090 | LR 0.0001000000 | Loss 0.077372 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:55:42 Epoch 3 | Batch 427/2891 | Timestep 9100 | LR 0.0001000000 | Loss 0.044374 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:55:44 Epoch 3 | Batch 437/2891 | Timestep 9110 | LR 0.0001000000 | Loss 0.112185 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:55:47 Epoch 3 | Batch 447/2891 | Timestep 9120 | LR 0.0001000000 | Loss 0.036147 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:55:49 Epoch 3 | Batch 457/2891 | Timestep 9130 | LR 0.0001000000 | Loss 0.025845 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:55:51 Epoch 3 | Batch 467/2891 | Timestep 9140 | LR 0.0001000000 | Loss 0.033634 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:55:54 Epoch 3 | Batch 477/2891 | Timestep 9150 | LR 0.0001000000 | Loss 0.012943 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:55:56 Epoch 3 | Batch 487/2891 | Timestep 9160 | LR 0.0001000000 | Loss 0.018647 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:55:58 Epoch 3 | Batch 497/2891 | Timestep 9170 | LR 0.0001000000 | Loss 0.050727 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:56:01 Epoch 3 | Batch 507/2891 | Timestep 9180 | LR 0.0001000000 | Loss 0.040583 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:56:03 Epoch 3 | Batch 517/2891 | Timestep 9190 | LR 0.0001000000 | Loss 0.072397 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:56:05 Epoch 3 | Batch 527/2891 | Timestep 9200 | LR 0.0001000000 | Loss 0.143899 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:56:07 Epoch 3 | Batch 537/2891 | Timestep 9210 | LR 0.0001000000 | Loss 0.007831 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:56:09 Epoch 3 | Batch 547/2891 | Timestep 9220 | LR 0.0001000000 | Loss 0.017021 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:56:11 Epoch 3 | Batch 557/2891 | Timestep 9230 | LR 0.0001000000 | Loss 0.059586 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:56:13 Epoch 3 | Batch 567/2891 | Timestep 9240 | LR 0.0001000000 | Loss 0.084894 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:56:15 Epoch 3 | Batch 577/2891 | Timestep 9250 | LR 0.0001000000 | Loss 0.009519 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:56:17 Epoch 3 | Batch 587/2891 | Timestep 9260 | LR 0.0001000000 | Loss 0.016798 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:56:19 Epoch 3 | Batch 597/2891 | Timestep 9270 | LR 0.0001000000 | Loss 0.060742 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:56:22 Epoch 3 | Batch 607/2891 | Timestep 9280 | LR 0.0001000000 | Loss 0.086881 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:56:24 Epoch 3 | Batch 617/2891 | Timestep 9290 | LR 0.0001000000 | Loss 0.008058 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:56:26 Epoch 3 | Batch 627/2891 | Timestep 9300 | LR 0.0001000000 | Loss 0.104278 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:56:29 Epoch 3 | Batch 637/2891 | Timestep 9310 | LR 0.0001000000 | Loss 0.012003 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:56:30 Epoch 3 | Batch 647/2891 | Timestep 9320 | LR 0.0001000000 | Loss 0.014002 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:56:32 Epoch 3 | Batch 657/2891 | Timestep 9330 | LR 0.0001000000 | Loss 0.032076 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:56:35 Epoch 3 | Batch 667/2891 | Timestep 9340 | LR 0.0001000000 | Loss 0.028287 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:56:37 Epoch 3 | Batch 677/2891 | Timestep 9350 | LR 0.0001000000 | Loss 0.094186 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:56:39 Epoch 3 | Batch 687/2891 | Timestep 9360 | LR 0.0001000000 | Loss 0.110193 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:56:41 Epoch 3 | Batch 697/2891 | Timestep 9370 | LR 0.0001000000 | Loss 0.010873 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:56:43 Epoch 3 | Batch 707/2891 | Timestep 9380 | LR 0.0001000000 | Loss 0.038349 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:56:45 Epoch 3 | Batch 717/2891 | Timestep 9390 | LR 0.0001000000 | Loss 0.012628 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:56:48 Epoch 3 | Batch 727/2891 | Timestep 9400 | LR 0.0001000000 | Loss 0.087832 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:56:50 Epoch 3 | Batch 737/2891 | Timestep 9410 | LR 0.0001000000 | Loss 0.100889 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:56:52 Epoch 3 | Batch 747/2891 | Timestep 9420 | LR 0.0001000000 | Loss 0.008269 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:56:55 Epoch 3 | Batch 757/2891 | Timestep 9430 | LR 0.0001000000 | Loss 0.094135 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:56:57 Epoch 3 | Batch 767/2891 | Timestep 9440 | LR 0.0001000000 | Loss 0.011424 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:56:59 Epoch 3 | Batch 777/2891 | Timestep 9450 | LR 0.0001000000 | Loss 0.061671 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:57:01 Epoch 3 | Batch 787/2891 | Timestep 9460 | LR 0.0001000000 | Loss 0.212837 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:57:03 Epoch 3 | Batch 797/2891 | Timestep 9470 | LR 0.0001000000 | Loss 0.014446 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:57:06 Epoch 3 | Batch 807/2891 | Timestep 9480 | LR 0.0001000000 | Loss 0.042362 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:57:07 Epoch 3 | Batch 817/2891 | Timestep 9490 | LR 0.0001000000 | Loss 0.046656 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:57:10 Epoch 3 | Batch 827/2891 | Timestep 9500 | LR 0.0001000000 | Loss 0.035257 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:57:12 Epoch 3 | Batch 837/2891 | Timestep 9510 | LR 0.0001000000 | Loss 0.006230 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:57:15 Epoch 3 | Batch 847/2891 | Timestep 9520 | LR 0.0001000000 | Loss 0.002268 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:57:17 Epoch 3 | Batch 857/2891 | Timestep 9530 | LR 0.0001000000 | Loss 0.043275 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:57:19 Epoch 3 | Batch 867/2891 | Timestep 9540 | LR 0.0001000000 | Loss 0.069715 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:57:21 Epoch 3 | Batch 877/2891 | Timestep 9550 | LR 0.0001000000 | Loss 0.063895 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:57:23 Epoch 3 | Batch 887/2891 | Timestep 9560 | LR 0.0001000000 | Loss 0.008264 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:57:25 Epoch 3 | Batch 897/2891 | Timestep 9570 | LR 0.0001000000 | Loss 0.032053 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:57:27 Epoch 3 | Batch 907/2891 | Timestep 9580 | LR 0.0001000000 | Loss 0.066952 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:57:29 Epoch 3 | Batch 917/2891 | Timestep 9590 | LR 0.0001000000 | Loss 0.014392 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:57:31 Epoch 3 | Batch 927/2891 | Timestep 9600 | LR 0.0001000000 | Loss 0.031684 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:57:33 Epoch 3 | Batch 937/2891 | Timestep 9610 | LR 0.0001000000 | Loss 0.034615 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:57:36 Epoch 3 | Batch 947/2891 | Timestep 9620 | LR 0.0001000000 | Loss 0.108501 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:57:38 Epoch 3 | Batch 957/2891 | Timestep 9630 | LR 0.0001000000 | Loss 0.071536 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:57:41 Epoch 3 | Batch 967/2891 | Timestep 9640 | LR 0.0001000000 | Loss 0.003586 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:57:43 Epoch 3 | Batch 977/2891 | Timestep 9650 | LR 0.0001000000 | Loss 0.021979 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:57:45 Epoch 3 | Batch 987/2891 | Timestep 9660 | LR 0.0001000000 | Loss 0.055639 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:57:48 Epoch 3 | Batch 997/2891 | Timestep 9670 | LR 0.0001000000 | Loss 0.029099 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:57:49 Epoch 3 | Batch 1007/2891 | Timestep 9680 | LR 0.0001000000 | Loss 0.173098 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:57:52 Epoch 3 | Batch 1017/2891 | Timestep 9690 | LR 0.0001000000 | Loss 0.065694 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:57:54 Epoch 3 | Batch 1027/2891 | Timestep 9700 | LR 0.0001000000 | Loss 0.048960 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:57:56 Epoch 3 | Batch 1037/2891 | Timestep 9710 | LR 0.0001000000 | Loss 0.104454 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:57:58 Epoch 3 | Batch 1047/2891 | Timestep 9720 | LR 0.0001000000 | Loss 0.029361 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:58:01 Epoch 3 | Batch 1057/2891 | Timestep 9730 | LR 0.0001000000 | Loss 0.047859 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:58:03 Epoch 3 | Batch 1067/2891 | Timestep 9740 | LR 0.0001000000 | Loss 0.022096 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:58:05 Epoch 3 | Batch 1077/2891 | Timestep 9750 | LR 0.0001000000 | Loss 0.055904 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:58:08 Epoch 3 | Batch 1087/2891 | Timestep 9760 | LR 0.0001000000 | Loss 0.029604 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:58:10 Epoch 3 | Batch 1097/2891 | Timestep 9770 | LR 0.0001000000 | Loss 0.100053 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:58:12 Epoch 3 | Batch 1107/2891 | Timestep 9780 | LR 0.0001000000 | Loss 0.017474 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:58:14 Epoch 3 | Batch 1117/2891 | Timestep 9790 | LR 0.0001000000 | Loss 0.056922 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:58:16 Epoch 3 | Batch 1127/2891 | Timestep 9800 | LR 0.0001000000 | Loss 0.025207 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:58:18 Epoch 3 | Batch 1137/2891 | Timestep 9810 | LR 0.0001000000 | Loss 0.053850 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:58:21 Epoch 3 | Batch 1147/2891 | Timestep 9820 | LR 0.0001000000 | Loss 0.005007 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:58:23 Epoch 3 | Batch 1157/2891 | Timestep 9830 | LR 0.0001000000 | Loss 0.031114 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:58:25 Epoch 3 | Batch 1167/2891 | Timestep 9840 | LR 0.0001000000 | Loss 0.016109 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:58:27 Epoch 3 | Batch 1177/2891 | Timestep 9850 | LR 0.0001000000 | Loss 0.046325 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:58:29 Epoch 3 | Batch 1187/2891 | Timestep 9860 | LR 0.0001000000 | Loss 0.042281 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:58:31 Epoch 3 | Batch 1197/2891 | Timestep 9870 | LR 0.0001000000 | Loss 0.103713 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:58:33 Epoch 3 | Batch 1207/2891 | Timestep 9880 | LR 0.0001000000 | Loss 0.024987 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:58:36 Epoch 3 | Batch 1217/2891 | Timestep 9890 | LR 0.0001000000 | Loss 0.005416 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:58:38 Epoch 3 | Batch 1227/2891 | Timestep 9900 | LR 0.0001000000 | Loss 0.051674 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:58:40 Epoch 3 | Batch 1237/2891 | Timestep 9910 | LR 0.0001000000 | Loss 0.038684 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:58:42 Epoch 3 | Batch 1247/2891 | Timestep 9920 | LR 0.0001000000 | Loss 0.028880 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:58:44 Epoch 3 | Batch 1257/2891 | Timestep 9930 | LR 0.0001000000 | Loss 0.042233 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:58:46 Epoch 3 | Batch 1267/2891 | Timestep 9940 | LR 0.0001000000 | Loss 0.061690 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:58:48 Epoch 3 | Batch 1277/2891 | Timestep 9950 | LR 0.0001000000 | Loss 0.088918 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:58:50 Epoch 3 | Batch 1287/2891 | Timestep 9960 | LR 0.0001000000 | Loss 0.041015 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:58:52 Epoch 3 | Batch 1297/2891 | Timestep 9970 | LR 0.0001000000 | Loss 0.013387 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:58:54 Epoch 3 | Batch 1307/2891 | Timestep 9980 | LR 0.0001000000 | Loss 0.028328 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:58:56 Epoch 3 | Batch 1317/2891 | Timestep 9990 | LR 0.0001000000 | Loss 0.019986 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:58:58 Epoch 3 | Batch 1327/2891 | Timestep 10000 | LR 0.0001000000 | Loss 0.026238 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:59:01 Epoch 3 | Batch 1337/2891 | Timestep 10010 | LR 0.0001000000 | Loss 0.037429 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:59:03 Epoch 3 | Batch 1347/2891 | Timestep 10020 | LR 0.0001000000 | Loss 0.008460 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:59:05 Epoch 3 | Batch 1357/2891 | Timestep 10030 | LR 0.0001000000 | Loss 0.044503 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:59:07 Epoch 3 | Batch 1367/2891 | Timestep 10040 | LR 0.0001000000 | Loss 0.102775 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:59:10 Epoch 3 | Batch 1377/2891 | Timestep 10050 | LR 0.0001000000 | Loss 0.057675 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:59:12 Epoch 3 | Batch 1387/2891 | Timestep 10060 | LR 0.0001000000 | Loss 0.105287 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:59:14 Epoch 3 | Batch 1397/2891 | Timestep 10070 | LR 0.0001000000 | Loss 0.047206 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:59:16 Epoch 3 | Batch 1407/2891 | Timestep 10080 | LR 0.0001000000 | Loss 0.103232 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:59:18 Epoch 3 | Batch 1417/2891 | Timestep 10090 | LR 0.0001000000 | Loss 0.066593 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:59:20 Epoch 3 | Batch 1427/2891 | Timestep 10100 | LR 0.0001000000 | Loss 0.035120 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:59:23 Epoch 3 | Batch 1437/2891 | Timestep 10110 | LR 0.0001000000 | Loss 0.006945 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:59:26 Epoch 3 | Batch 1447/2891 | Timestep 10120 | LR 0.0001000000 | Loss 0.027805 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:59:28 Epoch 3 | Batch 1457/2891 | Timestep 10130 | LR 0.0001000000 | Loss 0.047875 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:59:30 Epoch 3 | Batch 1467/2891 | Timestep 10140 | LR 0.0001000000 | Loss 0.031337 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:59:32 Epoch 3 | Batch 1477/2891 | Timestep 10150 | LR 0.0001000000 | Loss 0.044229 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:59:34 Epoch 3 | Batch 1487/2891 | Timestep 10160 | LR 0.0001000000 | Loss 0.013657 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:59:36 Epoch 3 | Batch 1497/2891 | Timestep 10170 | LR 0.0001000000 | Loss 0.013584 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:59:39 Epoch 3 | Batch 1507/2891 | Timestep 10180 | LR 0.0001000000 | Loss 0.071532 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:59:41 Epoch 3 | Batch 1517/2891 | Timestep 10190 | LR 0.0001000000 | Loss 0.031855 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:59:43 Epoch 3 | Batch 1527/2891 | Timestep 10200 | LR 0.0001000000 | Loss 0.024816 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:59:45 Epoch 3 | Batch 1537/2891 | Timestep 10210 | LR 0.0001000000 | Loss 0.076186 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:59:47 Epoch 3 | Batch 1547/2891 | Timestep 10220 | LR 0.0001000000 | Loss 0.003536 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:59:49 Epoch 3 | Batch 1557/2891 | Timestep 10230 | LR 0.0001000000 | Loss 0.103668 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:59:51 Epoch 3 | Batch 1567/2891 | Timestep 10240 | LR 0.0001000000 | Loss 0.008351 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:59:53 Epoch 3 | Batch 1577/2891 | Timestep 10250 | LR 0.0001000000 | Loss 0.019399 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:59:56 Epoch 3 | Batch 1587/2891 | Timestep 10260 | LR 0.0001000000 | Loss 0.043652 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 18:59:58 Epoch 3 | Batch 1597/2891 | Timestep 10270 | LR 0.0001000000 | Loss 0.012363 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:00:00 Epoch 3 | Batch 1607/2891 | Timestep 10280 | LR 0.0001000000 | Loss 0.032170 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:00:03 Epoch 3 | Batch 1617/2891 | Timestep 10290 | LR 0.0001000000 | Loss 0.086820 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:00:05 Epoch 3 | Batch 1627/2891 | Timestep 10300 | LR 0.0001000000 | Loss 0.048626 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:00:07 Epoch 3 | Batch 1637/2891 | Timestep 10310 | LR 0.0001000000 | Loss 0.011947 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:00:09 Epoch 3 | Batch 1647/2891 | Timestep 10320 | LR 0.0001000000 | Loss 0.017686 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:00:12 Epoch 3 | Batch 1657/2891 | Timestep 10330 | LR 0.0001000000 | Loss 0.006051 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:00:14 Epoch 3 | Batch 1667/2891 | Timestep 10340 | LR 0.0001000000 | Loss 0.034468 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:00:16 Epoch 3 | Batch 1677/2891 | Timestep 10350 | LR 0.0001000000 | Loss 0.073445 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:00:19 Epoch 3 | Batch 1687/2891 | Timestep 10360 | LR 0.0001000000 | Loss 0.024437 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:00:21 Epoch 3 | Batch 1697/2891 | Timestep 10370 | LR 0.0001000000 | Loss 0.010736 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:00:23 Epoch 3 | Batch 1707/2891 | Timestep 10380 | LR 0.0001000000 | Loss 0.070803 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:00:25 Epoch 3 | Batch 1717/2891 | Timestep 10390 | LR 0.0001000000 | Loss 0.070050 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:00:27 Epoch 3 | Batch 1727/2891 | Timestep 10400 | LR 0.0001000000 | Loss 0.027539 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:00:29 Epoch 3 | Batch 1737/2891 | Timestep 10410 | LR 0.0001000000 | Loss 0.000871 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:00:31 Epoch 3 | Batch 1747/2891 | Timestep 10420 | LR 0.0001000000 | Loss 0.055618 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:00:34 Epoch 3 | Batch 1757/2891 | Timestep 10430 | LR 0.0001000000 | Loss 0.048695 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:00:37 Epoch 3 | Batch 1767/2891 | Timestep 10440 | LR 0.0001000000 | Loss 0.081182 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:00:39 Epoch 3 | Batch 1777/2891 | Timestep 10450 | LR 0.0001000000 | Loss 0.043397 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:00:42 Epoch 3 | Batch 1787/2891 | Timestep 10460 | LR 0.0001000000 | Loss 0.052996 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:00:44 Epoch 3 | Batch 1797/2891 | Timestep 10470 | LR 0.0001000000 | Loss 0.022616 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:00:46 Epoch 3 | Batch 1807/2891 | Timestep 10480 | LR 0.0001000000 | Loss 0.050718 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:00:48 Epoch 3 | Batch 1817/2891 | Timestep 10490 | LR 0.0001000000 | Loss 0.045279 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:00:50 Epoch 3 | Batch 1827/2891 | Timestep 10500 | LR 0.0001000000 | Loss 0.006470 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:00:52 Epoch 3 | Batch 1837/2891 | Timestep 10510 | LR 0.0001000000 | Loss 0.020518 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:00:54 Epoch 3 | Batch 1847/2891 | Timestep 10520 | LR 0.0001000000 | Loss 0.045804 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:00:57 Epoch 3 | Batch 1857/2891 | Timestep 10530 | LR 0.0001000000 | Loss 0.033295 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:00:59 Epoch 3 | Batch 1867/2891 | Timestep 10540 | LR 0.0001000000 | Loss 0.164149 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:01:01 Epoch 3 | Batch 1877/2891 | Timestep 10550 | LR 0.0001000000 | Loss 0.013651 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:01:03 Epoch 3 | Batch 1887/2891 | Timestep 10560 | LR 0.0001000000 | Loss 0.095620 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:01:06 Epoch 3 | Batch 1897/2891 | Timestep 10570 | LR 0.0001000000 | Loss 0.014449 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:01:08 Epoch 3 | Batch 1907/2891 | Timestep 10580 | LR 0.0001000000 | Loss 0.041885 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:01:10 Epoch 3 | Batch 1917/2891 | Timestep 10590 | LR 0.0001000000 | Loss 0.005596 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:01:13 Epoch 3 | Batch 1927/2891 | Timestep 10600 | LR 0.0001000000 | Loss 0.031317 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:01:15 Epoch 3 | Batch 1937/2891 | Timestep 10610 | LR 0.0001000000 | Loss 0.101442 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:01:17 Epoch 3 | Batch 1947/2891 | Timestep 10620 | LR 0.0001000000 | Loss 0.035281 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:01:19 Epoch 3 | Batch 1957/2891 | Timestep 10630 | LR 0.0001000000 | Loss 0.043423 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:01:22 Epoch 3 | Batch 1967/2891 | Timestep 10640 | LR 0.0001000000 | Loss 0.038177 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:01:24 Epoch 3 | Batch 1977/2891 | Timestep 10650 | LR 0.0001000000 | Loss 0.069056 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:01:26 Epoch 3 | Batch 1987/2891 | Timestep 10660 | LR 0.0001000000 | Loss 0.014271 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:01:28 Epoch 3 | Batch 1997/2891 | Timestep 10670 | LR 0.0001000000 | Loss 0.035940 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:01:30 Epoch 3 | Batch 2007/2891 | Timestep 10680 | LR 0.0001000000 | Loss 0.007215 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:01:32 Epoch 3 | Batch 2017/2891 | Timestep 10690 | LR 0.0001000000 | Loss 0.035661 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:01:34 Epoch 3 | Batch 2027/2891 | Timestep 10700 | LR 0.0001000000 | Loss 0.113316 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:01:37 Epoch 3 | Batch 2037/2891 | Timestep 10710 | LR 0.0001000000 | Loss 0.001865 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:01:39 Epoch 3 | Batch 2047/2891 | Timestep 10720 | LR 0.0001000000 | Loss 0.008796 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:01:41 Epoch 3 | Batch 2057/2891 | Timestep 10730 | LR 0.0001000000 | Loss 0.120107 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:01:43 Epoch 3 | Batch 2067/2891 | Timestep 10740 | LR 0.0001000000 | Loss 0.048690 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:01:46 Epoch 3 | Batch 2077/2891 | Timestep 10750 | LR 0.0001000000 | Loss 0.014744 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:01:48 Epoch 3 | Batch 2087/2891 | Timestep 10760 | LR 0.0001000000 | Loss 0.052314 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:01:50 Epoch 3 | Batch 2097/2891 | Timestep 10770 | LR 0.0001000000 | Loss 0.233305 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:01:52 Epoch 3 | Batch 2107/2891 | Timestep 10780 | LR 0.0001000000 | Loss 0.022252 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:01:54 Epoch 3 | Batch 2117/2891 | Timestep 10790 | LR 0.0001000000 | Loss 0.160893 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:01:56 Epoch 3 | Batch 2127/2891 | Timestep 10800 | LR 0.0001000000 | Loss 0.002121 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:01:59 Epoch 3 | Batch 2137/2891 | Timestep 10810 | LR 0.0001000000 | Loss 0.020334 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:02:01 Epoch 3 | Batch 2147/2891 | Timestep 10820 | LR 0.0001000000 | Loss 0.016048 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:02:03 Epoch 3 | Batch 2157/2891 | Timestep 10830 | LR 0.0001000000 | Loss 0.182943 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:02:05 Epoch 3 | Batch 2167/2891 | Timestep 10840 | LR 0.0001000000 | Loss 0.032160 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:02:07 Epoch 3 | Batch 2177/2891 | Timestep 10850 | LR 0.0001000000 | Loss 0.089093 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:02:09 Epoch 3 | Batch 2187/2891 | Timestep 10860 | LR 0.0001000000 | Loss 0.023093 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:02:12 Epoch 3 | Batch 2197/2891 | Timestep 10870 | LR 0.0001000000 | Loss 0.133572 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:02:14 Epoch 3 | Batch 2207/2891 | Timestep 10880 | LR 0.0001000000 | Loss 0.004586 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:02:16 Epoch 3 | Batch 2217/2891 | Timestep 10890 | LR 0.0001000000 | Loss 0.004703 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:02:18 Epoch 3 | Batch 2227/2891 | Timestep 10900 | LR 0.0001000000 | Loss 0.098005 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:02:20 Epoch 3 | Batch 2237/2891 | Timestep 10910 | LR 0.0001000000 | Loss 0.038042 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:02:22 Epoch 3 | Batch 2247/2891 | Timestep 10920 | LR 0.0001000000 | Loss 0.002433 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:02:24 Epoch 3 | Batch 2257/2891 | Timestep 10930 | LR 0.0001000000 | Loss 0.031932 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:02:27 Epoch 3 | Batch 2267/2891 | Timestep 10940 | LR 0.0001000000 | Loss 0.018603 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:02:29 Epoch 3 | Batch 2277/2891 | Timestep 10950 | LR 0.0001000000 | Loss 0.108324 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:02:31 Epoch 3 | Batch 2287/2891 | Timestep 10960 | LR 0.0001000000 | Loss 0.018633 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:02:33 Epoch 3 | Batch 2297/2891 | Timestep 10970 | LR 0.0001000000 | Loss 0.011839 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:02:35 Epoch 3 | Batch 2307/2891 | Timestep 10980 | LR 0.0001000000 | Loss 0.084855 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:02:37 Epoch 3 | Batch 2317/2891 | Timestep 10990 | LR 0.0001000000 | Loss 0.018321 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:02:39 Epoch 3 | Batch 2327/2891 | Timestep 11000 | LR 0.0001000000 | Loss 0.016889 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:02:41 Epoch 3 | Batch 2337/2891 | Timestep 11010 | LR 0.0001000000 | Loss 0.023010 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:02:44 Epoch 3 | Batch 2347/2891 | Timestep 11020 | LR 0.0001000000 | Loss 0.017814 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:02:46 Epoch 3 | Batch 2357/2891 | Timestep 11030 | LR 0.0001000000 | Loss 0.105616 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:02:48 Epoch 3 | Batch 2367/2891 | Timestep 11040 | LR 0.0001000000 | Loss 0.081477 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:02:51 Epoch 3 | Batch 2377/2891 | Timestep 11050 | LR 0.0001000000 | Loss 0.081957 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:02:53 Epoch 3 | Batch 2387/2891 | Timestep 11060 | LR 0.0001000000 | Loss 0.106567 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:02:55 Epoch 3 | Batch 2397/2891 | Timestep 11070 | LR 0.0001000000 | Loss 0.014169 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:02:57 Epoch 3 | Batch 2407/2891 | Timestep 11080 | LR 0.0001000000 | Loss 0.054922 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:03:00 Epoch 3 | Batch 2417/2891 | Timestep 11090 | LR 0.0001000000 | Loss 0.049048 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:03:02 Epoch 3 | Batch 2427/2891 | Timestep 11100 | LR 0.0001000000 | Loss 0.037171 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:03:04 Epoch 3 | Batch 2437/2891 | Timestep 11110 | LR 0.0001000000 | Loss 0.025969 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:03:06 Epoch 3 | Batch 2447/2891 | Timestep 11120 | LR 0.0001000000 | Loss 0.017227 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:03:08 Epoch 3 | Batch 2457/2891 | Timestep 11130 | LR 0.0001000000 | Loss 0.047495 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:03:10 Epoch 3 | Batch 2467/2891 | Timestep 11140 | LR 0.0001000000 | Loss 0.048947 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:03:13 Epoch 3 | Batch 2477/2891 | Timestep 11150 | LR 0.0001000000 | Loss 0.011391 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:03:16 Epoch 3 | Batch 2487/2891 | Timestep 11160 | LR 0.0001000000 | Loss 0.014354 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:03:18 Epoch 3 | Batch 2497/2891 | Timestep 11170 | LR 0.0001000000 | Loss 0.075914 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:03:20 Epoch 3 | Batch 2507/2891 | Timestep 11180 | LR 0.0001000000 | Loss 0.024633 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:03:22 Epoch 3 | Batch 2517/2891 | Timestep 11190 | LR 0.0001000000 | Loss 0.191498 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:03:24 Epoch 3 | Batch 2527/2891 | Timestep 11200 | LR 0.0001000000 | Loss 0.064654 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:03:26 Epoch 3 | Batch 2537/2891 | Timestep 11210 | LR 0.0001000000 | Loss 0.043336 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:03:28 Epoch 3 | Batch 2547/2891 | Timestep 11220 | LR 0.0001000000 | Loss 0.042559 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:03:30 Epoch 3 | Batch 2557/2891 | Timestep 11230 | LR 0.0001000000 | Loss 0.050155 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:03:32 Epoch 3 | Batch 2567/2891 | Timestep 11240 | LR 0.0001000000 | Loss 0.029959 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:03:35 Epoch 3 | Batch 2577/2891 | Timestep 11250 | LR 0.0001000000 | Loss 0.123459 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:03:37 Epoch 3 | Batch 2587/2891 | Timestep 11260 | LR 0.0001000000 | Loss 0.011566 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:03:39 Epoch 3 | Batch 2597/2891 | Timestep 11270 | LR 0.0001000000 | Loss 0.231207 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:03:41 Epoch 3 | Batch 2607/2891 | Timestep 11280 | LR 0.0001000000 | Loss 0.015439 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:03:43 Epoch 3 | Batch 2617/2891 | Timestep 11290 | LR 0.0001000000 | Loss 0.105952 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:03:45 Epoch 3 | Batch 2627/2891 | Timestep 11300 | LR 0.0001000000 | Loss 2.567754 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:03:48 Epoch 3 | Batch 2637/2891 | Timestep 11310 | LR 0.0001000000 | Loss 4.595736 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:03:50 Epoch 3 | Batch 2647/2891 | Timestep 11320 | LR 0.0001000000 | Loss 0.063190 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:03:52 Epoch 3 | Batch 2657/2891 | Timestep 11330 | LR 0.0001000000 | Loss 0.089011 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:03:54 Epoch 3 | Batch 2667/2891 | Timestep 11340 | LR 0.0001000000 | Loss 0.077422 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:03:56 Epoch 3 | Batch 2677/2891 | Timestep 11350 | LR 0.0001000000 | Loss 0.058767 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:03:58 Epoch 3 | Batch 2687/2891 | Timestep 11360 | LR 0.0001000000 | Loss 0.013586 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:04:00 Epoch 3 | Batch 2697/2891 | Timestep 11370 | LR 0.0001000000 | Loss 0.018489 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:04:02 Epoch 3 | Batch 2707/2891 | Timestep 11380 | LR 0.0001000000 | Loss 0.032985 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:04:04 Epoch 3 | Batch 2717/2891 | Timestep 11390 | LR 0.0001000000 | Loss 0.230227 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:04:06 Epoch 3 | Batch 2727/2891 | Timestep 11400 | LR 0.0001000000 | Loss 0.051413 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:04:08 Epoch 3 | Batch 2737/2891 | Timestep 11410 | LR 0.0001000000 | Loss 0.030019 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:04:11 Epoch 3 | Batch 2747/2891 | Timestep 11420 | LR 0.0001000000 | Loss 0.100555 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:04:13 Epoch 3 | Batch 2757/2891 | Timestep 11430 | LR 0.0001000000 | Loss 0.074686 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:04:15 Epoch 3 | Batch 2767/2891 | Timestep 11440 | LR 0.0001000000 | Loss 0.019899 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:04:18 Epoch 3 | Batch 2777/2891 | Timestep 11450 | LR 0.0001000000 | Loss 0.200192 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:04:20 Epoch 3 | Batch 2787/2891 | Timestep 11460 | LR 0.0001000000 | Loss 0.112392 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:04:22 Epoch 3 | Batch 2797/2891 | Timestep 11470 | LR 0.0001000000 | Loss 0.142781 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:04:24 Epoch 3 | Batch 2807/2891 | Timestep 11480 | LR 0.0001000000 | Loss 0.060360 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:04:27 Epoch 3 | Batch 2817/2891 | Timestep 11490 | LR 0.0001000000 | Loss 0.014389 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:04:29 Epoch 3 | Batch 2827/2891 | Timestep 11500 | LR 0.0001000000 | Loss 0.005870 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:04:31 Epoch 3 | Batch 2837/2891 | Timestep 11510 | LR 0.0001000000 | Loss 0.034343 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:04:33 Epoch 3 | Batch 2847/2891 | Timestep 11520 | LR 0.0001000000 | Loss 0.048867 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:04:35 Epoch 3 | Batch 2857/2891 | Timestep 11530 | LR 0.0001000000 | Loss 0.033317 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:04:37 Epoch 3 | Batch 2867/2891 | Timestep 11540 | LR 0.0001000000 | Loss 0.009217 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:04:39 Epoch 3 | Batch 2877/2891 | Timestep 11550 | LR 0.0001000000 | Loss 0.019954 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:04:42 Epoch 3 | Batch 2887/2891 | Timestep 11560 | LR 0.0001000000 | Loss 0.029858 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:04:42 ** Evaluating on validation dataset ** +INFO root Tue, 26 Mar 2024 19:06:03 + precision recall f1-score support + + BOUNDARY 0.0000 0.0000 0.0000 4 + BUILDING-OR-GROUNDS 0.6612 0.7692 0.7111 104 + CAMP 0.9118 0.8732 0.8921 71 + CARDINAL 0.8521 0.7118 0.7756 170 + CLUSTER 0.6333 0.7308 0.6786 26 + COM 0.6250 0.6410 0.6329 39 + CONTINENT 1.0000 0.8696 0.9302 23 + COUNTRY 0.9783 0.9713 0.9748 835 + CURR 0.9091 0.8333 0.8696 24 + DATE 0.8951 0.9030 0.8990 1691 + EDU 0.8482 0.8716 0.8597 109 + ENT 0.0000 0.0000 0.0000 1 + EVENT 0.6589 0.6815 0.6700 292 + FAC 0.6593 0.8018 0.7236 111 + GOV 0.8393 0.9233 0.8793 860 + GPE 0.9695 0.9690 0.9693 2261 + GPE_ORG 0.7418 0.9461 0.8316 167 + LAND-REGION-NATURAL 0.6190 0.2500 0.3562 52 + LANGUAGE 0.0000 0.0000 0.0000 16 + LAW 0.6212 0.8723 0.7257 47 + LOC 0.7405 0.7638 0.7519 127 + MED 0.9952 0.9857 0.9904 419 + MONEY 0.6296 0.7727 0.6939 22 + NEIGHBORHOOD 0.3333 0.8000 0.4706 5 + NONGOV 0.8852 0.8914 0.8883 571 + NORP 0.6262 0.7205 0.6700 551 + OCC 0.8183 0.8716 0.8442 522 + ORDINAL 0.9642 0.8915 0.9265 544 + ORG 0.9150 0.9263 0.9206 1790 + ORG_FAC 0.1481 0.5714 0.2353 7 + PATH 0.1333 0.3333 0.1905 6 + PERCENT 0.9231 1.0000 0.9600 12 + PERS 0.8731 0.9426 0.9065 679 + PRODUCT 0.2500 0.2500 0.2500 8 + QUANTITY 0.5000 0.6667 0.5714 3 + REGION-GENERAL 0.7714 0.7297 0.7500 37 +REGION-INTERNATIONAL 0.6923 0.7500 0.7200 12 + REL 0.6667 0.6000 0.6316 10 + SCI 0.3043 0.5385 0.3889 13 + SPO 0.0000 0.0000 0.0000 2 + SPORT 0.0000 0.0000 0.0000 4 + STATE-OR-PROVINCE 0.8410 0.9162 0.8770 179 + SUBAREA-FACILITY 0.5500 0.6875 0.6111 16 + TIME 0.6897 0.6061 0.6452 33 + TOWN 0.9651 0.9540 0.9595 1217 + UNIT 1.0000 0.7500 0.8571 4 + WATER-BODY 0.7778 0.5000 0.6087 14 + WEBSITE 0.5312 0.6375 0.5795 80 + + micro avg 0.8794 0.9012 0.8902 13790 + macro avg 0.6447 0.6807 0.6516 13790 + weighted avg 0.8839 0.9012 0.8912 13790 + +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:06:45 Epoch 3 | Timestep 11564 | Train Loss 0.196330 | Val Loss 0.088293 | F1 0.890162 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:06:46 Epoch 4 | Batch 6/2891 | Timestep 11570 | LR 0.0001000000 | Loss 0.008679 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:06:48 Epoch 4 | Batch 16/2891 | Timestep 11580 | LR 0.0001000000 | Loss 0.006589 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:06:50 Epoch 4 | Batch 26/2891 | Timestep 11590 | LR 0.0001000000 | Loss 0.018363 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:06:53 Epoch 4 | Batch 36/2891 | Timestep 11600 | LR 0.0001000000 | Loss 0.004071 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:06:55 Epoch 4 | Batch 46/2891 | Timestep 11610 | LR 0.0001000000 | Loss 0.020100 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:06:57 Epoch 4 | Batch 56/2891 | Timestep 11620 | LR 0.0001000000 | Loss 0.009818 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:06:59 Epoch 4 | Batch 66/2891 | Timestep 11630 | LR 0.0001000000 | Loss 0.015118 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:07:02 Epoch 4 | Batch 76/2891 | Timestep 11640 | LR 0.0001000000 | Loss 0.012473 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:07:04 Epoch 4 | Batch 86/2891 | Timestep 11650 | LR 0.0001000000 | Loss 0.012464 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:07:06 Epoch 4 | Batch 96/2891 | Timestep 11660 | LR 0.0001000000 | Loss 0.026360 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:07:08 Epoch 4 | Batch 106/2891 | Timestep 11670 | LR 0.0001000000 | Loss 0.101957 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:07:10 Epoch 4 | Batch 116/2891 | Timestep 11680 | LR 0.0001000000 | Loss 0.028360 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:07:12 Epoch 4 | Batch 126/2891 | Timestep 11690 | LR 0.0001000000 | Loss 0.002853 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:07:14 Epoch 4 | Batch 136/2891 | Timestep 11700 | LR 0.0001000000 | Loss 0.006541 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:07:16 Epoch 4 | Batch 146/2891 | Timestep 11710 | LR 0.0001000000 | Loss 0.050889 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:07:19 Epoch 4 | Batch 156/2891 | Timestep 11720 | LR 0.0001000000 | Loss 0.064068 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:07:21 Epoch 4 | Batch 166/2891 | Timestep 11730 | LR 0.0001000000 | Loss 0.187444 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:07:23 Epoch 4 | Batch 176/2891 | Timestep 11740 | LR 0.0001000000 | Loss 0.006283 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:07:25 Epoch 4 | Batch 186/2891 | Timestep 11750 | LR 0.0001000000 | Loss 0.023693 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:07:27 Epoch 4 | Batch 196/2891 | Timestep 11760 | LR 0.0001000000 | Loss 0.066489 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:07:29 Epoch 4 | Batch 206/2891 | Timestep 11770 | LR 0.0001000000 | Loss 0.029311 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:07:31 Epoch 4 | Batch 216/2891 | Timestep 11780 | LR 0.0001000000 | Loss 0.084014 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:07:33 Epoch 4 | Batch 226/2891 | Timestep 11790 | LR 0.0001000000 | Loss 0.044077 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:07:35 Epoch 4 | Batch 236/2891 | Timestep 11800 | LR 0.0001000000 | Loss 0.018281 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:07:37 Epoch 4 | Batch 246/2891 | Timestep 11810 | LR 0.0001000000 | Loss 0.038263 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:07:39 Epoch 4 | Batch 256/2891 | Timestep 11820 | LR 0.0001000000 | Loss 0.037243 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:07:41 Epoch 4 | Batch 266/2891 | Timestep 11830 | LR 0.0001000000 | Loss 0.006684 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:07:43 Epoch 4 | Batch 276/2891 | Timestep 11840 | LR 0.0001000000 | Loss 0.015781 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:07:46 Epoch 4 | Batch 286/2891 | Timestep 11850 | LR 0.0001000000 | Loss 0.072046 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:07:48 Epoch 4 | Batch 296/2891 | Timestep 11860 | LR 0.0001000000 | Loss 0.013802 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:07:50 Epoch 4 | Batch 306/2891 | Timestep 11870 | LR 0.0001000000 | Loss 0.089002 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:07:52 Epoch 4 | Batch 316/2891 | Timestep 11880 | LR 0.0001000000 | Loss 0.003444 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:07:54 Epoch 4 | Batch 326/2891 | Timestep 11890 | LR 0.0001000000 | Loss 0.010019 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:07:56 Epoch 4 | Batch 336/2891 | Timestep 11900 | LR 0.0001000000 | Loss 0.016633 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:07:59 Epoch 4 | Batch 346/2891 | Timestep 11910 | LR 0.0001000000 | Loss 0.031188 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:08:02 Epoch 4 | Batch 356/2891 | Timestep 11920 | LR 0.0001000000 | Loss 0.023605 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:08:04 Epoch 4 | Batch 366/2891 | Timestep 11930 | LR 0.0001000000 | Loss 0.022305 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:08:06 Epoch 4 | Batch 376/2891 | Timestep 11940 | LR 0.0001000000 | Loss 0.052678 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:08:08 Epoch 4 | Batch 386/2891 | Timestep 11950 | LR 0.0001000000 | Loss 0.016821 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:08:11 Epoch 4 | Batch 396/2891 | Timestep 11960 | LR 0.0001000000 | Loss 0.016899 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:08:13 Epoch 4 | Batch 406/2891 | Timestep 11970 | LR 0.0001000000 | Loss 0.061662 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:08:16 Epoch 4 | Batch 416/2891 | Timestep 11980 | LR 0.0001000000 | Loss 0.063628 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:08:18 Epoch 4 | Batch 426/2891 | Timestep 11990 | LR 0.0001000000 | Loss 0.073984 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:08:20 Epoch 4 | Batch 436/2891 | Timestep 12000 | LR 0.0001000000 | Loss 0.014955 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:08:21 Epoch 4 | Batch 446/2891 | Timestep 12010 | LR 0.0001000000 | Loss 0.022891 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:08:24 Epoch 4 | Batch 456/2891 | Timestep 12020 | LR 0.0001000000 | Loss 0.037249 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:08:26 Epoch 4 | Batch 466/2891 | Timestep 12030 | LR 0.0001000000 | Loss 0.028340 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:08:28 Epoch 4 | Batch 476/2891 | Timestep 12040 | LR 0.0001000000 | Loss 0.035739 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:08:31 Epoch 4 | Batch 486/2891 | Timestep 12050 | LR 0.0001000000 | Loss 0.014781 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:08:33 Epoch 4 | Batch 496/2891 | Timestep 12060 | LR 0.0001000000 | Loss 0.025580 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:08:35 Epoch 4 | Batch 506/2891 | Timestep 12070 | LR 0.0001000000 | Loss 0.101117 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:08:37 Epoch 4 | Batch 516/2891 | Timestep 12080 | LR 0.0001000000 | Loss 0.010986 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:08:39 Epoch 4 | Batch 526/2891 | Timestep 12090 | LR 0.0001000000 | Loss 0.086897 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:08:41 Epoch 4 | Batch 536/2891 | Timestep 12100 | LR 0.0001000000 | Loss 0.056397 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:08:44 Epoch 4 | Batch 546/2891 | Timestep 12110 | LR 0.0001000000 | Loss 0.038655 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:08:46 Epoch 4 | Batch 556/2891 | Timestep 12120 | LR 0.0001000000 | Loss 0.005384 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:08:48 Epoch 4 | Batch 566/2891 | Timestep 12130 | LR 0.0001000000 | Loss 0.049866 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:08:50 Epoch 4 | Batch 576/2891 | Timestep 12140 | LR 0.0001000000 | Loss 0.064287 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:08:52 Epoch 4 | Batch 586/2891 | Timestep 12150 | LR 0.0001000000 | Loss 0.084618 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:08:54 Epoch 4 | Batch 596/2891 | Timestep 12160 | LR 0.0001000000 | Loss 0.084628 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:08:56 Epoch 4 | Batch 606/2891 | Timestep 12170 | LR 0.0001000000 | Loss 0.050004 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:08:59 Epoch 4 | Batch 616/2891 | Timestep 12180 | LR 0.0001000000 | Loss 0.008382 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:09:01 Epoch 4 | Batch 626/2891 | Timestep 12190 | LR 0.0001000000 | Loss 0.238426 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:09:03 Epoch 4 | Batch 636/2891 | Timestep 12200 | LR 0.0001000000 | Loss 0.022231 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:09:05 Epoch 4 | Batch 646/2891 | Timestep 12210 | LR 0.0001000000 | Loss 0.917261 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:09:07 Epoch 4 | Batch 656/2891 | Timestep 12220 | LR 0.0001000000 | Loss 0.257633 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:09:10 Epoch 4 | Batch 666/2891 | Timestep 12230 | LR 0.0001000000 | Loss 0.218875 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:09:12 Epoch 4 | Batch 676/2891 | Timestep 12240 | LR 0.0001000000 | Loss 0.065745 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:09:14 Epoch 4 | Batch 686/2891 | Timestep 12250 | LR 0.0001000000 | Loss 0.048243 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:09:16 Epoch 4 | Batch 696/2891 | Timestep 12260 | LR 0.0001000000 | Loss 0.017117 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:09:18 Epoch 4 | Batch 706/2891 | Timestep 12270 | LR 0.0001000000 | Loss 0.018451 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:09:20 Epoch 4 | Batch 716/2891 | Timestep 12280 | LR 0.0001000000 | Loss 0.048405 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:09:22 Epoch 4 | Batch 726/2891 | Timestep 12290 | LR 0.0001000000 | Loss 0.105769 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:09:24 Epoch 4 | Batch 736/2891 | Timestep 12300 | LR 0.0001000000 | Loss 0.034038 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:09:26 Epoch 4 | Batch 746/2891 | Timestep 12310 | LR 0.0001000000 | Loss 0.005228 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:09:28 Epoch 4 | Batch 756/2891 | Timestep 12320 | LR 0.0001000000 | Loss 0.127199 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:09:30 Epoch 4 | Batch 766/2891 | Timestep 12330 | LR 0.0001000000 | Loss 0.043842 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:09:32 Epoch 4 | Batch 776/2891 | Timestep 12340 | LR 0.0001000000 | Loss 0.089695 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:09:34 Epoch 4 | Batch 786/2891 | Timestep 12350 | LR 0.0001000000 | Loss 0.049701 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:09:37 Epoch 4 | Batch 796/2891 | Timestep 12360 | LR 0.0001000000 | Loss 0.042258 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:09:39 Epoch 4 | Batch 806/2891 | Timestep 12370 | LR 0.0001000000 | Loss 0.016238 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:09:41 Epoch 4 | Batch 816/2891 | Timestep 12380 | LR 0.0001000000 | Loss 0.026166 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:09:43 Epoch 4 | Batch 826/2891 | Timestep 12390 | LR 0.0001000000 | Loss 0.056922 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:09:46 Epoch 4 | Batch 836/2891 | Timestep 12400 | LR 0.0001000000 | Loss 155.005748 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:09:48 Epoch 4 | Batch 846/2891 | Timestep 12410 | LR 0.0001000000 | Loss 0.064430 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:09:50 Epoch 4 | Batch 856/2891 | Timestep 12420 | LR 0.0001000000 | Loss 0.065383 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:09:52 Epoch 4 | Batch 866/2891 | Timestep 12430 | LR 0.0001000000 | Loss 0.032974 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:09:54 Epoch 4 | Batch 876/2891 | Timestep 12440 | LR 0.0001000000 | Loss 0.041019 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:09:56 Epoch 4 | Batch 886/2891 | Timestep 12450 | LR 0.0001000000 | Loss 0.037010 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:09:59 Epoch 4 | Batch 896/2891 | Timestep 12460 | LR 0.0001000000 | Loss 0.027535 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:10:01 Epoch 4 | Batch 906/2891 | Timestep 12470 | LR 0.0001000000 | Loss 0.085529 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:10:03 Epoch 4 | Batch 916/2891 | Timestep 12480 | LR 0.0001000000 | Loss 0.022274 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:10:05 Epoch 4 | Batch 926/2891 | Timestep 12490 | LR 0.0001000000 | Loss 0.013971 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:10:08 Epoch 4 | Batch 936/2891 | Timestep 12500 | LR 0.0001000000 | Loss 0.025752 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:10:10 Epoch 4 | Batch 946/2891 | Timestep 12510 | LR 0.0001000000 | Loss 0.012797 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:10:12 Epoch 4 | Batch 956/2891 | Timestep 12520 | LR 0.0001000000 | Loss 0.019667 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:10:14 Epoch 4 | Batch 966/2891 | Timestep 12530 | LR 0.0001000000 | Loss 0.080812 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:10:16 Epoch 4 | Batch 976/2891 | Timestep 12540 | LR 0.0001000000 | Loss 0.007104 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:10:19 Epoch 4 | Batch 986/2891 | Timestep 12550 | LR 0.0001000000 | Loss 0.079261 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:10:21 Epoch 4 | Batch 996/2891 | Timestep 12560 | LR 0.0001000000 | Loss 0.003969 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:10:23 Epoch 4 | Batch 1006/2891 | Timestep 12570 | LR 0.0001000000 | Loss 0.018487 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:10:25 Epoch 4 | Batch 1016/2891 | Timestep 12580 | LR 0.0001000000 | Loss 0.050912 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:10:27 Epoch 4 | Batch 1026/2891 | Timestep 12590 | LR 0.0001000000 | Loss 0.011611 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:10:30 Epoch 4 | Batch 1036/2891 | Timestep 12600 | LR 0.0001000000 | Loss 0.054678 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:10:32 Epoch 4 | Batch 1046/2891 | Timestep 12610 | LR 0.0001000000 | Loss 0.074779 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:10:34 Epoch 4 | Batch 1056/2891 | Timestep 12620 | LR 0.0001000000 | Loss 0.047486 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:10:36 Epoch 4 | Batch 1066/2891 | Timestep 12630 | LR 0.0001000000 | Loss 0.040106 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:10:38 Epoch 4 | Batch 1076/2891 | Timestep 12640 | LR 0.0001000000 | Loss 0.050694 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:10:40 Epoch 4 | Batch 1086/2891 | Timestep 12650 | LR 0.0001000000 | Loss 0.023916 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:10:42 Epoch 4 | Batch 1096/2891 | Timestep 12660 | LR 0.0001000000 | Loss 0.062365 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:10:45 Epoch 4 | Batch 1106/2891 | Timestep 12670 | LR 0.0001000000 | Loss 0.092624 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:10:47 Epoch 4 | Batch 1116/2891 | Timestep 12680 | LR 0.0001000000 | Loss 0.101277 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:10:50 Epoch 4 | Batch 1126/2891 | Timestep 12690 | LR 0.0001000000 | Loss 0.050157 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:10:52 Epoch 4 | Batch 1136/2891 | Timestep 12700 | LR 0.0001000000 | Loss 0.036401 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:10:54 Epoch 4 | Batch 1146/2891 | Timestep 12710 | LR 0.0001000000 | Loss 0.009183 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:10:56 Epoch 4 | Batch 1156/2891 | Timestep 12720 | LR 0.0001000000 | Loss 0.007846 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:10:58 Epoch 4 | Batch 1166/2891 | Timestep 12730 | LR 0.0001000000 | Loss 0.025729 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:11:00 Epoch 4 | Batch 1176/2891 | Timestep 12740 | LR 0.0001000000 | Loss 0.026589 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:11:02 Epoch 4 | Batch 1186/2891 | Timestep 12750 | LR 0.0001000000 | Loss 0.014415 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:11:04 Epoch 4 | Batch 1196/2891 | Timestep 12760 | LR 0.0001000000 | Loss 0.023038 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:11:06 Epoch 4 | Batch 1206/2891 | Timestep 12770 | LR 0.0001000000 | Loss 0.089609 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:11:08 Epoch 4 | Batch 1216/2891 | Timestep 12780 | LR 0.0001000000 | Loss 0.156523 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:11:11 Epoch 4 | Batch 1226/2891 | Timestep 12790 | LR 0.0001000000 | Loss 0.007464 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:11:13 Epoch 4 | Batch 1236/2891 | Timestep 12800 | LR 0.0001000000 | Loss 0.076037 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:11:15 Epoch 4 | Batch 1246/2891 | Timestep 12810 | LR 0.0001000000 | Loss 0.020181 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:11:17 Epoch 4 | Batch 1256/2891 | Timestep 12820 | LR 0.0001000000 | Loss 0.066897 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:11:19 Epoch 4 | Batch 1266/2891 | Timestep 12830 | LR 0.0001000000 | Loss 0.048723 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:11:22 Epoch 4 | Batch 1276/2891 | Timestep 12840 | LR 0.0001000000 | Loss 0.071365 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:11:24 Epoch 4 | Batch 1286/2891 | Timestep 12850 | LR 0.0001000000 | Loss 1.474868 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:11:26 Epoch 4 | Batch 1296/2891 | Timestep 12860 | LR 0.0001000000 | Loss 2.038094 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:11:28 Epoch 4 | Batch 1306/2891 | Timestep 12870 | LR 0.0001000000 | Loss 36.890764 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:11:30 Epoch 4 | Batch 1316/2891 | Timestep 12880 | LR 0.0001000000 | Loss 23.979144 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:11:33 Epoch 4 | Batch 1326/2891 | Timestep 12890 | LR 0.0001000000 | Loss 43.795764 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:11:35 Epoch 4 | Batch 1336/2891 | Timestep 12900 | LR 0.0001000000 | Loss 38.075104 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:11:37 Epoch 4 | Batch 1346/2891 | Timestep 12910 | LR 0.0001000000 | Loss 38.485277 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:11:39 Epoch 4 | Batch 1356/2891 | Timestep 12920 | LR 0.0001000000 | Loss 38.796196 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:11:42 Epoch 4 | Batch 1366/2891 | Timestep 12930 | LR 0.0001000000 | Loss 38.243575 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:11:44 Epoch 4 | Batch 1376/2891 | Timestep 12940 | LR 0.0001000000 | Loss 46.002284 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:11:46 Epoch 4 | Batch 1386/2891 | Timestep 12950 | LR 0.0001000000 | Loss 52.681296 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:11:48 Epoch 4 | Batch 1396/2891 | Timestep 12960 | LR 0.0001000000 | Loss 34.309835 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:11:50 Epoch 4 | Batch 1406/2891 | Timestep 12970 | LR 0.0001000000 | Loss 34.222922 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:11:54 Epoch 4 | Batch 1416/2891 | Timestep 12980 | LR 0.0001000000 | Loss 35.880307 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:11:56 Epoch 4 | Batch 1426/2891 | Timestep 12990 | LR 0.0001000000 | Loss 38.709578 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:11:58 Epoch 4 | Batch 1436/2891 | Timestep 13000 | LR 0.0001000000 | Loss 41.229413 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:12:00 Epoch 4 | Batch 1446/2891 | Timestep 13010 | LR 0.0001000000 | Loss 39.325797 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:12:02 Epoch 4 | Batch 1456/2891 | Timestep 13020 | LR 0.0001000000 | Loss 36.325210 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:12:04 Epoch 4 | Batch 1466/2891 | Timestep 13030 | LR 0.0001000000 | Loss 42.374261 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:12:07 Epoch 4 | Batch 1476/2891 | Timestep 13040 | LR 0.0001000000 | Loss 37.639420 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:12:09 Epoch 4 | Batch 1486/2891 | Timestep 13050 | LR 0.0001000000 | Loss 36.935076 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:12:11 Epoch 4 | Batch 1496/2891 | Timestep 13060 | LR 0.0001000000 | Loss 40.393558 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:12:13 Epoch 4 | Batch 1506/2891 | Timestep 13070 | LR 0.0001000000 | Loss 45.973699 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:12:15 Epoch 4 | Batch 1516/2891 | Timestep 13080 | LR 0.0001000000 | Loss 38.221759 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:12:17 Epoch 4 | Batch 1526/2891 | Timestep 13090 | LR 0.0001000000 | Loss 32.577461 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:12:20 Epoch 4 | Batch 1536/2891 | Timestep 13100 | LR 0.0001000000 | Loss 35.746128 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:12:22 Epoch 4 | Batch 1546/2891 | Timestep 13110 | LR 0.0001000000 | Loss 40.046181 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:12:24 Epoch 4 | Batch 1556/2891 | Timestep 13120 | LR 0.0001000000 | Loss 42.844560 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:12:26 Epoch 4 | Batch 1566/2891 | Timestep 13130 | LR 0.0001000000 | Loss 31.952413 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:12:28 Epoch 4 | Batch 1576/2891 | Timestep 13140 | LR 0.0001000000 | Loss 38.493805 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:12:30 Epoch 4 | Batch 1586/2891 | Timestep 13150 | LR 0.0001000000 | Loss 37.807597 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:12:32 Epoch 4 | Batch 1596/2891 | Timestep 13160 | LR 0.0001000000 | Loss 41.013400 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:12:35 Epoch 4 | Batch 1606/2891 | Timestep 13170 | LR 0.0001000000 | Loss 37.864160 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:12:37 Epoch 4 | Batch 1616/2891 | Timestep 13180 | LR 0.0001000000 | Loss 36.979077 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:12:39 Epoch 4 | Batch 1626/2891 | Timestep 13190 | LR 0.0001000000 | Loss 38.742757 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:12:41 Epoch 4 | Batch 1636/2891 | Timestep 13200 | LR 0.0001000000 | Loss 37.383962 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:12:44 Epoch 4 | Batch 1646/2891 | Timestep 13210 | LR 0.0001000000 | Loss 39.185381 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:12:47 Epoch 4 | Batch 1656/2891 | Timestep 13220 | LR 0.0001000000 | Loss 37.504998 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:12:49 Epoch 4 | Batch 1666/2891 | Timestep 13230 | LR 0.0001000000 | Loss 39.523368 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:12:51 Epoch 4 | Batch 1676/2891 | Timestep 13240 | LR 0.0001000000 | Loss 37.979240 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:12:53 Epoch 4 | Batch 1686/2891 | Timestep 13250 | LR 0.0001000000 | Loss 38.328329 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:12:56 Epoch 4 | Batch 1696/2891 | Timestep 13260 | LR 0.0001000000 | Loss 35.286023 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:12:58 Epoch 4 | Batch 1706/2891 | Timestep 13270 | LR 0.0001000000 | Loss 38.125037 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:13:00 Epoch 4 | Batch 1716/2891 | Timestep 13280 | LR 0.0001000000 | Loss 38.662142 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:13:02 Epoch 4 | Batch 1726/2891 | Timestep 13290 | LR 0.0001000000 | Loss 37.979282 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:13:04 Epoch 4 | Batch 1736/2891 | Timestep 13300 | LR 0.0001000000 | Loss 38.320423 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:13:06 Epoch 4 | Batch 1746/2891 | Timestep 13310 | LR 0.0001000000 | Loss 37.605371 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:13:09 Epoch 4 | Batch 1756/2891 | Timestep 13320 | LR 0.0001000000 | Loss 42.997982 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:13:11 Epoch 4 | Batch 1766/2891 | Timestep 13330 | LR 0.0001000000 | Loss 37.710431 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:13:13 Epoch 4 | Batch 1776/2891 | Timestep 13340 | LR 0.0001000000 | Loss 39.961959 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:13:15 Epoch 4 | Batch 1786/2891 | Timestep 13350 | LR 0.0001000000 | Loss 37.321168 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:13:18 Epoch 4 | Batch 1796/2891 | Timestep 13360 | LR 0.0001000000 | Loss 41.917208 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:13:20 Epoch 4 | Batch 1806/2891 | Timestep 13370 | LR 0.0001000000 | Loss 39.667884 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:13:22 Epoch 4 | Batch 1816/2891 | Timestep 13380 | LR 0.0001000000 | Loss 39.387778 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:13:24 Epoch 4 | Batch 1826/2891 | Timestep 13390 | LR 0.0001000000 | Loss 35.750632 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:13:26 Epoch 4 | Batch 1836/2891 | Timestep 13400 | LR 0.0001000000 | Loss 41.213529 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:13:28 Epoch 4 | Batch 1846/2891 | Timestep 13410 | LR 0.0001000000 | Loss 36.205628 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:13:30 Epoch 4 | Batch 1856/2891 | Timestep 13420 | LR 0.0001000000 | Loss 35.751044 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:13:32 Epoch 4 | Batch 1866/2891 | Timestep 13430 | LR 0.0001000000 | Loss 39.722930 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:13:34 Epoch 4 | Batch 1876/2891 | Timestep 13440 | LR 0.0001000000 | Loss 37.194817 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:13:36 Epoch 4 | Batch 1886/2891 | Timestep 13450 | LR 0.0001000000 | Loss 38.788370 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:13:38 Epoch 4 | Batch 1896/2891 | Timestep 13460 | LR 0.0001000000 | Loss 36.136851 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:13:41 Epoch 4 | Batch 1906/2891 | Timestep 13470 | LR 0.0001000000 | Loss 37.543942 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:13:43 Epoch 4 | Batch 1916/2891 | Timestep 13480 | LR 0.0001000000 | Loss 38.566108 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:13:45 Epoch 4 | Batch 1926/2891 | Timestep 13490 | LR 0.0001000000 | Loss 39.261147 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:13:48 Epoch 4 | Batch 1936/2891 | Timestep 13500 | LR 0.0001000000 | Loss 39.846757 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:13:50 Epoch 4 | Batch 1946/2891 | Timestep 13510 | LR 0.0001000000 | Loss 37.408045 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:13:52 Epoch 4 | Batch 1956/2891 | Timestep 13520 | LR 0.0001000000 | Loss 38.679787 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:13:54 Epoch 4 | Batch 1966/2891 | Timestep 13530 | LR 0.0001000000 | Loss 39.555091 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:13:56 Epoch 4 | Batch 1976/2891 | Timestep 13540 | LR 0.0001000000 | Loss 37.619881 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:13:59 Epoch 4 | Batch 1986/2891 | Timestep 13550 | LR 0.0001000000 | Loss 37.691877 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:14:01 Epoch 4 | Batch 1996/2891 | Timestep 13560 | LR 0.0001000000 | Loss 36.456033 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:14:03 Epoch 4 | Batch 2006/2891 | Timestep 13570 | LR 0.0001000000 | Loss 39.249873 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:14:05 Epoch 4 | Batch 2016/2891 | Timestep 13580 | LR 0.0001000000 | Loss 38.055484 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:14:07 Epoch 4 | Batch 2026/2891 | Timestep 13590 | LR 0.0001000000 | Loss 36.853525 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:14:09 Epoch 4 | Batch 2036/2891 | Timestep 13600 | LR 0.0001000000 | Loss 37.958513 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:14:12 Epoch 4 | Batch 2046/2891 | Timestep 13610 | LR 0.0001000000 | Loss 35.594434 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:14:14 Epoch 4 | Batch 2056/2891 | Timestep 13620 | LR 0.0001000000 | Loss 37.398104 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:14:16 Epoch 4 | Batch 2066/2891 | Timestep 13630 | LR 0.0001000000 | Loss 36.438641 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:14:18 Epoch 4 | Batch 2076/2891 | Timestep 13640 | LR 0.0001000000 | Loss 38.406678 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:14:20 Epoch 4 | Batch 2086/2891 | Timestep 13650 | LR 0.0001000000 | Loss 39.492311 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:14:22 Epoch 4 | Batch 2096/2891 | Timestep 13660 | LR 0.0001000000 | Loss 39.179467 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:14:25 Epoch 4 | Batch 2106/2891 | Timestep 13670 | LR 0.0001000000 | Loss 38.517553 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:14:27 Epoch 4 | Batch 2116/2891 | Timestep 13680 | LR 0.0001000000 | Loss 39.673297 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:14:29 Epoch 4 | Batch 2126/2891 | Timestep 13690 | LR 0.0001000000 | Loss 39.147688 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:14:31 Epoch 4 | Batch 2136/2891 | Timestep 13700 | LR 0.0001000000 | Loss 39.737539 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:14:33 Epoch 4 | Batch 2146/2891 | Timestep 13710 | LR 0.0001000000 | Loss 38.176411 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:14:35 Epoch 4 | Batch 2156/2891 | Timestep 13720 | LR 0.0001000000 | Loss 36.530706 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:14:37 Epoch 4 | Batch 2166/2891 | Timestep 13730 | LR 0.0001000000 | Loss 36.270138 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:14:39 Epoch 4 | Batch 2176/2891 | Timestep 13740 | LR 0.0001000000 | Loss 36.753610 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:14:42 Epoch 4 | Batch 2186/2891 | Timestep 13750 | LR 0.0001000000 | Loss 34.394848 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:14:44 Epoch 4 | Batch 2196/2891 | Timestep 13760 | LR 0.0001000000 | Loss 37.800897 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:14:46 Epoch 4 | Batch 2206/2891 | Timestep 13770 | LR 0.0001000000 | Loss 38.180290 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:14:49 Epoch 4 | Batch 2216/2891 | Timestep 13780 | LR 0.0001000000 | Loss 37.369457 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:14:51 Epoch 4 | Batch 2226/2891 | Timestep 13790 | LR 0.0001000000 | Loss 38.885795 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:14:54 Epoch 4 | Batch 2236/2891 | Timestep 13800 | LR 0.0001000000 | Loss 45.649643 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:14:56 Epoch 4 | Batch 2246/2891 | Timestep 13810 | LR 0.0001000000 | Loss 39.312797 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:14:58 Epoch 4 | Batch 2256/2891 | Timestep 13820 | LR 0.0001000000 | Loss 37.749000 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:15:00 Epoch 4 | Batch 2266/2891 | Timestep 13830 | LR 0.0001000000 | Loss 38.728291 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:15:02 Epoch 4 | Batch 2276/2891 | Timestep 13840 | LR 0.0001000000 | Loss 32.471138 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:15:05 Epoch 4 | Batch 2286/2891 | Timestep 13850 | LR 0.0001000000 | Loss 41.022947 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:15:07 Epoch 4 | Batch 2296/2891 | Timestep 13860 | LR 0.0001000000 | Loss 35.750710 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:15:09 Epoch 4 | Batch 2306/2891 | Timestep 13870 | LR 0.0001000000 | Loss 37.822609 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:15:11 Epoch 4 | Batch 2316/2891 | Timestep 13880 | LR 0.0001000000 | Loss 39.571777 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:15:13 Epoch 4 | Batch 2326/2891 | Timestep 13890 | LR 0.0001000000 | Loss 38.214774 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:15:15 Epoch 4 | Batch 2336/2891 | Timestep 13900 | LR 0.0001000000 | Loss 38.401242 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:15:17 Epoch 4 | Batch 2346/2891 | Timestep 13910 | LR 0.0001000000 | Loss 37.591990 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:15:20 Epoch 4 | Batch 2356/2891 | Timestep 13920 | LR 0.0001000000 | Loss 34.598627 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:15:22 Epoch 4 | Batch 2366/2891 | Timestep 13930 | LR 0.0001000000 | Loss 40.411901 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:15:24 Epoch 4 | Batch 2376/2891 | Timestep 13940 | LR 0.0001000000 | Loss 38.180458 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:15:26 Epoch 4 | Batch 2386/2891 | Timestep 13950 | LR 0.0001000000 | Loss 37.348970 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:15:28 Epoch 4 | Batch 2396/2891 | Timestep 13960 | LR 0.0001000000 | Loss 38.235097 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:15:30 Epoch 4 | Batch 2406/2891 | Timestep 13970 | LR 0.0001000000 | Loss 38.081175 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:15:32 Epoch 4 | Batch 2416/2891 | Timestep 13980 | LR 0.0001000000 | Loss 39.781120 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:15:34 Epoch 4 | Batch 2426/2891 | Timestep 13990 | LR 0.0001000000 | Loss 38.425808 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:15:36 Epoch 4 | Batch 2436/2891 | Timestep 14000 | LR 0.0001000000 | Loss 35.575988 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:15:38 Epoch 4 | Batch 2446/2891 | Timestep 14010 | LR 0.0001000000 | Loss 37.783477 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:15:40 Epoch 4 | Batch 2456/2891 | Timestep 14020 | LR 0.0001000000 | Loss 35.536390 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:15:42 Epoch 4 | Batch 2466/2891 | Timestep 14030 | LR 0.0001000000 | Loss 37.665343 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:15:44 Epoch 4 | Batch 2476/2891 | Timestep 14040 | LR 0.0001000000 | Loss 38.469892 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:15:46 Epoch 4 | Batch 2486/2891 | Timestep 14050 | LR 0.0001000000 | Loss 39.735486 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:15:48 Epoch 4 | Batch 2496/2891 | Timestep 14060 | LR 0.0001000000 | Loss 38.482689 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:15:50 Epoch 4 | Batch 2506/2891 | Timestep 14070 | LR 0.0001000000 | Loss 38.441507 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:15:52 Epoch 4 | Batch 2516/2891 | Timestep 14080 | LR 0.0001000000 | Loss 37.097808 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:15:54 Epoch 4 | Batch 2526/2891 | Timestep 14090 | LR 0.0001000000 | Loss 38.200313 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:15:56 Epoch 4 | Batch 2536/2891 | Timestep 14100 | LR 0.0001000000 | Loss 37.972707 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:15:58 Epoch 4 | Batch 2546/2891 | Timestep 14110 | LR 0.0001000000 | Loss 39.633880 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:16:00 Epoch 4 | Batch 2556/2891 | Timestep 14120 | LR 0.0001000000 | Loss 35.522287 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:16:03 Epoch 4 | Batch 2566/2891 | Timestep 14130 | LR 0.0001000000 | Loss 40.492847 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:16:05 Epoch 4 | Batch 2576/2891 | Timestep 14140 | LR 0.0001000000 | Loss 39.702161 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:16:07 Epoch 4 | Batch 2586/2891 | Timestep 14150 | LR 0.0001000000 | Loss 35.705266 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:16:10 Epoch 4 | Batch 2596/2891 | Timestep 14160 | LR 0.0001000000 | Loss 41.697620 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:16:12 Epoch 4 | Batch 2606/2891 | Timestep 14170 | LR 0.0001000000 | Loss 34.292415 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:16:14 Epoch 4 | Batch 2616/2891 | Timestep 14180 | LR 0.0001000000 | Loss 36.851241 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:16:16 Epoch 4 | Batch 2626/2891 | Timestep 14190 | LR 0.0001000000 | Loss 39.536156 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:16:18 Epoch 4 | Batch 2636/2891 | Timestep 14200 | LR 0.0001000000 | Loss 36.527038 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:16:20 Epoch 4 | Batch 2646/2891 | Timestep 14210 | LR 0.0001000000 | Loss 36.437604 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:16:23 Epoch 4 | Batch 2656/2891 | Timestep 14220 | LR 0.0001000000 | Loss 39.595350 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:16:25 Epoch 4 | Batch 2666/2891 | Timestep 14230 | LR 0.0001000000 | Loss 34.443948 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:16:27 Epoch 4 | Batch 2676/2891 | Timestep 14240 | LR 0.0001000000 | Loss 37.024343 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:16:29 Epoch 4 | Batch 2686/2891 | Timestep 14250 | LR 0.0001000000 | Loss 36.374735 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:16:32 Epoch 4 | Batch 2696/2891 | Timestep 14260 | LR 0.0001000000 | Loss 35.942625 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:16:34 Epoch 4 | Batch 2706/2891 | Timestep 14270 | LR 0.0001000000 | Loss 41.267206 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:16:36 Epoch 4 | Batch 2716/2891 | Timestep 14280 | LR 0.0001000000 | Loss 39.016218 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:16:38 Epoch 4 | Batch 2726/2891 | Timestep 14290 | LR 0.0001000000 | Loss 37.886394 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:16:41 Epoch 4 | Batch 2736/2891 | Timestep 14300 | LR 0.0001000000 | Loss 36.714451 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:16:43 Epoch 4 | Batch 2746/2891 | Timestep 14310 | LR 0.0001000000 | Loss 37.437588 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:16:45 Epoch 4 | Batch 2756/2891 | Timestep 14320 | LR 0.0001000000 | Loss 37.768449 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:16:47 Epoch 4 | Batch 2766/2891 | Timestep 14330 | LR 0.0001000000 | Loss 36.082767 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:16:50 Epoch 4 | Batch 2776/2891 | Timestep 14340 | LR 0.0001000000 | Loss 39.502688 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:16:52 Epoch 4 | Batch 2786/2891 | Timestep 14350 | LR 0.0001000000 | Loss 41.760023 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:16:54 Epoch 4 | Batch 2796/2891 | Timestep 14360 | LR 0.0001000000 | Loss 36.638792 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:16:56 Epoch 4 | Batch 2806/2891 | Timestep 14370 | LR 0.0001000000 | Loss 37.670463 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:16:59 Epoch 4 | Batch 2816/2891 | Timestep 14380 | LR 0.0001000000 | Loss 39.064599 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:17:01 Epoch 4 | Batch 2826/2891 | Timestep 14390 | LR 0.0001000000 | Loss 42.086214 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:17:04 Epoch 4 | Batch 2836/2891 | Timestep 14400 | LR 0.0001000000 | Loss 36.956379 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:17:06 Epoch 4 | Batch 2846/2891 | Timestep 14410 | LR 0.0001000000 | Loss 35.692210 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:17:08 Epoch 4 | Batch 2856/2891 | Timestep 14420 | LR 0.0001000000 | Loss 35.226617 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:17:10 Epoch 4 | Batch 2866/2891 | Timestep 14430 | LR 0.0001000000 | Loss 38.656978 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:17:12 Epoch 4 | Batch 2876/2891 | Timestep 14440 | LR 0.0001000000 | Loss 37.285775 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:17:15 Epoch 4 | Batch 2886/2891 | Timestep 14450 | LR 0.0001000000 | Loss 37.385915 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:17:16 ** Evaluating on validation dataset ** +INFO root Tue, 26 Mar 2024 19:18:58 + precision recall f1-score support + + BOUNDARY 0.0000 0.0000 0.0000 4 + BUILDING-OR-GROUNDS 0.0000 0.0000 0.0000 104 + CAMP 0.0000 0.0000 0.0000 71 + CARDINAL 0.0000 0.0000 0.0000 170 + CLUSTER 0.0000 0.0000 0.0000 26 + COM 0.0000 0.0000 0.0000 39 + CONTINENT 0.0000 0.0000 0.0000 23 + COUNTRY 0.0000 0.0000 0.0000 835 + CURR 0.0000 0.0000 0.0000 24 + DATE 0.0000 0.0000 0.0000 1691 + EDU 0.0000 0.0000 0.0000 109 + ENT 0.0000 0.0000 0.0000 1 + EVENT 0.0000 0.0000 0.0000 292 + FAC 0.0000 0.0000 0.0000 111 + GOV 0.0000 0.0000 0.0000 860 + GPE 0.0000 0.0000 0.0000 2261 + GPE_ORG 0.0000 0.0000 0.0000 167 + LAND-REGION-NATURAL 0.0000 0.0000 0.0000 52 + LANGUAGE 0.0000 0.0000 0.0000 16 + LAW 0.0000 0.0000 0.0000 47 + LOC 0.0000 0.0000 0.0000 127 + MED 0.0000 0.0000 0.0000 419 + MONEY 0.0000 0.0000 0.0000 22 + NEIGHBORHOOD 0.0000 0.0000 0.0000 5 + NONGOV 0.0000 0.0000 0.0000 571 + NORP 0.0000 0.0000 0.0000 551 + OCC 0.0000 0.0000 0.0000 522 + ORDINAL 0.0000 0.0000 0.0000 544 + ORG 0.0000 0.0000 0.0000 1790 + ORG_FAC 0.0000 0.0000 0.0000 7 + PATH 0.0000 0.0000 0.0000 6 + PERCENT 0.0000 0.0000 0.0000 12 + PERS 0.0000 0.0000 0.0000 679 + PRODUCT 0.0000 0.0000 0.0000 8 + QUANTITY 0.0000 0.0000 0.0000 3 + REGION-GENERAL 0.0000 0.0000 0.0000 37 +REGION-INTERNATIONAL 0.0000 0.0000 0.0000 12 + REL 0.0000 0.0000 0.0000 10 + SCI 0.0000 0.0000 0.0000 13 + SPO 0.0000 0.0000 0.0000 2 + SPORT 0.0000 0.0000 0.0000 4 + STATE-OR-PROVINCE 0.0000 0.0000 0.0000 179 + SUBAREA-FACILITY 0.0000 0.0000 0.0000 16 + TIME 0.0000 0.0000 0.0000 33 + TOWN 0.0000 0.0000 0.0000 1217 + UNIT 0.0000 0.0000 0.0000 4 + WATER-BODY 0.0000 0.0000 0.0000 14 + WEBSITE 0.0000 0.0000 0.0000 80 + pad> 0.0000 0.0000 0.0000 0 + + micro avg 0.0000 0.0000 0.0000 13790 + macro avg 0.0000 0.0000 0.0000 13790 + weighted avg 0.0000 0.0000 0.0000 13790 + +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:20:02 Epoch 4 | Timestep 14455 | Train Loss 21.243065 | Val Loss 39.250843 | F1 0.000000 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:20:04 Epoch 5 | Batch 5/2891 | Timestep 14460 | LR 0.0001000000 | Loss 36.791951 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:20:05 Epoch 5 | Batch 15/2891 | Timestep 14470 | LR 0.0001000000 | Loss 42.381456 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:20:08 Epoch 5 | Batch 25/2891 | Timestep 14480 | LR 0.0001000000 | Loss 36.298883 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:20:10 Epoch 5 | Batch 35/2891 | Timestep 14490 | LR 0.0001000000 | Loss 38.342771 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:20:12 Epoch 5 | Batch 45/2891 | Timestep 14500 | LR 0.0001000000 | Loss 34.630823 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:20:14 Epoch 5 | Batch 55/2891 | Timestep 14510 | LR 0.0001000000 | Loss 36.572476 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:20:16 Epoch 5 | Batch 65/2891 | Timestep 14520 | LR 0.0001000000 | Loss 38.442303 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:20:19 Epoch 5 | Batch 75/2891 | Timestep 14530 | LR 0.0001000000 | Loss 37.856288 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:20:20 Epoch 5 | Batch 85/2891 | Timestep 14540 | LR 0.0001000000 | Loss 39.837517 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:20:23 Epoch 5 | Batch 95/2891 | Timestep 14550 | LR 0.0001000000 | Loss 39.226579 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:20:24 Epoch 5 | Batch 105/2891 | Timestep 14560 | LR 0.0001000000 | Loss 38.634520 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:20:26 Epoch 5 | Batch 115/2891 | Timestep 14570 | LR 0.0001000000 | Loss 38.071981 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:20:29 Epoch 5 | Batch 125/2891 | Timestep 14580 | LR 0.0001000000 | Loss 35.175665 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:20:31 Epoch 5 | Batch 135/2891 | Timestep 14590 | LR 0.0001000000 | Loss 36.017551 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:20:33 Epoch 5 | Batch 145/2891 | Timestep 14600 | LR 0.0001000000 | Loss 38.085633 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:20:35 Epoch 5 | Batch 155/2891 | Timestep 14610 | LR 0.0001000000 | Loss 38.332153 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:20:37 Epoch 5 | Batch 165/2891 | Timestep 14620 | LR 0.0001000000 | Loss 37.238171 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:20:39 Epoch 5 | Batch 175/2891 | Timestep 14630 | LR 0.0001000000 | Loss 39.829070 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:20:41 Epoch 5 | Batch 185/2891 | Timestep 14640 | LR 0.0001000000 | Loss 37.110368 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:20:43 Epoch 5 | Batch 195/2891 | Timestep 14650 | LR 0.0001000000 | Loss 37.195692 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:20:45 Epoch 5 | Batch 205/2891 | Timestep 14660 | LR 0.0001000000 | Loss 41.414617 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:20:48 Epoch 5 | Batch 215/2891 | Timestep 14670 | LR 0.0001000000 | Loss 39.887106 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:20:50 Epoch 5 | Batch 225/2891 | Timestep 14680 | LR 0.0001000000 | Loss 37.767171 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:20:52 Epoch 5 | Batch 235/2891 | Timestep 14690 | LR 0.0001000000 | Loss 39.773875 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:20:55 Epoch 5 | Batch 245/2891 | Timestep 14700 | LR 0.0001000000 | Loss 40.842917 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:20:56 Epoch 5 | Batch 255/2891 | Timestep 14710 | LR 0.0001000000 | Loss 37.846301 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:20:59 Epoch 5 | Batch 265/2891 | Timestep 14720 | LR 0.0001000000 | Loss 38.007880 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:21:01 Epoch 5 | Batch 275/2891 | Timestep 14730 | LR 0.0001000000 | Loss 37.792907 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:21:03 Epoch 5 | Batch 285/2891 | Timestep 14740 | LR 0.0001000000 | Loss 36.366935 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:21:05 Epoch 5 | Batch 295/2891 | Timestep 14750 | LR 0.0001000000 | Loss 38.731992 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:21:08 Epoch 5 | Batch 305/2891 | Timestep 14760 | LR 0.0001000000 | Loss 38.341171 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:21:10 Epoch 5 | Batch 315/2891 | Timestep 14770 | LR 0.0001000000 | Loss 38.404587 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:21:12 Epoch 5 | Batch 325/2891 | Timestep 14780 | LR 0.0001000000 | Loss 37.011200 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:21:14 Epoch 5 | Batch 335/2891 | Timestep 14790 | LR 0.0001000000 | Loss 37.485997 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:21:16 Epoch 5 | Batch 345/2891 | Timestep 14800 | LR 0.0001000000 | Loss 36.936100 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:21:19 Epoch 5 | Batch 355/2891 | Timestep 14810 | LR 0.0001000000 | Loss 36.316143 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:21:21 Epoch 5 | Batch 365/2891 | Timestep 14820 | LR 0.0001000000 | Loss 41.280752 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:21:23 Epoch 5 | Batch 375/2891 | Timestep 14830 | LR 0.0001000000 | Loss 37.515208 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:21:25 Epoch 5 | Batch 385/2891 | Timestep 14840 | LR 0.0001000000 | Loss 36.598271 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:21:27 Epoch 5 | Batch 395/2891 | Timestep 14850 | LR 0.0001000000 | Loss 37.127461 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:21:30 Epoch 5 | Batch 405/2891 | Timestep 14860 | LR 0.0001000000 | Loss 37.682108 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:21:32 Epoch 5 | Batch 415/2891 | Timestep 14870 | LR 0.0001000000 | Loss 33.170265 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:21:35 Epoch 5 | Batch 425/2891 | Timestep 14880 | LR 0.0001000000 | Loss 38.476387 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:21:37 Epoch 5 | Batch 435/2891 | Timestep 14890 | LR 0.0001000000 | Loss 35.704178 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:21:39 Epoch 5 | Batch 445/2891 | Timestep 14900 | LR 0.0001000000 | Loss 37.970126 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:21:41 Epoch 5 | Batch 455/2891 | Timestep 14910 | LR 0.0001000000 | Loss 38.573344 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:21:43 Epoch 5 | Batch 465/2891 | Timestep 14920 | LR 0.0001000000 | Loss 38.213069 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:21:45 Epoch 5 | Batch 475/2891 | Timestep 14930 | LR 0.0001000000 | Loss 37.786120 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:21:48 Epoch 5 | Batch 485/2891 | Timestep 14940 | LR 0.0001000000 | Loss 32.277243 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:21:50 Epoch 5 | Batch 495/2891 | Timestep 14950 | LR 0.0001000000 | Loss 36.199019 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:21:52 Epoch 5 | Batch 505/2891 | Timestep 14960 | LR 0.0001000000 | Loss 38.936530 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:21:54 Epoch 5 | Batch 515/2891 | Timestep 14970 | LR 0.0001000000 | Loss 37.148157 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:21:56 Epoch 5 | Batch 525/2891 | Timestep 14980 | LR 0.0001000000 | Loss 37.545018 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:21:58 Epoch 5 | Batch 535/2891 | Timestep 14990 | LR 0.0001000000 | Loss 36.430467 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:22:01 Epoch 5 | Batch 545/2891 | Timestep 15000 | LR 0.0001000000 | Loss 31.943425 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:22:04 Epoch 5 | Batch 555/2891 | Timestep 15010 | LR 0.0001000000 | Loss 41.227834 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:22:05 Epoch 5 | Batch 565/2891 | Timestep 15020 | LR 0.0001000000 | Loss 38.436219 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:22:08 Epoch 5 | Batch 575/2891 | Timestep 15030 | LR 0.0001000000 | Loss 38.361396 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:22:10 Epoch 5 | Batch 585/2891 | Timestep 15040 | LR 0.0001000000 | Loss 38.504433 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:22:12 Epoch 5 | Batch 595/2891 | Timestep 15050 | LR 0.0001000000 | Loss 37.145682 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:22:14 Epoch 5 | Batch 605/2891 | Timestep 15060 | LR 0.0001000000 | Loss 37.693482 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:22:16 Epoch 5 | Batch 615/2891 | Timestep 15070 | LR 0.0001000000 | Loss 36.979251 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:22:19 Epoch 5 | Batch 625/2891 | Timestep 15080 | LR 0.0001000000 | Loss 36.605555 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:22:21 Epoch 5 | Batch 635/2891 | Timestep 15090 | LR 0.0001000000 | Loss 34.717820 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:22:23 Epoch 5 | Batch 645/2891 | Timestep 15100 | LR 0.0001000000 | Loss 36.982029 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:22:25 Epoch 5 | Batch 655/2891 | Timestep 15110 | LR 0.0001000000 | Loss 36.270484 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:22:27 Epoch 5 | Batch 665/2891 | Timestep 15120 | LR 0.0001000000 | Loss 38.779204 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:22:29 Epoch 5 | Batch 675/2891 | Timestep 15130 | LR 0.0001000000 | Loss 38.155310 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:22:31 Epoch 5 | Batch 685/2891 | Timestep 15140 | LR 0.0001000000 | Loss 36.740506 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:22:33 Epoch 5 | Batch 695/2891 | Timestep 15150 | LR 0.0001000000 | Loss 38.865043 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:22:36 Epoch 5 | Batch 705/2891 | Timestep 15160 | LR 0.0001000000 | Loss 41.060749 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:22:38 Epoch 5 | Batch 715/2891 | Timestep 15170 | LR 0.0001000000 | Loss 36.451131 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:22:40 Epoch 5 | Batch 725/2891 | Timestep 15180 | LR 0.0001000000 | Loss 37.341382 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:22:42 Epoch 5 | Batch 735/2891 | Timestep 15190 | LR 0.0001000000 | Loss 38.345945 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:22:44 Epoch 5 | Batch 745/2891 | Timestep 15200 | LR 0.0001000000 | Loss 38.256460 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:22:46 Epoch 5 | Batch 755/2891 | Timestep 15210 | LR 0.0001000000 | Loss 37.655762 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:22:49 Epoch 5 | Batch 765/2891 | Timestep 15220 | LR 0.0001000000 | Loss 38.301920 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:22:51 Epoch 5 | Batch 775/2891 | Timestep 15230 | LR 0.0001000000 | Loss 37.631177 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:22:53 Epoch 5 | Batch 785/2891 | Timestep 15240 | LR 0.0001000000 | Loss 37.928094 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:22:55 Epoch 5 | Batch 795/2891 | Timestep 15250 | LR 0.0001000000 | Loss 37.958269 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:22:57 Epoch 5 | Batch 805/2891 | Timestep 15260 | LR 0.0001000000 | Loss 35.742365 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:23:00 Epoch 5 | Batch 815/2891 | Timestep 15270 | LR 0.0001000000 | Loss 38.766328 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:23:02 Epoch 5 | Batch 825/2891 | Timestep 15280 | LR 0.0001000000 | Loss 39.533542 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:23:04 Epoch 5 | Batch 835/2891 | Timestep 15290 | LR 0.0001000000 | Loss 37.630063 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:23:06 Epoch 5 | Batch 845/2891 | Timestep 15300 | LR 0.0001000000 | Loss 37.344169 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:23:08 Epoch 5 | Batch 855/2891 | Timestep 15310 | LR 0.0001000000 | Loss 37.421824 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:23:11 Epoch 5 | Batch 865/2891 | Timestep 15320 | LR 0.0001000000 | Loss 37.368309 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:23:13 Epoch 5 | Batch 875/2891 | Timestep 15330 | LR 0.0001000000 | Loss 38.271491 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:23:15 Epoch 5 | Batch 885/2891 | Timestep 15340 | LR 0.0001000000 | Loss 38.819246 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:23:17 Epoch 5 | Batch 895/2891 | Timestep 15350 | LR 0.0001000000 | Loss 37.379690 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:23:19 Epoch 5 | Batch 905/2891 | Timestep 15360 | LR 0.0001000000 | Loss 37.071852 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:23:21 Epoch 5 | Batch 915/2891 | Timestep 15370 | LR 0.0001000000 | Loss 36.921395 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:23:23 Epoch 5 | Batch 925/2891 | Timestep 15380 | LR 0.0001000000 | Loss 35.773002 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:23:25 Epoch 5 | Batch 935/2891 | Timestep 15390 | LR 0.0001000000 | Loss 41.274838 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:23:27 Epoch 5 | Batch 945/2891 | Timestep 15400 | LR 0.0001000000 | Loss 38.611748 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:23:29 Epoch 5 | Batch 955/2891 | Timestep 15410 | LR 0.0001000000 | Loss 37.635545 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:23:32 Epoch 5 | Batch 965/2891 | Timestep 15420 | LR 0.0001000000 | Loss 37.739965 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:23:34 Epoch 5 | Batch 975/2891 | Timestep 15430 | LR 0.0001000000 | Loss 36.276362 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:23:36 Epoch 5 | Batch 985/2891 | Timestep 15440 | LR 0.0001000000 | Loss 38.580377 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:23:38 Epoch 5 | Batch 995/2891 | Timestep 15450 | LR 0.0001000000 | Loss 35.776962 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:23:40 Epoch 5 | Batch 1005/2891 | Timestep 15460 | LR 0.0001000000 | Loss 38.820647 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:23:43 Epoch 5 | Batch 1015/2891 | Timestep 15470 | LR 0.0001000000 | Loss 36.813762 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:23:45 Epoch 5 | Batch 1025/2891 | Timestep 15480 | LR 0.0001000000 | Loss 38.017941 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:23:47 Epoch 5 | Batch 1035/2891 | Timestep 15490 | LR 0.0001000000 | Loss 35.451078 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:23:50 Epoch 5 | Batch 1045/2891 | Timestep 15500 | LR 0.0001000000 | Loss 33.587237 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:23:52 Epoch 5 | Batch 1055/2891 | Timestep 15510 | LR 0.0001000000 | Loss 39.426698 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:23:54 Epoch 5 | Batch 1065/2891 | Timestep 15520 | LR 0.0001000000 | Loss 38.819988 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:23:56 Epoch 5 | Batch 1075/2891 | Timestep 15530 | LR 0.0001000000 | Loss 37.601447 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:23:59 Epoch 5 | Batch 1085/2891 | Timestep 15540 | LR 0.0001000000 | Loss 39.042170 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:24:01 Epoch 5 | Batch 1095/2891 | Timestep 15550 | LR 0.0001000000 | Loss 38.195837 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:24:03 Epoch 5 | Batch 1105/2891 | Timestep 15560 | LR 0.0001000000 | Loss 37.200771 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:24:05 Epoch 5 | Batch 1115/2891 | Timestep 15570 | LR 0.0001000000 | Loss 40.044068 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:24:07 Epoch 5 | Batch 1125/2891 | Timestep 15580 | LR 0.0001000000 | Loss 36.106538 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:24:09 Epoch 5 | Batch 1135/2891 | Timestep 15590 | LR 0.0001000000 | Loss 38.201438 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:24:11 Epoch 5 | Batch 1145/2891 | Timestep 15600 | LR 0.0001000000 | Loss 37.723035 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:24:13 Epoch 5 | Batch 1155/2891 | Timestep 15610 | LR 0.0001000000 | Loss 37.440107 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:24:15 Epoch 5 | Batch 1165/2891 | Timestep 15620 | LR 0.0001000000 | Loss 38.606173 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:24:18 Epoch 5 | Batch 1175/2891 | Timestep 15630 | LR 0.0001000000 | Loss 36.302648 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:24:20 Epoch 5 | Batch 1185/2891 | Timestep 15640 | LR 0.0001000000 | Loss 37.218026 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:24:22 Epoch 5 | Batch 1195/2891 | Timestep 15650 | LR 0.0001000000 | Loss 43.348680 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:24:24 Epoch 5 | Batch 1205/2891 | Timestep 15660 | LR 0.0001000000 | Loss 46.683793 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:24:26 Epoch 5 | Batch 1215/2891 | Timestep 15670 | LR 0.0001000000 | Loss 42.909451 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:24:28 Epoch 5 | Batch 1225/2891 | Timestep 15680 | LR 0.0001000000 | Loss 38.837933 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:24:30 Epoch 5 | Batch 1235/2891 | Timestep 15690 | LR 0.0001000000 | Loss 38.044862 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:24:32 Epoch 5 | Batch 1245/2891 | Timestep 15700 | LR 0.0001000000 | Loss 38.206369 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:24:34 Epoch 5 | Batch 1255/2891 | Timestep 15710 | LR 0.0001000000 | Loss 37.183257 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:24:37 Epoch 5 | Batch 1265/2891 | Timestep 15720 | LR 0.0001000000 | Loss 37.981099 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:24:39 Epoch 5 | Batch 1275/2891 | Timestep 15730 | LR 0.0001000000 | Loss 41.652118 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:24:41 Epoch 5 | Batch 1285/2891 | Timestep 15740 | LR 0.0001000000 | Loss 36.947406 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:24:43 Epoch 5 | Batch 1295/2891 | Timestep 15750 | LR 0.0001000000 | Loss 37.109647 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:24:45 Epoch 5 | Batch 1305/2891 | Timestep 15760 | LR 0.0001000000 | Loss 39.960331 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:24:47 Epoch 5 | Batch 1315/2891 | Timestep 15770 | LR 0.0001000000 | Loss 37.168671 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:24:49 Epoch 5 | Batch 1325/2891 | Timestep 15780 | LR 0.0001000000 | Loss 38.456128 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:24:51 Epoch 5 | Batch 1335/2891 | Timestep 15790 | LR 0.0001000000 | Loss 37.988395 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:24:53 Epoch 5 | Batch 1345/2891 | Timestep 15800 | LR 0.0001000000 | Loss 38.142577 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:24:56 Epoch 5 | Batch 1355/2891 | Timestep 15810 | LR 0.0001000000 | Loss 36.772492 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:24:58 Epoch 5 | Batch 1365/2891 | Timestep 15820 | LR 0.0001000000 | Loss 37.184500 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:25:00 Epoch 5 | Batch 1375/2891 | Timestep 15830 | LR 0.0001000000 | Loss 37.828450 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:25:02 Epoch 5 | Batch 1385/2891 | Timestep 15840 | LR 0.0001000000 | Loss 37.177808 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:25:04 Epoch 5 | Batch 1395/2891 | Timestep 15850 | LR 0.0001000000 | Loss 37.200208 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:25:06 Epoch 5 | Batch 1405/2891 | Timestep 15860 | LR 0.0001000000 | Loss 36.674434 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:25:09 Epoch 5 | Batch 1415/2891 | Timestep 15870 | LR 0.0001000000 | Loss 36.734755 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:25:11 Epoch 5 | Batch 1425/2891 | Timestep 15880 | LR 0.0001000000 | Loss 37.338110 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:25:13 Epoch 5 | Batch 1435/2891 | Timestep 15890 | LR 0.0001000000 | Loss 38.201354 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:25:15 Epoch 5 | Batch 1445/2891 | Timestep 15900 | LR 0.0001000000 | Loss 38.228845 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:25:17 Epoch 5 | Batch 1455/2891 | Timestep 15910 | LR 0.0001000000 | Loss 37.330312 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:25:19 Epoch 5 | Batch 1465/2891 | Timestep 15920 | LR 0.0001000000 | Loss 37.577699 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:25:21 Epoch 5 | Batch 1475/2891 | Timestep 15930 | LR 0.0001000000 | Loss 39.839729 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:25:23 Epoch 5 | Batch 1485/2891 | Timestep 15940 | LR 0.0001000000 | Loss 37.827953 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:25:25 Epoch 5 | Batch 1495/2891 | Timestep 15950 | LR 0.0001000000 | Loss 37.665831 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:25:27 Epoch 5 | Batch 1505/2891 | Timestep 15960 | LR 0.0001000000 | Loss 38.416737 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:25:29 Epoch 5 | Batch 1515/2891 | Timestep 15970 | LR 0.0001000000 | Loss 36.085437 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:25:32 Epoch 5 | Batch 1525/2891 | Timestep 15980 | LR 0.0001000000 | Loss 38.057964 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:25:33 Epoch 5 | Batch 1535/2891 | Timestep 15990 | LR 0.0001000000 | Loss 39.913543 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:25:36 Epoch 5 | Batch 1545/2891 | Timestep 16000 | LR 0.0001000000 | Loss 37.957793 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:25:38 Epoch 5 | Batch 1555/2891 | Timestep 16010 | LR 0.0001000000 | Loss 38.836501 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:25:40 Epoch 5 | Batch 1565/2891 | Timestep 16020 | LR 0.0001000000 | Loss 37.037787 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:25:42 Epoch 5 | Batch 1575/2891 | Timestep 16030 | LR 0.0001000000 | Loss 37.696930 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:25:45 Epoch 5 | Batch 1585/2891 | Timestep 16040 | LR 0.0001000000 | Loss 32.358839 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:25:47 Epoch 5 | Batch 1595/2891 | Timestep 16050 | LR 0.0001000000 | Loss 42.550738 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:25:49 Epoch 5 | Batch 1605/2891 | Timestep 16060 | LR 0.0001000000 | Loss 36.404908 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:25:51 Epoch 5 | Batch 1615/2891 | Timestep 16070 | LR 0.0001000000 | Loss 39.217483 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:25:54 Epoch 5 | Batch 1625/2891 | Timestep 16080 | LR 0.0001000000 | Loss 39.748820 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:25:56 Epoch 5 | Batch 1635/2891 | Timestep 16090 | LR 0.0001000000 | Loss 33.473357 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:25:58 Epoch 5 | Batch 1645/2891 | Timestep 16100 | LR 0.0001000000 | Loss 39.106064 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:26:01 Epoch 5 | Batch 1655/2891 | Timestep 16110 | LR 0.0001000000 | Loss 37.038657 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:26:03 Epoch 5 | Batch 1665/2891 | Timestep 16120 | LR 0.0001000000 | Loss 38.227976 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:26:05 Epoch 5 | Batch 1675/2891 | Timestep 16130 | LR 0.0001000000 | Loss 38.192439 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:26:07 Epoch 5 | Batch 1685/2891 | Timestep 16140 | LR 0.0001000000 | Loss 38.440294 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:26:09 Epoch 5 | Batch 1695/2891 | Timestep 16150 | LR 0.0001000000 | Loss 40.435574 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:26:11 Epoch 5 | Batch 1705/2891 | Timestep 16160 | LR 0.0001000000 | Loss 39.062826 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:26:13 Epoch 5 | Batch 1715/2891 | Timestep 16170 | LR 0.0001000000 | Loss 40.461467 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:26:16 Epoch 5 | Batch 1725/2891 | Timestep 16180 | LR 0.0001000000 | Loss 35.129604 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:26:18 Epoch 5 | Batch 1735/2891 | Timestep 16190 | LR 0.0001000000 | Loss 39.707678 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:26:20 Epoch 5 | Batch 1745/2891 | Timestep 16200 | LR 0.0001000000 | Loss 38.229938 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:26:23 Epoch 5 | Batch 1755/2891 | Timestep 16210 | LR 0.0001000000 | Loss 37.056226 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:26:25 Epoch 5 | Batch 1765/2891 | Timestep 16220 | LR 0.0001000000 | Loss 37.897086 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:26:27 Epoch 5 | Batch 1775/2891 | Timestep 16230 | LR 0.0001000000 | Loss 36.716923 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:26:29 Epoch 5 | Batch 1785/2891 | Timestep 16240 | LR 0.0001000000 | Loss 34.511259 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:26:32 Epoch 5 | Batch 1795/2891 | Timestep 16250 | LR 0.0001000000 | Loss 37.161708 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:26:34 Epoch 5 | Batch 1805/2891 | Timestep 16260 | LR 0.0001000000 | Loss 34.911369 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:26:36 Epoch 5 | Batch 1815/2891 | Timestep 16270 | LR 0.0001000000 | Loss 37.339382 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:26:38 Epoch 5 | Batch 1825/2891 | Timestep 16280 | LR 0.0001000000 | Loss 36.911644 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:26:40 Epoch 5 | Batch 1835/2891 | Timestep 16290 | LR 0.0001000000 | Loss 38.361710 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:26:42 Epoch 5 | Batch 1845/2891 | Timestep 16300 | LR 0.0001000000 | Loss 36.447817 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:26:44 Epoch 5 | Batch 1855/2891 | Timestep 16310 | LR 0.0001000000 | Loss 38.865011 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:26:47 Epoch 5 | Batch 1865/2891 | Timestep 16320 | LR 0.0001000000 | Loss 37.922873 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:26:49 Epoch 5 | Batch 1875/2891 | Timestep 16330 | LR 0.0001000000 | Loss 37.119204 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:26:51 Epoch 5 | Batch 1885/2891 | Timestep 16340 | LR 0.0001000000 | Loss 36.610476 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:26:53 Epoch 5 | Batch 1895/2891 | Timestep 16350 | LR 0.0001000000 | Loss 31.800199 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:26:55 Epoch 5 | Batch 1905/2891 | Timestep 16360 | LR 0.0001000000 | Loss 39.594597 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:26:58 Epoch 5 | Batch 1915/2891 | Timestep 16370 | LR 0.0001000000 | Loss 36.430048 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:27:00 Epoch 5 | Batch 1925/2891 | Timestep 16380 | LR 0.0001000000 | Loss 37.546841 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:27:03 Epoch 5 | Batch 1935/2891 | Timestep 16390 | LR 0.0001000000 | Loss 41.527190 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:27:05 Epoch 5 | Batch 1945/2891 | Timestep 16400 | LR 0.0001000000 | Loss 38.481127 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:27:07 Epoch 5 | Batch 1955/2891 | Timestep 16410 | LR 0.0001000000 | Loss 37.463211 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:27:09 Epoch 5 | Batch 1965/2891 | Timestep 16420 | LR 0.0001000000 | Loss 36.257690 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:27:11 Epoch 5 | Batch 1975/2891 | Timestep 16430 | LR 0.0001000000 | Loss 38.455494 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:27:13 Epoch 5 | Batch 1985/2891 | Timestep 16440 | LR 0.0001000000 | Loss 39.256956 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:27:15 Epoch 5 | Batch 1995/2891 | Timestep 16450 | LR 0.0001000000 | Loss 38.417663 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:27:18 Epoch 5 | Batch 2005/2891 | Timestep 16460 | LR 0.0001000000 | Loss 37.613423 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:27:20 Epoch 5 | Batch 2015/2891 | Timestep 16470 | LR 0.0001000000 | Loss 35.864372 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:27:22 Epoch 5 | Batch 2025/2891 | Timestep 16480 | LR 0.0001000000 | Loss 38.527275 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:27:24 Epoch 5 | Batch 2035/2891 | Timestep 16490 | LR 0.0001000000 | Loss 35.879706 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:27:26 Epoch 5 | Batch 2045/2891 | Timestep 16500 | LR 0.0001000000 | Loss 38.783441 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:27:29 Epoch 5 | Batch 2055/2891 | Timestep 16510 | LR 0.0001000000 | Loss 36.954367 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:27:31 Epoch 5 | Batch 2065/2891 | Timestep 16520 | LR 0.0001000000 | Loss 36.467012 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:27:33 Epoch 5 | Batch 2075/2891 | Timestep 16530 | LR 0.0001000000 | Loss 40.046598 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:27:36 Epoch 5 | Batch 2085/2891 | Timestep 16540 | LR 0.0001000000 | Loss 33.265885 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:27:38 Epoch 5 | Batch 2095/2891 | Timestep 16550 | LR 0.0001000000 | Loss 38.343765 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:27:40 Epoch 5 | Batch 2105/2891 | Timestep 16560 | LR 0.0001000000 | Loss 36.283720 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:27:42 Epoch 5 | Batch 2115/2891 | Timestep 16570 | LR 0.0001000000 | Loss 37.026133 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:27:44 Epoch 5 | Batch 2125/2891 | Timestep 16580 | LR 0.0001000000 | Loss 35.532192 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:27:46 Epoch 5 | Batch 2135/2891 | Timestep 16590 | LR 0.0001000000 | Loss 43.435840 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:27:48 Epoch 5 | Batch 2145/2891 | Timestep 16600 | LR 0.0001000000 | Loss 37.383389 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:27:50 Epoch 5 | Batch 2155/2891 | Timestep 16610 | LR 0.0001000000 | Loss 37.055711 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:27:52 Epoch 5 | Batch 2165/2891 | Timestep 16620 | LR 0.0001000000 | Loss 37.605040 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:27:54 Epoch 5 | Batch 2175/2891 | Timestep 16630 | LR 0.0001000000 | Loss 38.330141 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:27:57 Epoch 5 | Batch 2185/2891 | Timestep 16640 | LR 0.0001000000 | Loss 36.319690 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:27:59 Epoch 5 | Batch 2195/2891 | Timestep 16650 | LR 0.0001000000 | Loss 35.792329 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:28:01 Epoch 5 | Batch 2205/2891 | Timestep 16660 | LR 0.0001000000 | Loss 39.315050 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:28:03 Epoch 5 | Batch 2215/2891 | Timestep 16670 | LR 0.0001000000 | Loss 37.941096 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:28:05 Epoch 5 | Batch 2225/2891 | Timestep 16680 | LR 0.0001000000 | Loss 37.177763 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:28:07 Epoch 5 | Batch 2235/2891 | Timestep 16690 | LR 0.0001000000 | Loss 38.209883 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:28:09 Epoch 5 | Batch 2245/2891 | Timestep 16700 | LR 0.0001000000 | Loss 37.879824 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:28:11 Epoch 5 | Batch 2255/2891 | Timestep 16710 | LR 0.0001000000 | Loss 40.567013 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:28:14 Epoch 5 | Batch 2265/2891 | Timestep 16720 | LR 0.0001000000 | Loss 39.246567 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:28:16 Epoch 5 | Batch 2275/2891 | Timestep 16730 | LR 0.0001000000 | Loss 40.008566 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:28:19 Epoch 5 | Batch 2285/2891 | Timestep 16740 | LR 0.0001000000 | Loss 39.075627 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:28:21 Epoch 5 | Batch 2295/2891 | Timestep 16750 | LR 0.0001000000 | Loss 34.467166 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:28:23 Epoch 5 | Batch 2305/2891 | Timestep 16760 | LR 0.0001000000 | Loss 33.372122 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:28:25 Epoch 5 | Batch 2315/2891 | Timestep 16770 | LR 0.0001000000 | Loss 38.535809 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:28:28 Epoch 5 | Batch 2325/2891 | Timestep 16780 | LR 0.0001000000 | Loss 34.118558 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:28:30 Epoch 5 | Batch 2335/2891 | Timestep 16790 | LR 0.0001000000 | Loss 38.439458 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:28:32 Epoch 5 | Batch 2345/2891 | Timestep 16800 | LR 0.0001000000 | Loss 39.484875 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:28:34 Epoch 5 | Batch 2355/2891 | Timestep 16810 | LR 0.0001000000 | Loss 34.957910 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:28:37 Epoch 5 | Batch 2365/2891 | Timestep 16820 | LR 0.0001000000 | Loss 36.526053 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:28:39 Epoch 5 | Batch 2375/2891 | Timestep 16830 | LR 0.0001000000 | Loss 38.897278 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:28:41 Epoch 5 | Batch 2385/2891 | Timestep 16840 | LR 0.0001000000 | Loss 38.682297 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:28:43 Epoch 5 | Batch 2395/2891 | Timestep 16850 | LR 0.0001000000 | Loss 37.384760 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:28:46 Epoch 5 | Batch 2405/2891 | Timestep 16860 | LR 0.0001000000 | Loss 34.852639 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:28:48 Epoch 5 | Batch 2415/2891 | Timestep 16870 | LR 0.0001000000 | Loss 39.634456 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:28:50 Epoch 5 | Batch 2425/2891 | Timestep 16880 | LR 0.0001000000 | Loss 35.878294 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:28:52 Epoch 5 | Batch 2435/2891 | Timestep 16890 | LR 0.0001000000 | Loss 37.711689 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:28:55 Epoch 5 | Batch 2445/2891 | Timestep 16900 | LR 0.0001000000 | Loss 33.433071 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:28:57 Epoch 5 | Batch 2455/2891 | Timestep 16910 | LR 0.0001000000 | Loss 34.666624 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:28:59 Epoch 5 | Batch 2465/2891 | Timestep 16920 | LR 0.0001000000 | Loss 38.043995 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:29:01 Epoch 5 | Batch 2475/2891 | Timestep 16930 | LR 0.0001000000 | Loss 37.293765 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:29:04 Epoch 5 | Batch 2485/2891 | Timestep 16940 | LR 0.0001000000 | Loss 37.118530 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:29:06 Epoch 5 | Batch 2495/2891 | Timestep 16950 | LR 0.0001000000 | Loss 40.095118 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:29:08 Epoch 5 | Batch 2505/2891 | Timestep 16960 | LR 0.0001000000 | Loss 34.031887 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:29:10 Epoch 5 | Batch 2515/2891 | Timestep 16970 | LR 0.0001000000 | Loss 39.123084 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:29:12 Epoch 5 | Batch 2525/2891 | Timestep 16980 | LR 0.0001000000 | Loss 36.319511 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:29:15 Epoch 5 | Batch 2535/2891 | Timestep 16990 | LR 0.0001000000 | Loss 38.812885 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:29:17 Epoch 5 | Batch 2545/2891 | Timestep 17000 | LR 0.0001000000 | Loss 34.880534 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:29:19 Epoch 5 | Batch 2555/2891 | Timestep 17010 | LR 0.0001000000 | Loss 37.457147 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:29:21 Epoch 5 | Batch 2565/2891 | Timestep 17020 | LR 0.0001000000 | Loss 37.357728 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:29:23 Epoch 5 | Batch 2575/2891 | Timestep 17030 | LR 0.0001000000 | Loss 38.038553 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:29:25 Epoch 5 | Batch 2585/2891 | Timestep 17040 | LR 0.0001000000 | Loss 37.103464 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:29:27 Epoch 5 | Batch 2595/2891 | Timestep 17050 | LR 0.0001000000 | Loss 37.266058 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:29:30 Epoch 5 | Batch 2605/2891 | Timestep 17060 | LR 0.0001000000 | Loss 39.440273 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:29:32 Epoch 5 | Batch 2615/2891 | Timestep 17070 | LR 0.0001000000 | Loss 36.522139 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:29:35 Epoch 5 | Batch 2625/2891 | Timestep 17080 | LR 0.0001000000 | Loss 37.278518 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:29:37 Epoch 5 | Batch 2635/2891 | Timestep 17090 | LR 0.0001000000 | Loss 35.982416 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:29:39 Epoch 5 | Batch 2645/2891 | Timestep 17100 | LR 0.0001000000 | Loss 35.858397 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:29:41 Epoch 5 | Batch 2655/2891 | Timestep 17110 | LR 0.0001000000 | Loss 34.842259 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:29:43 Epoch 5 | Batch 2665/2891 | Timestep 17120 | LR 0.0001000000 | Loss 38.189390 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:29:46 Epoch 5 | Batch 2675/2891 | Timestep 17130 | LR 0.0001000000 | Loss 35.507753 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:29:48 Epoch 5 | Batch 2685/2891 | Timestep 17140 | LR 0.0001000000 | Loss 38.923047 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:29:50 Epoch 5 | Batch 2695/2891 | Timestep 17150 | LR 0.0001000000 | Loss 38.382357 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:29:52 Epoch 5 | Batch 2705/2891 | Timestep 17160 | LR 0.0001000000 | Loss 39.116841 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:29:55 Epoch 5 | Batch 2715/2891 | Timestep 17170 | LR 0.0001000000 | Loss 36.689163 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:29:57 Epoch 5 | Batch 2725/2891 | Timestep 17180 | LR 0.0001000000 | Loss 36.869991 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:29:59 Epoch 5 | Batch 2735/2891 | Timestep 17190 | LR 0.0001000000 | Loss 40.765382 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:30:01 Epoch 5 | Batch 2745/2891 | Timestep 17200 | LR 0.0001000000 | Loss 38.645972 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:30:03 Epoch 5 | Batch 2755/2891 | Timestep 17210 | LR 0.0001000000 | Loss 37.142388 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:30:05 Epoch 5 | Batch 2765/2891 | Timestep 17220 | LR 0.0001000000 | Loss 36.969734 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:30:07 Epoch 5 | Batch 2775/2891 | Timestep 17230 | LR 0.0001000000 | Loss 35.877318 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:30:09 Epoch 5 | Batch 2785/2891 | Timestep 17240 | LR 0.0001000000 | Loss 35.534928 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:30:12 Epoch 5 | Batch 2795/2891 | Timestep 17250 | LR 0.0001000000 | Loss 38.958550 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:30:14 Epoch 5 | Batch 2805/2891 | Timestep 17260 | LR 0.0001000000 | Loss 42.326905 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:30:16 Epoch 5 | Batch 2815/2891 | Timestep 17270 | LR 0.0001000000 | Loss 39.167566 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:30:18 Epoch 5 | Batch 2825/2891 | Timestep 17280 | LR 0.0001000000 | Loss 38.931619 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:30:20 Epoch 5 | Batch 2835/2891 | Timestep 17290 | LR 0.0001000000 | Loss 37.038122 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:30:23 Epoch 5 | Batch 2845/2891 | Timestep 17300 | LR 0.0001000000 | Loss 37.398333 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:30:25 Epoch 5 | Batch 2855/2891 | Timestep 17310 | LR 0.0001000000 | Loss 35.092499 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:30:28 Epoch 5 | Batch 2865/2891 | Timestep 17320 | LR 0.0001000000 | Loss 32.263283 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:30:30 Epoch 5 | Batch 2875/2891 | Timestep 17330 | LR 0.0001000000 | Loss 37.117801 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:30:32 Epoch 5 | Batch 2885/2891 | Timestep 17340 | LR 0.0001000000 | Loss 38.025140 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:30:33 ** Evaluating on validation dataset ** +INFO root Tue, 26 Mar 2024 19:32:15 + precision recall f1-score support + + BOUNDARY 0.0000 0.0000 0.0000 4 + BUILDING-OR-GROUNDS 0.0000 0.0000 0.0000 104 + CAMP 0.0000 0.0000 0.0000 71 + CARDINAL 0.0000 0.0000 0.0000 170 + CLUSTER 0.0000 0.0000 0.0000 26 + COM 0.0000 0.0000 0.0000 39 + CONTINENT 0.0000 0.0000 0.0000 23 + COUNTRY 0.0000 0.0000 0.0000 835 + CURR 0.0000 0.0000 0.0000 24 + DATE 0.0000 0.0000 0.0000 1691 + EDU 0.0000 0.0000 0.0000 109 + ENT 0.0000 0.0000 0.0000 1 + EVENT 0.0000 0.0000 0.0000 292 + FAC 0.0000 0.0000 0.0000 111 + GOV 0.0000 0.0000 0.0000 860 + GPE 0.0000 0.0000 0.0000 2261 + GPE_ORG 0.0000 0.0000 0.0000 167 + LAND-REGION-NATURAL 0.0000 0.0000 0.0000 52 + LANGUAGE 0.0000 0.0000 0.0000 16 + LAW 0.0000 0.0000 0.0000 47 + LOC 0.0000 0.0000 0.0000 127 + MED 0.0000 0.0000 0.0000 419 + MONEY 0.0000 0.0000 0.0000 22 + NEIGHBORHOOD 0.0000 0.0000 0.0000 5 + NONGOV 0.0000 0.0000 0.0000 571 + NORP 0.0000 0.0000 0.0000 551 + OCC 0.0000 0.0000 0.0000 522 + ORDINAL 0.0000 0.0000 0.0000 544 + ORG 0.0000 0.0000 0.0000 1790 + ORG_FAC 0.0000 0.0000 0.0000 7 + PATH 0.0000 0.0000 0.0000 6 + PERCENT 0.0000 0.0000 0.0000 12 + PERS 0.0000 0.0000 0.0000 679 + PRODUCT 0.0000 0.0000 0.0000 8 + QUANTITY 0.0000 0.0000 0.0000 3 + REGION-GENERAL 0.0000 0.0000 0.0000 37 +REGION-INTERNATIONAL 0.0000 0.0000 0.0000 12 + REL 0.0000 0.0000 0.0000 10 + SCI 0.0000 0.0000 0.0000 13 + SPO 0.0000 0.0000 0.0000 2 + SPORT 0.0000 0.0000 0.0000 4 + STATE-OR-PROVINCE 0.0000 0.0000 0.0000 179 + SUBAREA-FACILITY 0.0000 0.0000 0.0000 16 + TIME 0.0000 0.0000 0.0000 33 + TOWN 0.0000 0.0000 0.0000 1217 + UNIT 0.0000 0.0000 0.0000 4 + WATER-BODY 0.0000 0.0000 0.0000 14 + WEBSITE 0.0000 0.0000 0.0000 80 + pad> 0.0000 0.0000 0.0000 0 + + micro avg 0.0000 0.0000 0.0000 13790 + macro avg 0.0000 0.0000 0.0000 13790 + weighted avg 0.0000 0.0000 0.0000 13790 + +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:33:19 Epoch 5 | Timestep 17346 | Train Loss 37.553594 | Val Loss 38.780254 | F1 0.000000 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:33:20 Epoch 6 | Batch 4/2891 | Timestep 17350 | LR 0.0001000000 | Loss 37.676041 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:33:22 Epoch 6 | Batch 14/2891 | Timestep 17360 | LR 0.0001000000 | Loss 37.767049 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:33:24 Epoch 6 | Batch 24/2891 | Timestep 17370 | LR 0.0001000000 | Loss 36.198621 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:33:26 Epoch 6 | Batch 34/2891 | Timestep 17380 | LR 0.0001000000 | Loss 37.614416 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:33:28 Epoch 6 | Batch 44/2891 | Timestep 17390 | LR 0.0001000000 | Loss 38.490746 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:33:30 Epoch 6 | Batch 54/2891 | Timestep 17400 | LR 0.0001000000 | Loss 37.774131 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:33:33 Epoch 6 | Batch 64/2891 | Timestep 17410 | LR 0.0001000000 | Loss 39.107401 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:33:35 Epoch 6 | Batch 74/2891 | Timestep 17420 | LR 0.0001000000 | Loss 34.136596 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:33:37 Epoch 6 | Batch 84/2891 | Timestep 17430 | LR 0.0001000000 | Loss 35.993304 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:33:39 Epoch 6 | Batch 94/2891 | Timestep 17440 | LR 0.0001000000 | Loss 38.002414 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:33:41 Epoch 6 | Batch 104/2891 | Timestep 17450 | LR 0.0001000000 | Loss 36.269266 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:33:44 Epoch 6 | Batch 114/2891 | Timestep 17460 | LR 0.0001000000 | Loss 39.725256 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:33:45 Epoch 6 | Batch 124/2891 | Timestep 17470 | LR 0.0001000000 | Loss 38.536961 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:33:48 Epoch 6 | Batch 134/2891 | Timestep 17480 | LR 0.0001000000 | Loss 37.517839 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:33:50 Epoch 6 | Batch 144/2891 | Timestep 17490 | LR 0.0001000000 | Loss 37.979489 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:33:52 Epoch 6 | Batch 154/2891 | Timestep 17500 | LR 0.0001000000 | Loss 37.604110 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:33:54 Epoch 6 | Batch 164/2891 | Timestep 17510 | LR 0.0001000000 | Loss 37.967067 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:33:56 Epoch 6 | Batch 174/2891 | Timestep 17520 | LR 0.0001000000 | Loss 38.749771 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:33:58 Epoch 6 | Batch 184/2891 | Timestep 17530 | LR 0.0001000000 | Loss 35.315437 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:34:00 Epoch 6 | Batch 194/2891 | Timestep 17540 | LR 0.0001000000 | Loss 41.152663 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:34:03 Epoch 6 | Batch 204/2891 | Timestep 17550 | LR 0.0001000000 | Loss 36.852458 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:34:05 Epoch 6 | Batch 214/2891 | Timestep 17560 | LR 0.0001000000 | Loss 38.479942 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:34:07 Epoch 6 | Batch 224/2891 | Timestep 17570 | LR 0.0001000000 | Loss 40.306563 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:34:08 Epoch 6 | Batch 234/2891 | Timestep 17580 | LR 0.0001000000 | Loss 36.949919 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:34:11 Epoch 6 | Batch 244/2891 | Timestep 17590 | LR 0.0001000000 | Loss 37.371162 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:34:13 Epoch 6 | Batch 254/2891 | Timestep 17600 | LR 0.0001000000 | Loss 39.580944 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:34:15 Epoch 6 | Batch 264/2891 | Timestep 17610 | LR 0.0001000000 | Loss 38.933126 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:34:17 Epoch 6 | Batch 274/2891 | Timestep 17620 | LR 0.0001000000 | Loss 36.496463 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:34:20 Epoch 6 | Batch 284/2891 | Timestep 17630 | LR 0.0001000000 | Loss 36.780184 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:34:22 Epoch 6 | Batch 294/2891 | Timestep 17640 | LR 0.0001000000 | Loss 36.528777 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:34:24 Epoch 6 | Batch 304/2891 | Timestep 17650 | LR 0.0001000000 | Loss 37.648347 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:34:26 Epoch 6 | Batch 314/2891 | Timestep 17660 | LR 0.0001000000 | Loss 36.395946 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:34:28 Epoch 6 | Batch 324/2891 | Timestep 17670 | LR 0.0001000000 | Loss 35.898852 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:34:30 Epoch 6 | Batch 334/2891 | Timestep 17680 | LR 0.0001000000 | Loss 44.428446 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:34:32 Epoch 6 | Batch 344/2891 | Timestep 17690 | LR 0.0001000000 | Loss 38.616831 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:34:34 Epoch 6 | Batch 354/2891 | Timestep 17700 | LR 0.0001000000 | Loss 38.677730 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:34:36 Epoch 6 | Batch 364/2891 | Timestep 17710 | LR 0.0001000000 | Loss 37.199036 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:34:38 Epoch 6 | Batch 374/2891 | Timestep 17720 | LR 0.0001000000 | Loss 37.450320 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:34:40 Epoch 6 | Batch 384/2891 | Timestep 17730 | LR 0.0001000000 | Loss 37.508857 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:34:43 Epoch 6 | Batch 394/2891 | Timestep 17740 | LR 0.0001000000 | Loss 37.046152 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:34:45 Epoch 6 | Batch 404/2891 | Timestep 17750 | LR 0.0001000000 | Loss 36.978955 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:34:47 Epoch 6 | Batch 414/2891 | Timestep 17760 | LR 0.0001000000 | Loss 37.607996 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:34:49 Epoch 6 | Batch 424/2891 | Timestep 17770 | LR 0.0001000000 | Loss 34.835201 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:34:51 Epoch 6 | Batch 434/2891 | Timestep 17780 | LR 0.0001000000 | Loss 38.183397 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:34:54 Epoch 6 | Batch 444/2891 | Timestep 17790 | LR 0.0001000000 | Loss 39.743709 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:34:56 Epoch 6 | Batch 454/2891 | Timestep 17800 | LR 0.0001000000 | Loss 34.546098 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:34:58 Epoch 6 | Batch 464/2891 | Timestep 17810 | LR 0.0001000000 | Loss 36.600362 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:35:00 Epoch 6 | Batch 474/2891 | Timestep 17820 | LR 0.0001000000 | Loss 38.301464 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:35:02 Epoch 6 | Batch 484/2891 | Timestep 17830 | LR 0.0001000000 | Loss 38.000310 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:35:04 Epoch 6 | Batch 494/2891 | Timestep 17840 | LR 0.0001000000 | Loss 37.970283 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:35:06 Epoch 6 | Batch 504/2891 | Timestep 17850 | LR 0.0001000000 | Loss 38.038038 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:35:08 Epoch 6 | Batch 514/2891 | Timestep 17860 | LR 0.0001000000 | Loss 38.256862 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:35:10 Epoch 6 | Batch 524/2891 | Timestep 17870 | LR 0.0001000000 | Loss 37.529580 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:35:12 Epoch 6 | Batch 534/2891 | Timestep 17880 | LR 0.0001000000 | Loss 36.699128 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:35:15 Epoch 6 | Batch 544/2891 | Timestep 17890 | LR 0.0001000000 | Loss 37.846636 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:35:17 Epoch 6 | Batch 554/2891 | Timestep 17900 | LR 0.0001000000 | Loss 36.711830 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:35:19 Epoch 6 | Batch 564/2891 | Timestep 17910 | LR 0.0001000000 | Loss 37.643024 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:35:21 Epoch 6 | Batch 574/2891 | Timestep 17920 | LR 0.0001000000 | Loss 37.298362 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:35:23 Epoch 6 | Batch 584/2891 | Timestep 17930 | LR 0.0001000000 | Loss 36.723831 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:35:25 Epoch 6 | Batch 594/2891 | Timestep 17940 | LR 0.0001000000 | Loss 36.171261 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:35:27 Epoch 6 | Batch 604/2891 | Timestep 17950 | LR 0.0001000000 | Loss 37.763852 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:35:29 Epoch 6 | Batch 614/2891 | Timestep 17960 | LR 0.0001000000 | Loss 37.418809 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:35:31 Epoch 6 | Batch 624/2891 | Timestep 17970 | LR 0.0001000000 | Loss 38.151438 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:35:33 Epoch 6 | Batch 634/2891 | Timestep 17980 | LR 0.0001000000 | Loss 38.220099 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:35:35 Epoch 6 | Batch 644/2891 | Timestep 17990 | LR 0.0001000000 | Loss 36.334024 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:35:37 Epoch 6 | Batch 654/2891 | Timestep 18000 | LR 0.0001000000 | Loss 39.121552 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:35:39 Epoch 6 | Batch 664/2891 | Timestep 18010 | LR 0.0001000000 | Loss 36.096042 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:35:41 Epoch 6 | Batch 674/2891 | Timestep 18020 | LR 0.0001000000 | Loss 36.539918 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:35:44 Epoch 6 | Batch 684/2891 | Timestep 18030 | LR 0.0001000000 | Loss 34.530898 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:35:46 Epoch 6 | Batch 694/2891 | Timestep 18040 | LR 0.0001000000 | Loss 37.874165 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:35:48 Epoch 6 | Batch 704/2891 | Timestep 18050 | LR 0.0001000000 | Loss 36.533209 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:35:50 Epoch 6 | Batch 714/2891 | Timestep 18060 | LR 0.0001000000 | Loss 41.220834 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:35:53 Epoch 6 | Batch 724/2891 | Timestep 18070 | LR 0.0001000000 | Loss 35.863465 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:35:55 Epoch 6 | Batch 734/2891 | Timestep 18080 | LR 0.0001000000 | Loss 37.356931 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:35:57 Epoch 6 | Batch 744/2891 | Timestep 18090 | LR 0.0001000000 | Loss 41.360395 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:35:59 Epoch 6 | Batch 754/2891 | Timestep 18100 | LR 0.0001000000 | Loss 39.347298 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:36:01 Epoch 6 | Batch 764/2891 | Timestep 18110 | LR 0.0001000000 | Loss 37.715158 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:36:04 Epoch 6 | Batch 774/2891 | Timestep 18120 | LR 0.0001000000 | Loss 37.929805 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:36:06 Epoch 6 | Batch 784/2891 | Timestep 18130 | LR 0.0001000000 | Loss 37.552981 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:36:08 Epoch 6 | Batch 794/2891 | Timestep 18140 | LR 0.0001000000 | Loss 38.802285 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:36:10 Epoch 6 | Batch 804/2891 | Timestep 18150 | LR 0.0001000000 | Loss 36.539521 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:36:12 Epoch 6 | Batch 814/2891 | Timestep 18160 | LR 0.0001000000 | Loss 36.820060 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:36:14 Epoch 6 | Batch 824/2891 | Timestep 18170 | LR 0.0001000000 | Loss 41.570331 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:36:16 Epoch 6 | Batch 834/2891 | Timestep 18180 | LR 0.0001000000 | Loss 36.583241 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:36:19 Epoch 6 | Batch 844/2891 | Timestep 18190 | LR 0.0001000000 | Loss 37.217979 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:36:21 Epoch 6 | Batch 854/2891 | Timestep 18200 | LR 0.0001000000 | Loss 37.193524 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:36:23 Epoch 6 | Batch 864/2891 | Timestep 18210 | LR 0.0001000000 | Loss 39.316879 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:36:25 Epoch 6 | Batch 874/2891 | Timestep 18220 | LR 0.0001000000 | Loss 34.156444 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:36:27 Epoch 6 | Batch 884/2891 | Timestep 18230 | LR 0.0001000000 | Loss 36.192612 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:36:29 Epoch 6 | Batch 894/2891 | Timestep 18240 | LR 0.0001000000 | Loss 40.882663 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:36:32 Epoch 6 | Batch 904/2891 | Timestep 18250 | LR 0.0001000000 | Loss 38.031904 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:36:34 Epoch 6 | Batch 914/2891 | Timestep 18260 | LR 0.0001000000 | Loss 41.928917 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:36:36 Epoch 6 | Batch 924/2891 | Timestep 18270 | LR 0.0001000000 | Loss 36.341166 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:36:38 Epoch 6 | Batch 934/2891 | Timestep 18280 | LR 0.0001000000 | Loss 37.232321 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:36:40 Epoch 6 | Batch 944/2891 | Timestep 18290 | LR 0.0001000000 | Loss 38.635254 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:36:43 Epoch 6 | Batch 954/2891 | Timestep 18300 | LR 0.0001000000 | Loss 37.633552 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:36:45 Epoch 6 | Batch 964/2891 | Timestep 18310 | LR 0.0001000000 | Loss 36.738183 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:36:47 Epoch 6 | Batch 974/2891 | Timestep 18320 | LR 0.0001000000 | Loss 35.347045 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:36:49 Epoch 6 | Batch 984/2891 | Timestep 18330 | LR 0.0001000000 | Loss 40.023152 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:36:51 Epoch 6 | Batch 994/2891 | Timestep 18340 | LR 0.0001000000 | Loss 37.502686 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:36:53 Epoch 6 | Batch 1004/2891 | Timestep 18350 | LR 0.0001000000 | Loss 36.783632 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:36:56 Epoch 6 | Batch 1014/2891 | Timestep 18360 | LR 0.0001000000 | Loss 36.848050 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:36:58 Epoch 6 | Batch 1024/2891 | Timestep 18370 | LR 0.0001000000 | Loss 40.266170 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:37:00 Epoch 6 | Batch 1034/2891 | Timestep 18380 | LR 0.0001000000 | Loss 35.618975 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:37:02 Epoch 6 | Batch 1044/2891 | Timestep 18390 | LR 0.0001000000 | Loss 37.356561 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:37:04 Epoch 6 | Batch 1054/2891 | Timestep 18400 | LR 0.0001000000 | Loss 38.299572 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:37:06 Epoch 6 | Batch 1064/2891 | Timestep 18410 | LR 0.0001000000 | Loss 37.778728 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:37:08 Epoch 6 | Batch 1074/2891 | Timestep 18420 | LR 0.0001000000 | Loss 37.460398 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:37:11 Epoch 6 | Batch 1084/2891 | Timestep 18430 | LR 0.0001000000 | Loss 35.345199 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:37:13 Epoch 6 | Batch 1094/2891 | Timestep 18440 | LR 0.0001000000 | Loss 40.213508 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:37:15 Epoch 6 | Batch 1104/2891 | Timestep 18450 | LR 0.0001000000 | Loss 43.527693 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:37:18 Epoch 6 | Batch 1114/2891 | Timestep 18460 | LR 0.0001000000 | Loss 39.037424 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:37:20 Epoch 6 | Batch 1124/2891 | Timestep 18470 | LR 0.0001000000 | Loss 38.070154 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:37:22 Epoch 6 | Batch 1134/2891 | Timestep 18480 | LR 0.0001000000 | Loss 37.482714 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:37:24 Epoch 6 | Batch 1144/2891 | Timestep 18490 | LR 0.0001000000 | Loss 38.115650 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:37:27 Epoch 6 | Batch 1154/2891 | Timestep 18500 | LR 0.0001000000 | Loss 37.492995 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:37:29 Epoch 6 | Batch 1164/2891 | Timestep 18510 | LR 0.0001000000 | Loss 38.653587 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:37:31 Epoch 6 | Batch 1174/2891 | Timestep 18520 | LR 0.0001000000 | Loss 36.899517 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:37:33 Epoch 6 | Batch 1184/2891 | Timestep 18530 | LR 0.0001000000 | Loss 37.610269 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:37:35 Epoch 6 | Batch 1194/2891 | Timestep 18540 | LR 0.0001000000 | Loss 38.099152 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:37:37 Epoch 6 | Batch 1204/2891 | Timestep 18550 | LR 0.0001000000 | Loss 37.623780 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:37:40 Epoch 6 | Batch 1214/2891 | Timestep 18560 | LR 0.0001000000 | Loss 37.779921 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:37:42 Epoch 6 | Batch 1224/2891 | Timestep 18570 | LR 0.0001000000 | Loss 37.354731 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:37:44 Epoch 6 | Batch 1234/2891 | Timestep 18580 | LR 0.0001000000 | Loss 36.664301 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:37:46 Epoch 6 | Batch 1244/2891 | Timestep 18590 | LR 0.0001000000 | Loss 38.398027 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:37:49 Epoch 6 | Batch 1254/2891 | Timestep 18600 | LR 0.0001000000 | Loss 37.553428 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:37:51 Epoch 6 | Batch 1264/2891 | Timestep 18610 | LR 0.0001000000 | Loss 37.221051 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:37:53 Epoch 6 | Batch 1274/2891 | Timestep 18620 | LR 0.0001000000 | Loss 38.770980 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:37:55 Epoch 6 | Batch 1284/2891 | Timestep 18630 | LR 0.0001000000 | Loss 37.488067 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:37:57 Epoch 6 | Batch 1294/2891 | Timestep 18640 | LR 0.0001000000 | Loss 38.340935 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:37:59 Epoch 6 | Batch 1304/2891 | Timestep 18650 | LR 0.0001000000 | Loss 37.510435 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:38:01 Epoch 6 | Batch 1314/2891 | Timestep 18660 | LR 0.0001000000 | Loss 37.646876 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:38:03 Epoch 6 | Batch 1324/2891 | Timestep 18670 | LR 0.0001000000 | Loss 37.136076 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:38:05 Epoch 6 | Batch 1334/2891 | Timestep 18680 | LR 0.0001000000 | Loss 37.374042 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:38:07 Epoch 6 | Batch 1344/2891 | Timestep 18690 | LR 0.0001000000 | Loss 37.374704 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:38:09 Epoch 6 | Batch 1354/2891 | Timestep 18700 | LR 0.0001000000 | Loss 37.683764 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:38:12 Epoch 6 | Batch 1364/2891 | Timestep 18710 | LR 0.0001000000 | Loss 38.030370 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:38:13 Epoch 6 | Batch 1374/2891 | Timestep 18720 | LR 0.0001000000 | Loss 36.053488 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:38:15 Epoch 6 | Batch 1384/2891 | Timestep 18730 | LR 0.0001000000 | Loss 38.395444 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:38:18 Epoch 6 | Batch 1394/2891 | Timestep 18740 | LR 0.0001000000 | Loss 37.283030 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:38:20 Epoch 6 | Batch 1404/2891 | Timestep 18750 | LR 0.0001000000 | Loss 36.471594 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:38:22 Epoch 6 | Batch 1414/2891 | Timestep 18760 | LR 0.0001000000 | Loss 36.568237 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:38:24 Epoch 6 | Batch 1424/2891 | Timestep 18770 | LR 0.0001000000 | Loss 35.442532 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:38:27 Epoch 6 | Batch 1434/2891 | Timestep 18780 | LR 0.0001000000 | Loss 38.308342 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:38:30 Epoch 6 | Batch 1444/2891 | Timestep 18790 | LR 0.0001000000 | Loss 41.554373 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:38:32 Epoch 6 | Batch 1454/2891 | Timestep 18800 | LR 0.0001000000 | Loss 37.008416 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:38:34 Epoch 6 | Batch 1464/2891 | Timestep 18810 | LR 0.0001000000 | Loss 38.728329 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:38:36 Epoch 6 | Batch 1474/2891 | Timestep 18820 | LR 0.0001000000 | Loss 37.435488 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:38:38 Epoch 6 | Batch 1484/2891 | Timestep 18830 | LR 0.0001000000 | Loss 37.629816 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:38:40 Epoch 6 | Batch 1494/2891 | Timestep 18840 | LR 0.0001000000 | Loss 37.351754 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:38:42 Epoch 6 | Batch 1504/2891 | Timestep 18850 | LR 0.0001000000 | Loss 37.139409 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:38:45 Epoch 6 | Batch 1514/2891 | Timestep 18860 | LR 0.0001000000 | Loss 37.097826 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:38:47 Epoch 6 | Batch 1524/2891 | Timestep 18870 | LR 0.0001000000 | Loss 36.311314 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:38:49 Epoch 6 | Batch 1534/2891 | Timestep 18880 | LR 0.0001000000 | Loss 36.953301 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:38:51 Epoch 6 | Batch 1544/2891 | Timestep 18890 | LR 0.0001000000 | Loss 38.562294 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:38:54 Epoch 6 | Batch 1554/2891 | Timestep 18900 | LR 0.0001000000 | Loss 40.656555 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:38:56 Epoch 6 | Batch 1564/2891 | Timestep 18910 | LR 0.0001000000 | Loss 40.129542 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:38:58 Epoch 6 | Batch 1574/2891 | Timestep 18920 | LR 0.0001000000 | Loss 39.600600 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:39:00 Epoch 6 | Batch 1584/2891 | Timestep 18930 | LR 0.0001000000 | Loss 38.560058 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:39:02 Epoch 6 | Batch 1594/2891 | Timestep 18940 | LR 0.0001000000 | Loss 39.478448 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:39:04 Epoch 6 | Batch 1604/2891 | Timestep 18950 | LR 0.0001000000 | Loss 37.814101 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:39:07 Epoch 6 | Batch 1614/2891 | Timestep 18960 | LR 0.0001000000 | Loss 38.106281 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:39:10 Epoch 6 | Batch 1624/2891 | Timestep 18970 | LR 0.0001000000 | Loss 38.671853 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:39:12 Epoch 6 | Batch 1634/2891 | Timestep 18980 | LR 0.0001000000 | Loss 36.750311 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:39:14 Epoch 6 | Batch 1644/2891 | Timestep 18990 | LR 0.0001000000 | Loss 41.549185 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:39:16 Epoch 6 | Batch 1654/2891 | Timestep 19000 | LR 0.0001000000 | Loss 38.864906 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:39:18 Epoch 6 | Batch 1664/2891 | Timestep 19010 | LR 0.0001000000 | Loss 37.919162 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:39:20 Epoch 6 | Batch 1674/2891 | Timestep 19020 | LR 0.0001000000 | Loss 36.333602 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:39:22 Epoch 6 | Batch 1684/2891 | Timestep 19030 | LR 0.0001000000 | Loss 38.022474 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:39:24 Epoch 6 | Batch 1694/2891 | Timestep 19040 | LR 0.0001000000 | Loss 37.235686 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:39:27 Epoch 6 | Batch 1704/2891 | Timestep 19050 | LR 0.0001000000 | Loss 38.853760 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:39:29 Epoch 6 | Batch 1714/2891 | Timestep 19060 | LR 0.0001000000 | Loss 38.482339 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:39:32 Epoch 6 | Batch 1724/2891 | Timestep 19070 | LR 0.0001000000 | Loss 37.919755 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:39:34 Epoch 6 | Batch 1734/2891 | Timestep 19080 | LR 0.0001000000 | Loss 37.084585 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:39:36 Epoch 6 | Batch 1744/2891 | Timestep 19090 | LR 0.0001000000 | Loss 36.650842 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:39:39 Epoch 6 | Batch 1754/2891 | Timestep 19100 | LR 0.0001000000 | Loss 37.332568 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:39:41 Epoch 6 | Batch 1764/2891 | Timestep 19110 | LR 0.0001000000 | Loss 37.999720 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:39:43 Epoch 6 | Batch 1774/2891 | Timestep 19120 | LR 0.0001000000 | Loss 39.247958 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:39:45 Epoch 6 | Batch 1784/2891 | Timestep 19130 | LR 0.0001000000 | Loss 37.261308 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:39:47 Epoch 6 | Batch 1794/2891 | Timestep 19140 | LR 0.0001000000 | Loss 38.239072 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:39:49 Epoch 6 | Batch 1804/2891 | Timestep 19150 | LR 0.0001000000 | Loss 38.287218 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:39:51 Epoch 6 | Batch 1814/2891 | Timestep 19160 | LR 0.0001000000 | Loss 36.463503 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:39:54 Epoch 6 | Batch 1824/2891 | Timestep 19170 | LR 0.0001000000 | Loss 37.113918 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:39:56 Epoch 6 | Batch 1834/2891 | Timestep 19180 | LR 0.0001000000 | Loss 37.556047 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:39:58 Epoch 6 | Batch 1844/2891 | Timestep 19190 | LR 0.0001000000 | Loss 34.050040 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:40:01 Epoch 6 | Batch 1854/2891 | Timestep 19200 | LR 0.0001000000 | Loss 33.497771 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:40:03 Epoch 6 | Batch 1864/2891 | Timestep 19210 | LR 0.0001000000 | Loss 35.532314 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:40:06 Epoch 6 | Batch 1874/2891 | Timestep 19220 | LR 0.0001000000 | Loss 38.551549 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:40:08 Epoch 6 | Batch 1884/2891 | Timestep 19230 | LR 0.0001000000 | Loss 38.397987 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:40:10 Epoch 6 | Batch 1894/2891 | Timestep 19240 | LR 0.0001000000 | Loss 37.535752 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:40:12 Epoch 6 | Batch 1904/2891 | Timestep 19250 | LR 0.0001000000 | Loss 37.453608 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:40:14 Epoch 6 | Batch 1914/2891 | Timestep 19260 | LR 0.0001000000 | Loss 37.655991 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:40:16 Epoch 6 | Batch 1924/2891 | Timestep 19270 | LR 0.0001000000 | Loss 36.106614 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:40:18 Epoch 6 | Batch 1934/2891 | Timestep 19280 | LR 0.0001000000 | Loss 37.036044 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:40:20 Epoch 6 | Batch 1944/2891 | Timestep 19290 | LR 0.0001000000 | Loss 37.206294 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:40:22 Epoch 6 | Batch 1954/2891 | Timestep 19300 | LR 0.0001000000 | Loss 36.779147 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:40:25 Epoch 6 | Batch 1964/2891 | Timestep 19310 | LR 0.0001000000 | Loss 42.045569 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:40:27 Epoch 6 | Batch 1974/2891 | Timestep 19320 | LR 0.0001000000 | Loss 35.094888 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:40:29 Epoch 6 | Batch 1984/2891 | Timestep 19330 | LR 0.0001000000 | Loss 37.041973 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:40:31 Epoch 6 | Batch 1994/2891 | Timestep 19340 | LR 0.0001000000 | Loss 37.586546 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:40:33 Epoch 6 | Batch 2004/2891 | Timestep 19350 | LR 0.0001000000 | Loss 37.822638 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:40:35 Epoch 6 | Batch 2014/2891 | Timestep 19360 | LR 0.0001000000 | Loss 37.561179 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:40:37 Epoch 6 | Batch 2024/2891 | Timestep 19370 | LR 0.0001000000 | Loss 37.022911 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:40:40 Epoch 6 | Batch 2034/2891 | Timestep 19380 | LR 0.0001000000 | Loss 38.138143 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:40:42 Epoch 6 | Batch 2044/2891 | Timestep 19390 | LR 0.0001000000 | Loss 37.915795 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:40:45 Epoch 6 | Batch 2054/2891 | Timestep 19400 | LR 0.0001000000 | Loss 39.390918 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:40:47 Epoch 6 | Batch 2064/2891 | Timestep 19410 | LR 0.0001000000 | Loss 38.017641 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:40:49 Epoch 6 | Batch 2074/2891 | Timestep 19420 | LR 0.0001000000 | Loss 37.059922 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:40:51 Epoch 6 | Batch 2084/2891 | Timestep 19430 | LR 0.0001000000 | Loss 37.280264 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:40:53 Epoch 6 | Batch 2094/2891 | Timestep 19440 | LR 0.0001000000 | Loss 37.572784 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:40:55 Epoch 6 | Batch 2104/2891 | Timestep 19450 | LR 0.0001000000 | Loss 37.646974 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:40:58 Epoch 6 | Batch 2114/2891 | Timestep 19460 | LR 0.0001000000 | Loss 36.919161 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:41:00 Epoch 6 | Batch 2124/2891 | Timestep 19470 | LR 0.0001000000 | Loss 35.438118 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:41:02 Epoch 6 | Batch 2134/2891 | Timestep 19480 | LR 0.0001000000 | Loss 38.767613 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:41:04 Epoch 6 | Batch 2144/2891 | Timestep 19490 | LR 0.0001000000 | Loss 37.831840 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:41:07 Epoch 6 | Batch 2154/2891 | Timestep 19500 | LR 0.0001000000 | Loss 37.831252 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:41:09 Epoch 6 | Batch 2164/2891 | Timestep 19510 | LR 0.0001000000 | Loss 36.007519 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:41:11 Epoch 6 | Batch 2174/2891 | Timestep 19520 | LR 0.0001000000 | Loss 39.527531 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:41:13 Epoch 6 | Batch 2184/2891 | Timestep 19530 | LR 0.0001000000 | Loss 38.901061 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:41:16 Epoch 6 | Batch 2194/2891 | Timestep 19540 | LR 0.0001000000 | Loss 37.148104 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:41:18 Epoch 6 | Batch 2204/2891 | Timestep 19550 | LR 0.0001000000 | Loss 40.492533 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:41:20 Epoch 6 | Batch 2214/2891 | Timestep 19560 | LR 0.0001000000 | Loss 38.377840 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:41:22 Epoch 6 | Batch 2224/2891 | Timestep 19570 | LR 0.0001000000 | Loss 37.020082 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:41:24 Epoch 6 | Batch 2234/2891 | Timestep 19580 | LR 0.0001000000 | Loss 36.808487 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:41:26 Epoch 6 | Batch 2244/2891 | Timestep 19590 | LR 0.0001000000 | Loss 37.131445 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:41:28 Epoch 6 | Batch 2254/2891 | Timestep 19600 | LR 0.0001000000 | Loss 38.269833 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:41:31 Epoch 6 | Batch 2264/2891 | Timestep 19610 | LR 0.0001000000 | Loss 37.123092 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:41:33 Epoch 6 | Batch 2274/2891 | Timestep 19620 | LR 0.0001000000 | Loss 37.060167 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:41:35 Epoch 6 | Batch 2284/2891 | Timestep 19630 | LR 0.0001000000 | Loss 39.497844 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:41:37 Epoch 6 | Batch 2294/2891 | Timestep 19640 | LR 0.0001000000 | Loss 37.860256 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:41:39 Epoch 6 | Batch 2304/2891 | Timestep 19650 | LR 0.0001000000 | Loss 36.238832 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:41:41 Epoch 6 | Batch 2314/2891 | Timestep 19660 | LR 0.0001000000 | Loss 38.079064 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:41:43 Epoch 6 | Batch 2324/2891 | Timestep 19670 | LR 0.0001000000 | Loss 38.840581 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:41:45 Epoch 6 | Batch 2334/2891 | Timestep 19680 | LR 0.0001000000 | Loss 36.879406 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:41:48 Epoch 6 | Batch 2344/2891 | Timestep 19690 | LR 0.0001000000 | Loss 35.837189 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:41:50 Epoch 6 | Batch 2354/2891 | Timestep 19700 | LR 0.0001000000 | Loss 38.804644 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:41:52 Epoch 6 | Batch 2364/2891 | Timestep 19710 | LR 0.0001000000 | Loss 38.596439 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:41:54 Epoch 6 | Batch 2374/2891 | Timestep 19720 | LR 0.0001000000 | Loss 40.333166 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:41:56 Epoch 6 | Batch 2384/2891 | Timestep 19730 | LR 0.0001000000 | Loss 39.656406 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:41:58 Epoch 6 | Batch 2394/2891 | Timestep 19740 | LR 0.0001000000 | Loss 38.184455 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:42:00 Epoch 6 | Batch 2404/2891 | Timestep 19750 | LR 0.0001000000 | Loss 36.505633 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:42:03 Epoch 6 | Batch 2414/2891 | Timestep 19760 | LR 0.0001000000 | Loss 38.120733 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:42:05 Epoch 6 | Batch 2424/2891 | Timestep 19770 | LR 0.0001000000 | Loss 34.338005 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:42:08 Epoch 6 | Batch 2434/2891 | Timestep 19780 | LR 0.0001000000 | Loss 34.073419 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:42:10 Epoch 6 | Batch 2444/2891 | Timestep 19790 | LR 0.0001000000 | Loss 36.619334 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:42:12 Epoch 6 | Batch 2454/2891 | Timestep 19800 | LR 0.0001000000 | Loss 32.325701 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:42:15 Epoch 6 | Batch 2464/2891 | Timestep 19810 | LR 0.0001000000 | Loss 39.054965 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:42:17 Epoch 6 | Batch 2474/2891 | Timestep 19820 | LR 0.0001000000 | Loss 38.968044 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:42:19 Epoch 6 | Batch 2484/2891 | Timestep 19830 | LR 0.0001000000 | Loss 40.219015 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:42:21 Epoch 6 | Batch 2494/2891 | Timestep 19840 | LR 0.0001000000 | Loss 36.857283 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:42:23 Epoch 6 | Batch 2504/2891 | Timestep 19850 | LR 0.0001000000 | Loss 37.083416 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:42:25 Epoch 6 | Batch 2514/2891 | Timestep 19860 | LR 0.0001000000 | Loss 40.106178 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:42:28 Epoch 6 | Batch 2524/2891 | Timestep 19870 | LR 0.0001000000 | Loss 39.965789 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:42:30 Epoch 6 | Batch 2534/2891 | Timestep 19880 | LR 0.0001000000 | Loss 37.358012 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:42:33 Epoch 6 | Batch 2544/2891 | Timestep 19890 | LR 0.0001000000 | Loss 35.744466 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:42:35 Epoch 6 | Batch 2554/2891 | Timestep 19900 | LR 0.0001000000 | Loss 39.597808 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:42:37 Epoch 6 | Batch 2564/2891 | Timestep 19910 | LR 0.0001000000 | Loss 41.864187 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:42:39 Epoch 6 | Batch 2574/2891 | Timestep 19920 | LR 0.0001000000 | Loss 40.042570 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:42:42 Epoch 6 | Batch 2584/2891 | Timestep 19930 | LR 0.0001000000 | Loss 36.565426 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:42:44 Epoch 6 | Batch 2594/2891 | Timestep 19940 | LR 0.0001000000 | Loss 35.161425 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:42:46 Epoch 6 | Batch 2604/2891 | Timestep 19950 | LR 0.0001000000 | Loss 35.402017 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:42:48 Epoch 6 | Batch 2614/2891 | Timestep 19960 | LR 0.0001000000 | Loss 37.716353 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:42:50 Epoch 6 | Batch 2624/2891 | Timestep 19970 | LR 0.0001000000 | Loss 37.852061 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:42:52 Epoch 6 | Batch 2634/2891 | Timestep 19980 | LR 0.0001000000 | Loss 37.671261 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:42:55 Epoch 6 | Batch 2644/2891 | Timestep 19990 | LR 0.0001000000 | Loss 35.835885 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:42:57 Epoch 6 | Batch 2654/2891 | Timestep 20000 | LR 0.0001000000 | Loss 36.884405 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:42:59 Epoch 6 | Batch 2664/2891 | Timestep 20010 | LR 0.0001000000 | Loss 38.483462 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:43:01 Epoch 6 | Batch 2674/2891 | Timestep 20020 | LR 0.0001000000 | Loss 38.543648 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:43:03 Epoch 6 | Batch 2684/2891 | Timestep 20030 | LR 0.0001000000 | Loss 38.316262 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:43:06 Epoch 6 | Batch 2694/2891 | Timestep 20040 | LR 0.0001000000 | Loss 37.879231 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:43:08 Epoch 6 | Batch 2704/2891 | Timestep 20050 | LR 0.0001000000 | Loss 37.020305 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:43:10 Epoch 6 | Batch 2714/2891 | Timestep 20060 | LR 0.0001000000 | Loss 36.169742 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:43:12 Epoch 6 | Batch 2724/2891 | Timestep 20070 | LR 0.0001000000 | Loss 37.619477 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:43:14 Epoch 6 | Batch 2734/2891 | Timestep 20080 | LR 0.0001000000 | Loss 37.951247 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:43:16 Epoch 6 | Batch 2744/2891 | Timestep 20090 | LR 0.0001000000 | Loss 36.757836 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:43:19 Epoch 6 | Batch 2754/2891 | Timestep 20100 | LR 0.0001000000 | Loss 37.344680 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:43:21 Epoch 6 | Batch 2764/2891 | Timestep 20110 | LR 0.0001000000 | Loss 34.171240 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:43:23 Epoch 6 | Batch 2774/2891 | Timestep 20120 | LR 0.0001000000 | Loss 37.003683 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:43:25 Epoch 6 | Batch 2784/2891 | Timestep 20130 | LR 0.0001000000 | Loss 36.154422 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:43:27 Epoch 6 | Batch 2794/2891 | Timestep 20140 | LR 0.0001000000 | Loss 36.602086 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:43:29 Epoch 6 | Batch 2804/2891 | Timestep 20150 | LR 0.0001000000 | Loss 32.407158 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:43:32 Epoch 6 | Batch 2814/2891 | Timestep 20160 | LR 0.0001000000 | Loss 35.440410 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:43:34 Epoch 6 | Batch 2824/2891 | Timestep 20170 | LR 0.0001000000 | Loss 43.928731 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:43:36 Epoch 6 | Batch 2834/2891 | Timestep 20180 | LR 0.0001000000 | Loss 38.669984 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:43:39 Epoch 6 | Batch 2844/2891 | Timestep 20190 | LR 0.0001000000 | Loss 38.104191 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:43:41 Epoch 6 | Batch 2854/2891 | Timestep 20200 | LR 0.0001000000 | Loss 38.046943 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:43:43 Epoch 6 | Batch 2864/2891 | Timestep 20210 | LR 0.0001000000 | Loss 37.516366 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:43:46 Epoch 6 | Batch 2874/2891 | Timestep 20220 | LR 0.0001000000 | Loss 37.232030 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:43:48 Epoch 6 | Batch 2884/2891 | Timestep 20230 | LR 0.0001000000 | Loss 37.095488 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:43:49 ** Evaluating on validation dataset ** +INFO root Tue, 26 Mar 2024 19:45:32 + precision recall f1-score support + + BOUNDARY 0.0000 0.0000 0.0000 4 + BUILDING-OR-GROUNDS 0.0000 0.0000 0.0000 104 + CAMP 0.0000 0.0000 0.0000 71 + CARDINAL 0.0000 0.0000 0.0000 170 + CLUSTER 0.0000 0.0000 0.0000 26 + COM 0.0000 0.0000 0.0000 39 + CONTINENT 0.0000 0.0000 0.0000 23 + COUNTRY 0.0000 0.0000 0.0000 835 + CURR 0.0000 0.0000 0.0000 24 + DATE 0.0000 0.0000 0.0000 1691 + EDU 0.0000 0.0000 0.0000 109 + ENT 0.0000 0.0000 0.0000 1 + EVENT 0.0000 0.0000 0.0000 292 + FAC 0.0000 0.0000 0.0000 111 + GOV 0.0000 0.0000 0.0000 860 + GPE 0.0000 0.0000 0.0000 2261 + GPE_ORG 0.0000 0.0000 0.0000 167 + LAND-REGION-NATURAL 0.0000 0.0000 0.0000 52 + LANGUAGE 0.0000 0.0000 0.0000 16 + LAW 0.0000 0.0000 0.0000 47 + LOC 0.0000 0.0000 0.0000 127 + MED 0.0000 0.0000 0.0000 419 + MONEY 0.0000 0.0000 0.0000 22 + NEIGHBORHOOD 0.0000 0.0000 0.0000 5 + NONGOV 0.0000 0.0000 0.0000 571 + NORP 0.0000 0.0000 0.0000 551 + OCC 0.0000 0.0000 0.0000 522 + ORDINAL 0.0000 0.0000 0.0000 544 + ORG 0.0000 0.0000 0.0000 1790 + ORG_FAC 0.0000 0.0000 0.0000 7 + PATH 0.0000 0.0000 0.0000 6 + PERCENT 0.0000 0.0000 0.0000 12 + PERS 0.0000 0.0000 0.0000 679 + PRODUCT 0.0000 0.0000 0.0000 8 + QUANTITY 0.0000 0.0000 0.0000 3 + REGION-GENERAL 0.0000 0.0000 0.0000 37 +REGION-INTERNATIONAL 0.0000 0.0000 0.0000 12 + REL 0.0000 0.0000 0.0000 10 + SCI 0.0000 0.0000 0.0000 13 + SPO 0.0000 0.0000 0.0000 2 + SPORT 0.0000 0.0000 0.0000 4 + STATE-OR-PROVINCE 0.0000 0.0000 0.0000 179 + SUBAREA-FACILITY 0.0000 0.0000 0.0000 16 + TIME 0.0000 0.0000 0.0000 33 + TOWN 0.0000 0.0000 0.0000 1217 + UNIT 0.0000 0.0000 0.0000 4 + WATER-BODY 0.0000 0.0000 0.0000 14 + WEBSITE 0.0000 0.0000 0.0000 80 + pad> 0.0000 0.0000 0.0000 0 + + micro avg 0.0000 0.0000 0.0000 13790 + macro avg 0.0000 0.0000 0.0000 13790 + weighted avg 0.0000 0.0000 0.0000 13790 + +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:46:37 Epoch 6 | Timestep 20237 | Train Loss 37.478293 | Val Loss 42.590721 | F1 0.000000 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:46:37 Epoch 7 | Batch 3/2891 | Timestep 20240 | LR 0.0001000000 | Loss 36.630976 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:46:39 Epoch 7 | Batch 13/2891 | Timestep 20250 | LR 0.0001000000 | Loss 39.653764 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:46:41 Epoch 7 | Batch 23/2891 | Timestep 20260 | LR 0.0001000000 | Loss 35.603994 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:46:43 Epoch 7 | Batch 33/2891 | Timestep 20270 | LR 0.0001000000 | Loss 37.746612 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:46:45 Epoch 7 | Batch 43/2891 | Timestep 20280 | LR 0.0001000000 | Loss 38.458881 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:46:47 Epoch 7 | Batch 53/2891 | Timestep 20290 | LR 0.0001000000 | Loss 38.728509 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:46:50 Epoch 7 | Batch 63/2891 | Timestep 20300 | LR 0.0001000000 | Loss 37.194866 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:46:52 Epoch 7 | Batch 73/2891 | Timestep 20310 | LR 0.0001000000 | Loss 38.372466 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:46:54 Epoch 7 | Batch 83/2891 | Timestep 20320 | LR 0.0001000000 | Loss 36.767022 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:46:56 Epoch 7 | Batch 93/2891 | Timestep 20330 | LR 0.0001000000 | Loss 39.079808 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:46:58 Epoch 7 | Batch 103/2891 | Timestep 20340 | LR 0.0001000000 | Loss 37.502512 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:47:01 Epoch 7 | Batch 113/2891 | Timestep 20350 | LR 0.0001000000 | Loss 37.237657 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:47:03 Epoch 7 | Batch 123/2891 | Timestep 20360 | LR 0.0001000000 | Loss 39.997766 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:47:05 Epoch 7 | Batch 133/2891 | Timestep 20370 | LR 0.0001000000 | Loss 38.527900 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:47:07 Epoch 7 | Batch 143/2891 | Timestep 20380 | LR 0.0001000000 | Loss 36.439951 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:47:10 Epoch 7 | Batch 153/2891 | Timestep 20390 | LR 0.0001000000 | Loss 37.705430 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:47:12 Epoch 7 | Batch 163/2891 | Timestep 20400 | LR 0.0001000000 | Loss 37.625357 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:47:14 Epoch 7 | Batch 173/2891 | Timestep 20410 | LR 0.0001000000 | Loss 39.055345 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:47:16 Epoch 7 | Batch 183/2891 | Timestep 20420 | LR 0.0001000000 | Loss 37.485892 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:47:18 Epoch 7 | Batch 193/2891 | Timestep 20430 | LR 0.0001000000 | Loss 37.211848 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:47:20 Epoch 7 | Batch 203/2891 | Timestep 20440 | LR 0.0001000000 | Loss 37.785513 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:47:22 Epoch 7 | Batch 213/2891 | Timestep 20450 | LR 0.0001000000 | Loss 37.211820 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:47:24 Epoch 7 | Batch 223/2891 | Timestep 20460 | LR 0.0001000000 | Loss 38.111572 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:47:26 Epoch 7 | Batch 233/2891 | Timestep 20470 | LR 0.0001000000 | Loss 37.113739 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:47:28 Epoch 7 | Batch 243/2891 | Timestep 20480 | LR 0.0001000000 | Loss 36.648857 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:47:30 Epoch 7 | Batch 253/2891 | Timestep 20490 | LR 0.0001000000 | Loss 37.710353 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:47:32 Epoch 7 | Batch 263/2891 | Timestep 20500 | LR 0.0001000000 | Loss 38.041164 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:47:35 Epoch 7 | Batch 273/2891 | Timestep 20510 | LR 0.0001000000 | Loss 37.207755 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:47:37 Epoch 7 | Batch 283/2891 | Timestep 20520 | LR 0.0001000000 | Loss 39.050490 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:47:39 Epoch 7 | Batch 293/2891 | Timestep 20530 | LR 0.0001000000 | Loss 36.073692 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:47:41 Epoch 7 | Batch 303/2891 | Timestep 20540 | LR 0.0001000000 | Loss 38.473152 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:47:44 Epoch 7 | Batch 313/2891 | Timestep 20550 | LR 0.0001000000 | Loss 38.140669 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:47:46 Epoch 7 | Batch 323/2891 | Timestep 20560 | LR 0.0001000000 | Loss 37.409262 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:47:48 Epoch 7 | Batch 333/2891 | Timestep 20570 | LR 0.0001000000 | Loss 36.870672 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:47:50 Epoch 7 | Batch 343/2891 | Timestep 20580 | LR 0.0001000000 | Loss 39.340369 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:47:52 Epoch 7 | Batch 353/2891 | Timestep 20590 | LR 0.0001000000 | Loss 37.902641 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:47:54 Epoch 7 | Batch 363/2891 | Timestep 20600 | LR 0.0001000000 | Loss 36.741589 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:47:56 Epoch 7 | Batch 373/2891 | Timestep 20610 | LR 0.0001000000 | Loss 38.185939 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:47:58 Epoch 7 | Batch 383/2891 | Timestep 20620 | LR 0.0001000000 | Loss 37.559626 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:48:00 Epoch 7 | Batch 393/2891 | Timestep 20630 | LR 0.0001000000 | Loss 37.187382 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:48:03 Epoch 7 | Batch 403/2891 | Timestep 20640 | LR 0.0001000000 | Loss 37.112134 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:48:05 Epoch 7 | Batch 413/2891 | Timestep 20650 | LR 0.0001000000 | Loss 35.158457 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:48:07 Epoch 7 | Batch 423/2891 | Timestep 20660 | LR 0.0001000000 | Loss 37.566185 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:48:09 Epoch 7 | Batch 433/2891 | Timestep 20670 | LR 0.0001000000 | Loss 37.931571 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:48:11 Epoch 7 | Batch 443/2891 | Timestep 20680 | LR 0.0001000000 | Loss 37.690236 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:48:13 Epoch 7 | Batch 453/2891 | Timestep 20690 | LR 0.0001000000 | Loss 37.834867 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:48:15 Epoch 7 | Batch 463/2891 | Timestep 20700 | LR 0.0001000000 | Loss 38.284069 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:48:18 Epoch 7 | Batch 473/2891 | Timestep 20710 | LR 0.0001000000 | Loss 36.443138 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:48:20 Epoch 7 | Batch 483/2891 | Timestep 20720 | LR 0.0001000000 | Loss 39.046646 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:48:23 Epoch 7 | Batch 493/2891 | Timestep 20730 | LR 0.0001000000 | Loss 38.112414 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:48:25 Epoch 7 | Batch 503/2891 | Timestep 20740 | LR 0.0001000000 | Loss 37.414652 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:48:27 Epoch 7 | Batch 513/2891 | Timestep 20750 | LR 0.0001000000 | Loss 39.529693 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:48:29 Epoch 7 | Batch 523/2891 | Timestep 20760 | LR 0.0001000000 | Loss 36.502671 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:48:31 Epoch 7 | Batch 533/2891 | Timestep 20770 | LR 0.0001000000 | Loss 38.060710 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:48:33 Epoch 7 | Batch 543/2891 | Timestep 20780 | LR 0.0001000000 | Loss 38.557317 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:48:36 Epoch 7 | Batch 553/2891 | Timestep 20790 | LR 0.0001000000 | Loss 41.680180 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:48:39 Epoch 7 | Batch 563/2891 | Timestep 20800 | LR 0.0001000000 | Loss 39.049877 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:48:41 Epoch 7 | Batch 573/2891 | Timestep 20810 | LR 0.0001000000 | Loss 35.606600 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:48:43 Epoch 7 | Batch 583/2891 | Timestep 20820 | LR 0.0001000000 | Loss 35.165760 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:48:45 Epoch 7 | Batch 593/2891 | Timestep 20830 | LR 0.0001000000 | Loss 37.639782 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:48:48 Epoch 7 | Batch 603/2891 | Timestep 20840 | LR 0.0001000000 | Loss 38.668698 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:48:50 Epoch 7 | Batch 613/2891 | Timestep 20850 | LR 0.0001000000 | Loss 36.904853 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:48:52 Epoch 7 | Batch 623/2891 | Timestep 20860 | LR 0.0001000000 | Loss 37.883500 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:48:54 Epoch 7 | Batch 633/2891 | Timestep 20870 | LR 0.0001000000 | Loss 35.665226 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:48:56 Epoch 7 | Batch 643/2891 | Timestep 20880 | LR 0.0001000000 | Loss 44.139799 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:48:58 Epoch 7 | Batch 653/2891 | Timestep 20890 | LR 0.0001000000 | Loss 36.424230 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:49:01 Epoch 7 | Batch 663/2891 | Timestep 20900 | LR 0.0001000000 | Loss 39.108266 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:49:03 Epoch 7 | Batch 673/2891 | Timestep 20910 | LR 0.0001000000 | Loss 37.766836 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:49:05 Epoch 7 | Batch 683/2891 | Timestep 20920 | LR 0.0001000000 | Loss 36.369664 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:49:08 Epoch 7 | Batch 693/2891 | Timestep 20930 | LR 0.0001000000 | Loss 34.882823 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:49:10 Epoch 7 | Batch 703/2891 | Timestep 20940 | LR 0.0001000000 | Loss 37.399360 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:49:12 Epoch 7 | Batch 713/2891 | Timestep 20950 | LR 0.0001000000 | Loss 34.915963 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:49:14 Epoch 7 | Batch 723/2891 | Timestep 20960 | LR 0.0001000000 | Loss 37.737954 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:49:16 Epoch 7 | Batch 733/2891 | Timestep 20970 | LR 0.0001000000 | Loss 37.871787 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:49:19 Epoch 7 | Batch 743/2891 | Timestep 20980 | LR 0.0001000000 | Loss 35.796193 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:49:21 Epoch 7 | Batch 753/2891 | Timestep 20990 | LR 0.0001000000 | Loss 39.849981 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:49:23 Epoch 7 | Batch 763/2891 | Timestep 21000 | LR 0.0001000000 | Loss 37.708138 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:49:25 Epoch 7 | Batch 773/2891 | Timestep 21010 | LR 0.0001000000 | Loss 35.514800 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:49:27 Epoch 7 | Batch 783/2891 | Timestep 21020 | LR 0.0001000000 | Loss 35.551183 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:49:30 Epoch 7 | Batch 793/2891 | Timestep 21030 | LR 0.0001000000 | Loss 40.050653 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:49:32 Epoch 7 | Batch 803/2891 | Timestep 21040 | LR 0.0001000000 | Loss 41.762442 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:49:35 Epoch 7 | Batch 813/2891 | Timestep 21050 | LR 0.0001000000 | Loss 37.072897 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:49:37 Epoch 7 | Batch 823/2891 | Timestep 21060 | LR 0.0001000000 | Loss 32.268342 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:49:39 Epoch 7 | Batch 833/2891 | Timestep 21070 | LR 0.0001000000 | Loss 34.496357 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:49:41 Epoch 7 | Batch 843/2891 | Timestep 21080 | LR 0.0001000000 | Loss 37.419889 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:49:43 Epoch 7 | Batch 853/2891 | Timestep 21090 | LR 0.0001000000 | Loss 38.205950 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:49:45 Epoch 7 | Batch 863/2891 | Timestep 21100 | LR 0.0001000000 | Loss 37.442659 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:49:48 Epoch 7 | Batch 873/2891 | Timestep 21110 | LR 0.0001000000 | Loss 37.689337 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:49:50 Epoch 7 | Batch 883/2891 | Timestep 21120 | LR 0.0001000000 | Loss 37.447789 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:49:52 Epoch 7 | Batch 893/2891 | Timestep 21130 | LR 0.0001000000 | Loss 39.069839 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:49:55 Epoch 7 | Batch 903/2891 | Timestep 21140 | LR 0.0001000000 | Loss 34.781929 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:49:58 Epoch 7 | Batch 913/2891 | Timestep 21150 | LR 0.0001000000 | Loss 34.778922 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:50:00 Epoch 7 | Batch 923/2891 | Timestep 21160 | LR 0.0001000000 | Loss 36.508440 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:50:02 Epoch 7 | Batch 933/2891 | Timestep 21170 | LR 0.0001000000 | Loss 35.138201 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:50:04 Epoch 7 | Batch 943/2891 | Timestep 21180 | LR 0.0001000000 | Loss 39.413771 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:50:06 Epoch 7 | Batch 953/2891 | Timestep 21190 | LR 0.0001000000 | Loss 37.047428 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:50:08 Epoch 7 | Batch 963/2891 | Timestep 21200 | LR 0.0001000000 | Loss 36.401983 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:50:11 Epoch 7 | Batch 973/2891 | Timestep 21210 | LR 0.0001000000 | Loss 36.072828 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:50:13 Epoch 7 | Batch 983/2891 | Timestep 21220 | LR 0.0001000000 | Loss 32.190755 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:50:15 Epoch 7 | Batch 993/2891 | Timestep 21230 | LR 0.0001000000 | Loss 32.367462 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:50:18 Epoch 7 | Batch 1003/2891 | Timestep 21240 | LR 0.0001000000 | Loss 33.109541 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:50:20 Epoch 7 | Batch 1013/2891 | Timestep 21250 | LR 0.0001000000 | Loss 36.225643 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:50:22 Epoch 7 | Batch 1023/2891 | Timestep 21260 | LR 0.0001000000 | Loss 35.985852 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:50:24 Epoch 7 | Batch 1033/2891 | Timestep 21270 | LR 0.0001000000 | Loss 41.182365 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:50:26 Epoch 7 | Batch 1043/2891 | Timestep 21280 | LR 0.0001000000 | Loss 36.917954 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:50:28 Epoch 7 | Batch 1053/2891 | Timestep 21290 | LR 0.0001000000 | Loss 36.227866 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:50:30 Epoch 7 | Batch 1063/2891 | Timestep 21300 | LR 0.0001000000 | Loss 35.476550 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:50:33 Epoch 7 | Batch 1073/2891 | Timestep 21310 | LR 0.0001000000 | Loss 38.065232 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:50:35 Epoch 7 | Batch 1083/2891 | Timestep 21320 | LR 0.0001000000 | Loss 38.246410 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:50:37 Epoch 7 | Batch 1093/2891 | Timestep 21330 | LR 0.0001000000 | Loss 37.892958 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:50:39 Epoch 7 | Batch 1103/2891 | Timestep 21340 | LR 0.0001000000 | Loss 38.551200 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:50:41 Epoch 7 | Batch 1113/2891 | Timestep 21350 | LR 0.0001000000 | Loss 36.375032 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:50:43 Epoch 7 | Batch 1123/2891 | Timestep 21360 | LR 0.0001000000 | Loss 37.626283 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:50:46 Epoch 7 | Batch 1133/2891 | Timestep 21370 | LR 0.0001000000 | Loss 38.963906 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:50:48 Epoch 7 | Batch 1143/2891 | Timestep 21380 | LR 0.0001000000 | Loss 40.706147 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:50:50 Epoch 7 | Batch 1153/2891 | Timestep 21390 | LR 0.0001000000 | Loss 38.904058 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:50:53 Epoch 7 | Batch 1163/2891 | Timestep 21400 | LR 0.0001000000 | Loss 36.321766 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:50:55 Epoch 7 | Batch 1173/2891 | Timestep 21410 | LR 0.0001000000 | Loss 35.007907 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:50:57 Epoch 7 | Batch 1183/2891 | Timestep 21420 | LR 0.0001000000 | Loss 41.196029 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:51:00 Epoch 7 | Batch 1193/2891 | Timestep 21430 | LR 0.0001000000 | Loss 39.106744 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:51:02 Epoch 7 | Batch 1203/2891 | Timestep 21440 | LR 0.0001000000 | Loss 34.557795 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:51:04 Epoch 7 | Batch 1213/2891 | Timestep 21450 | LR 0.0001000000 | Loss 38.272715 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:51:06 Epoch 7 | Batch 1223/2891 | Timestep 21460 | LR 0.0001000000 | Loss 36.336079 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:51:08 Epoch 7 | Batch 1233/2891 | Timestep 21470 | LR 0.0001000000 | Loss 36.143831 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:51:10 Epoch 7 | Batch 1243/2891 | Timestep 21480 | LR 0.0001000000 | Loss 37.373163 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:51:12 Epoch 7 | Batch 1253/2891 | Timestep 21490 | LR 0.0001000000 | Loss 35.057170 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:51:15 Epoch 7 | Batch 1263/2891 | Timestep 21500 | LR 0.0001000000 | Loss 35.571953 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:51:17 Epoch 7 | Batch 1273/2891 | Timestep 21510 | LR 0.0001000000 | Loss 37.139669 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:51:19 Epoch 7 | Batch 1283/2891 | Timestep 21520 | LR 0.0001000000 | Loss 35.380343 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:51:21 Epoch 7 | Batch 1293/2891 | Timestep 21530 | LR 0.0001000000 | Loss 39.100175 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:51:24 Epoch 7 | Batch 1303/2891 | Timestep 21540 | LR 0.0001000000 | Loss 38.383919 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:51:26 Epoch 7 | Batch 1313/2891 | Timestep 21550 | LR 0.0001000000 | Loss 39.417162 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:51:28 Epoch 7 | Batch 1323/2891 | Timestep 21560 | LR 0.0001000000 | Loss 37.526734 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:51:30 Epoch 7 | Batch 1333/2891 | Timestep 21570 | LR 0.0001000000 | Loss 37.438581 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:51:32 Epoch 7 | Batch 1343/2891 | Timestep 21580 | LR 0.0001000000 | Loss 37.588540 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:51:34 Epoch 7 | Batch 1353/2891 | Timestep 21590 | LR 0.0001000000 | Loss 37.967233 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:51:36 Epoch 7 | Batch 1363/2891 | Timestep 21600 | LR 0.0001000000 | Loss 37.933829 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:51:38 Epoch 7 | Batch 1373/2891 | Timestep 21610 | LR 0.0001000000 | Loss 38.079043 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:51:40 Epoch 7 | Batch 1383/2891 | Timestep 21620 | LR 0.0001000000 | Loss 38.099804 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:51:42 Epoch 7 | Batch 1393/2891 | Timestep 21630 | LR 0.0001000000 | Loss 37.952987 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:51:45 Epoch 7 | Batch 1403/2891 | Timestep 21640 | LR 0.0001000000 | Loss 36.843232 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:51:47 Epoch 7 | Batch 1413/2891 | Timestep 21650 | LR 0.0001000000 | Loss 36.949756 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:51:49 Epoch 7 | Batch 1423/2891 | Timestep 21660 | LR 0.0001000000 | Loss 38.257157 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:51:51 Epoch 7 | Batch 1433/2891 | Timestep 21670 | LR 0.0001000000 | Loss 35.458081 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:51:53 Epoch 7 | Batch 1443/2891 | Timestep 21680 | LR 0.0001000000 | Loss 36.439528 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:51:56 Epoch 7 | Batch 1453/2891 | Timestep 21690 | LR 0.0001000000 | Loss 37.917892 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:51:58 Epoch 7 | Batch 1463/2891 | Timestep 21700 | LR 0.0001000000 | Loss 35.376247 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:52:01 Epoch 7 | Batch 1473/2891 | Timestep 21710 | LR 0.0001000000 | Loss 36.776788 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:52:03 Epoch 7 | Batch 1483/2891 | Timestep 21720 | LR 0.0001000000 | Loss 35.163869 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:52:05 Epoch 7 | Batch 1493/2891 | Timestep 21730 | LR 0.0001000000 | Loss 37.034140 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:52:07 Epoch 7 | Batch 1503/2891 | Timestep 21740 | LR 0.0001000000 | Loss 37.793321 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:52:09 Epoch 7 | Batch 1513/2891 | Timestep 21750 | LR 0.0001000000 | Loss 36.990348 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:52:11 Epoch 7 | Batch 1523/2891 | Timestep 21760 | LR 0.0001000000 | Loss 38.315492 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:52:14 Epoch 7 | Batch 1533/2891 | Timestep 21770 | LR 0.0001000000 | Loss 37.950768 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:52:16 Epoch 7 | Batch 1543/2891 | Timestep 21780 | LR 0.0001000000 | Loss 39.213930 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:52:18 Epoch 7 | Batch 1553/2891 | Timestep 21790 | LR 0.0001000000 | Loss 36.810418 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:52:20 Epoch 7 | Batch 1563/2891 | Timestep 21800 | LR 0.0001000000 | Loss 38.107446 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:52:22 Epoch 7 | Batch 1573/2891 | Timestep 21810 | LR 0.0001000000 | Loss 38.732058 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:52:24 Epoch 7 | Batch 1583/2891 | Timestep 21820 | LR 0.0001000000 | Loss 36.801679 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:52:27 Epoch 7 | Batch 1593/2891 | Timestep 21830 | LR 0.0001000000 | Loss 36.495175 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:52:30 Epoch 7 | Batch 1603/2891 | Timestep 21840 | LR 0.0001000000 | Loss 36.995078 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:52:32 Epoch 7 | Batch 1613/2891 | Timestep 21850 | LR 0.0001000000 | Loss 37.013392 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:52:34 Epoch 7 | Batch 1623/2891 | Timestep 21860 | LR 0.0001000000 | Loss 36.124615 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:52:36 Epoch 7 | Batch 1633/2891 | Timestep 21870 | LR 0.0001000000 | Loss 37.754942 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:52:38 Epoch 7 | Batch 1643/2891 | Timestep 21880 | LR 0.0001000000 | Loss 35.115342 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:52:41 Epoch 7 | Batch 1653/2891 | Timestep 21890 | LR 0.0001000000 | Loss 37.303134 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:52:43 Epoch 7 | Batch 1663/2891 | Timestep 21900 | LR 0.0001000000 | Loss 36.057311 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:52:45 Epoch 7 | Batch 1673/2891 | Timestep 21910 | LR 0.0001000000 | Loss 44.487395 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:52:48 Epoch 7 | Batch 1683/2891 | Timestep 21920 | LR 0.0001000000 | Loss 39.642867 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:52:50 Epoch 7 | Batch 1693/2891 | Timestep 21930 | LR 0.0001000000 | Loss 31.475837 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:52:52 Epoch 7 | Batch 1703/2891 | Timestep 21940 | LR 0.0001000000 | Loss 41.648404 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:52:55 Epoch 7 | Batch 1713/2891 | Timestep 21950 | LR 0.0001000000 | Loss 45.373634 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:52:57 Epoch 7 | Batch 1723/2891 | Timestep 21960 | LR 0.0001000000 | Loss 38.808108 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:52:59 Epoch 7 | Batch 1733/2891 | Timestep 21970 | LR 0.0001000000 | Loss 39.639908 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:53:02 Epoch 7 | Batch 1743/2891 | Timestep 21980 | LR 0.0001000000 | Loss 36.175269 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:53:04 Epoch 7 | Batch 1753/2891 | Timestep 21990 | LR 0.0001000000 | Loss 36.411561 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:53:06 Epoch 7 | Batch 1763/2891 | Timestep 22000 | LR 0.0001000000 | Loss 37.692495 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:53:08 Epoch 7 | Batch 1773/2891 | Timestep 22010 | LR 0.0001000000 | Loss 38.194548 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:53:10 Epoch 7 | Batch 1783/2891 | Timestep 22020 | LR 0.0001000000 | Loss 37.934298 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:53:12 Epoch 7 | Batch 1793/2891 | Timestep 22030 | LR 0.0001000000 | Loss 37.850072 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:53:15 Epoch 7 | Batch 1803/2891 | Timestep 22040 | LR 0.0001000000 | Loss 38.083947 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:53:17 Epoch 7 | Batch 1813/2891 | Timestep 22050 | LR 0.0001000000 | Loss 39.834219 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:53:19 Epoch 7 | Batch 1823/2891 | Timestep 22060 | LR 0.0001000000 | Loss 38.586106 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:53:21 Epoch 7 | Batch 1833/2891 | Timestep 22070 | LR 0.0001000000 | Loss 37.643949 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:53:24 Epoch 7 | Batch 1843/2891 | Timestep 22080 | LR 0.0001000000 | Loss 37.366817 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:53:26 Epoch 7 | Batch 1853/2891 | Timestep 22090 | LR 0.0001000000 | Loss 35.396723 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:53:28 Epoch 7 | Batch 1863/2891 | Timestep 22100 | LR 0.0001000000 | Loss 33.410872 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:53:31 Epoch 7 | Batch 1873/2891 | Timestep 22110 | LR 0.0001000000 | Loss 37.487453 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:53:33 Epoch 7 | Batch 1883/2891 | Timestep 22120 | LR 0.0001000000 | Loss 35.178070 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:53:35 Epoch 7 | Batch 1893/2891 | Timestep 22130 | LR 0.0001000000 | Loss 38.907076 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:53:37 Epoch 7 | Batch 1903/2891 | Timestep 22140 | LR 0.0001000000 | Loss 38.152163 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:53:38 Epoch 7 | Batch 1913/2891 | Timestep 22150 | LR 0.0001000000 | Loss 37.746742 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:53:40 Epoch 7 | Batch 1923/2891 | Timestep 22160 | LR 0.0001000000 | Loss 37.354189 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:53:43 Epoch 7 | Batch 1933/2891 | Timestep 22170 | LR 0.0001000000 | Loss 37.254224 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:53:45 Epoch 7 | Batch 1943/2891 | Timestep 22180 | LR 0.0001000000 | Loss 37.632143 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:53:47 Epoch 7 | Batch 1953/2891 | Timestep 22190 | LR 0.0001000000 | Loss 34.892677 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:53:49 Epoch 7 | Batch 1963/2891 | Timestep 22200 | LR 0.0001000000 | Loss 38.222248 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:53:52 Epoch 7 | Batch 1973/2891 | Timestep 22210 | LR 0.0001000000 | Loss 39.005749 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:53:54 Epoch 7 | Batch 1983/2891 | Timestep 22220 | LR 0.0001000000 | Loss 37.348796 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:53:56 Epoch 7 | Batch 1993/2891 | Timestep 22230 | LR 0.0001000000 | Loss 38.047775 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:53:59 Epoch 7 | Batch 2003/2891 | Timestep 22240 | LR 0.0001000000 | Loss 37.821145 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:54:01 Epoch 7 | Batch 2013/2891 | Timestep 22250 | LR 0.0001000000 | Loss 35.385506 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:54:03 Epoch 7 | Batch 2023/2891 | Timestep 22260 | LR 0.0001000000 | Loss 36.772981 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:54:05 Epoch 7 | Batch 2033/2891 | Timestep 22270 | LR 0.0001000000 | Loss 37.626211 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:54:07 Epoch 7 | Batch 2043/2891 | Timestep 22280 | LR 0.0001000000 | Loss 37.530543 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:54:09 Epoch 7 | Batch 2053/2891 | Timestep 22290 | LR 0.0001000000 | Loss 37.972059 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:54:12 Epoch 7 | Batch 2063/2891 | Timestep 22300 | LR 0.0001000000 | Loss 37.827174 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:54:14 Epoch 7 | Batch 2073/2891 | Timestep 22310 | LR 0.0001000000 | Loss 36.415313 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:54:16 Epoch 7 | Batch 2083/2891 | Timestep 22320 | LR 0.0001000000 | Loss 39.132708 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:54:18 Epoch 7 | Batch 2093/2891 | Timestep 22330 | LR 0.0001000000 | Loss 38.032191 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:54:20 Epoch 7 | Batch 2103/2891 | Timestep 22340 | LR 0.0001000000 | Loss 38.067970 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:54:22 Epoch 7 | Batch 2113/2891 | Timestep 22350 | LR 0.0001000000 | Loss 38.434847 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:54:25 Epoch 7 | Batch 2123/2891 | Timestep 22360 | LR 0.0001000000 | Loss 36.579247 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:54:27 Epoch 7 | Batch 2133/2891 | Timestep 22370 | LR 0.0001000000 | Loss 39.007692 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:54:29 Epoch 7 | Batch 2143/2891 | Timestep 22380 | LR 0.0001000000 | Loss 37.287241 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:54:31 Epoch 7 | Batch 2153/2891 | Timestep 22390 | LR 0.0001000000 | Loss 37.193854 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:54:33 Epoch 7 | Batch 2163/2891 | Timestep 22400 | LR 0.0001000000 | Loss 37.311683 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:54:36 Epoch 7 | Batch 2173/2891 | Timestep 22410 | LR 0.0001000000 | Loss 37.003803 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:54:38 Epoch 7 | Batch 2183/2891 | Timestep 22420 | LR 0.0001000000 | Loss 37.371023 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:54:40 Epoch 7 | Batch 2193/2891 | Timestep 22430 | LR 0.0001000000 | Loss 38.986165 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:54:42 Epoch 7 | Batch 2203/2891 | Timestep 22440 | LR 0.0001000000 | Loss 38.817476 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:54:44 Epoch 7 | Batch 2213/2891 | Timestep 22450 | LR 0.0001000000 | Loss 38.176746 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:54:46 Epoch 7 | Batch 2223/2891 | Timestep 22460 | LR 0.0001000000 | Loss 41.884863 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:54:48 Epoch 7 | Batch 2233/2891 | Timestep 22470 | LR 0.0001000000 | Loss 36.337250 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:54:50 Epoch 7 | Batch 2243/2891 | Timestep 22480 | LR 0.0001000000 | Loss 37.461101 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:54:52 Epoch 7 | Batch 2253/2891 | Timestep 22490 | LR 0.0001000000 | Loss 39.352848 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:54:54 Epoch 7 | Batch 2263/2891 | Timestep 22500 | LR 0.0001000000 | Loss 38.568010 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:54:56 Epoch 7 | Batch 2273/2891 | Timestep 22510 | LR 0.0001000000 | Loss 36.255943 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:54:59 Epoch 7 | Batch 2283/2891 | Timestep 22520 | LR 0.0001000000 | Loss 37.463308 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:55:01 Epoch 7 | Batch 2293/2891 | Timestep 22530 | LR 0.0001000000 | Loss 38.961437 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:55:03 Epoch 7 | Batch 2303/2891 | Timestep 22540 | LR 0.0001000000 | Loss 37.562969 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:55:06 Epoch 7 | Batch 2313/2891 | Timestep 22550 | LR 0.0001000000 | Loss 38.805030 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:55:08 Epoch 7 | Batch 2323/2891 | Timestep 22560 | LR 0.0001000000 | Loss 36.032179 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:55:10 Epoch 7 | Batch 2333/2891 | Timestep 22570 | LR 0.0001000000 | Loss 35.843794 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:55:12 Epoch 7 | Batch 2343/2891 | Timestep 22580 | LR 0.0001000000 | Loss 37.639544 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:55:14 Epoch 7 | Batch 2353/2891 | Timestep 22590 | LR 0.0001000000 | Loss 39.061243 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:55:16 Epoch 7 | Batch 2363/2891 | Timestep 22600 | LR 0.0001000000 | Loss 36.875659 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:55:18 Epoch 7 | Batch 2373/2891 | Timestep 22610 | LR 0.0001000000 | Loss 35.715613 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:55:21 Epoch 7 | Batch 2383/2891 | Timestep 22620 | LR 0.0001000000 | Loss 36.289501 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:55:23 Epoch 7 | Batch 2393/2891 | Timestep 22630 | LR 0.0001000000 | Loss 39.027460 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:55:25 Epoch 7 | Batch 2403/2891 | Timestep 22640 | LR 0.0001000000 | Loss 38.305608 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:55:27 Epoch 7 | Batch 2413/2891 | Timestep 22650 | LR 0.0001000000 | Loss 35.054414 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:55:29 Epoch 7 | Batch 2423/2891 | Timestep 22660 | LR 0.0001000000 | Loss 36.347932 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:55:32 Epoch 7 | Batch 2433/2891 | Timestep 22670 | LR 0.0001000000 | Loss 40.664170 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:55:34 Epoch 7 | Batch 2443/2891 | Timestep 22680 | LR 0.0001000000 | Loss 42.163249 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:55:37 Epoch 7 | Batch 2453/2891 | Timestep 22690 | LR 0.0001000000 | Loss 38.829123 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:55:39 Epoch 7 | Batch 2463/2891 | Timestep 22700 | LR 0.0001000000 | Loss 40.182518 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:55:41 Epoch 7 | Batch 2473/2891 | Timestep 22710 | LR 0.0001000000 | Loss 36.429507 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:55:43 Epoch 7 | Batch 2483/2891 | Timestep 22720 | LR 0.0001000000 | Loss 36.975046 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:55:45 Epoch 7 | Batch 2493/2891 | Timestep 22730 | LR 0.0001000000 | Loss 37.633039 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:55:47 Epoch 7 | Batch 2503/2891 | Timestep 22740 | LR 0.0001000000 | Loss 37.905724 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:55:49 Epoch 7 | Batch 2513/2891 | Timestep 22750 | LR 0.0001000000 | Loss 38.304993 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:55:51 Epoch 7 | Batch 2523/2891 | Timestep 22760 | LR 0.0001000000 | Loss 37.213667 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:55:53 Epoch 7 | Batch 2533/2891 | Timestep 22770 | LR 0.0001000000 | Loss 36.354064 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:55:56 Epoch 7 | Batch 2543/2891 | Timestep 22780 | LR 0.0001000000 | Loss 37.300762 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:55:58 Epoch 7 | Batch 2553/2891 | Timestep 22790 | LR 0.0001000000 | Loss 35.841931 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:56:00 Epoch 7 | Batch 2563/2891 | Timestep 22800 | LR 0.0001000000 | Loss 37.148794 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:56:02 Epoch 7 | Batch 2573/2891 | Timestep 22810 | LR 0.0001000000 | Loss 41.356721 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:56:04 Epoch 7 | Batch 2583/2891 | Timestep 22820 | LR 0.0001000000 | Loss 37.070474 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:56:06 Epoch 7 | Batch 2593/2891 | Timestep 22830 | LR 0.0001000000 | Loss 34.844604 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:56:08 Epoch 7 | Batch 2603/2891 | Timestep 22840 | LR 0.0001000000 | Loss 36.343282 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:56:11 Epoch 7 | Batch 2613/2891 | Timestep 22850 | LR 0.0001000000 | Loss 37.937859 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:56:13 Epoch 7 | Batch 2623/2891 | Timestep 22860 | LR 0.0001000000 | Loss 37.508993 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:56:15 Epoch 7 | Batch 2633/2891 | Timestep 22870 | LR 0.0001000000 | Loss 37.804155 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:56:17 Epoch 7 | Batch 2643/2891 | Timestep 22880 | LR 0.0001000000 | Loss 37.487333 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:56:19 Epoch 7 | Batch 2653/2891 | Timestep 22890 | LR 0.0001000000 | Loss 39.000846 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:56:21 Epoch 7 | Batch 2663/2891 | Timestep 22900 | LR 0.0001000000 | Loss 37.785947 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:56:23 Epoch 7 | Batch 2673/2891 | Timestep 22910 | LR 0.0001000000 | Loss 36.588009 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:56:26 Epoch 7 | Batch 2683/2891 | Timestep 22920 | LR 0.0001000000 | Loss 34.484758 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:56:28 Epoch 7 | Batch 2693/2891 | Timestep 22930 | LR 0.0001000000 | Loss 38.721195 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:56:30 Epoch 7 | Batch 2703/2891 | Timestep 22940 | LR 0.0001000000 | Loss 36.304486 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:56:32 Epoch 7 | Batch 2713/2891 | Timestep 22950 | LR 0.0001000000 | Loss 39.535730 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:56:34 Epoch 7 | Batch 2723/2891 | Timestep 22960 | LR 0.0001000000 | Loss 38.057440 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:56:36 Epoch 7 | Batch 2733/2891 | Timestep 22970 | LR 0.0001000000 | Loss 37.442146 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:56:38 Epoch 7 | Batch 2743/2891 | Timestep 22980 | LR 0.0001000000 | Loss 38.067719 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:56:41 Epoch 7 | Batch 2753/2891 | Timestep 22990 | LR 0.0001000000 | Loss 37.018146 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:56:43 Epoch 7 | Batch 2763/2891 | Timestep 23000 | LR 0.0001000000 | Loss 35.429619 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:56:45 Epoch 7 | Batch 2773/2891 | Timestep 23010 | LR 0.0001000000 | Loss 36.805193 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:56:47 Epoch 7 | Batch 2783/2891 | Timestep 23020 | LR 0.0001000000 | Loss 38.698632 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:56:50 Epoch 7 | Batch 2793/2891 | Timestep 23030 | LR 0.0001000000 | Loss 38.443078 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:56:52 Epoch 7 | Batch 2803/2891 | Timestep 23040 | LR 0.0001000000 | Loss 35.526467 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:56:54 Epoch 7 | Batch 2813/2891 | Timestep 23050 | LR 0.0001000000 | Loss 37.264568 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:56:56 Epoch 7 | Batch 2823/2891 | Timestep 23060 | LR 0.0001000000 | Loss 37.871094 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:56:58 Epoch 7 | Batch 2833/2891 | Timestep 23070 | LR 0.0001000000 | Loss 38.204362 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:57:00 Epoch 7 | Batch 2843/2891 | Timestep 23080 | LR 0.0001000000 | Loss 38.694631 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:57:02 Epoch 7 | Batch 2853/2891 | Timestep 23090 | LR 0.0001000000 | Loss 35.470569 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:57:05 Epoch 7 | Batch 2863/2891 | Timestep 23100 | LR 0.0001000000 | Loss 35.416501 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:57:07 Epoch 7 | Batch 2873/2891 | Timestep 23110 | LR 0.0001000000 | Loss 34.749727 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:57:09 Epoch 7 | Batch 2883/2891 | Timestep 23120 | LR 0.0001000000 | Loss 38.161754 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:57:11 ** Evaluating on validation dataset ** +INFO root Tue, 26 Mar 2024 19:58:52 + precision recall f1-score support + + BOUNDARY 0.0000 0.0000 0.0000 4 + BUILDING-OR-GROUNDS 0.0000 0.0000 0.0000 104 + CAMP 0.0000 0.0000 0.0000 71 + CARDINAL 0.0000 0.0000 0.0000 170 + CLUSTER 0.0000 0.0000 0.0000 26 + COM 0.0000 0.0000 0.0000 39 + CONTINENT 0.0000 0.0000 0.0000 23 + COUNTRY 0.0000 0.0000 0.0000 835 + CURR 0.0000 0.0000 0.0000 24 + DATE 0.0000 0.0000 0.0000 1691 + EDU 0.0000 0.0000 0.0000 109 + ENT 0.0000 0.0000 0.0000 1 + EVENT 0.0000 0.0000 0.0000 292 + FAC 0.0000 0.0000 0.0000 111 + GOV 0.0000 0.0000 0.0000 860 + GPE 0.0000 0.0000 0.0000 2261 + GPE_ORG 0.0000 0.0000 0.0000 167 + LAND-REGION-NATURAL 0.0000 0.0000 0.0000 52 + LANGUAGE 0.0000 0.0000 0.0000 16 + LAW 0.0000 0.0000 0.0000 47 + LOC 0.0000 0.0000 0.0000 127 + MED 0.0000 0.0000 0.0000 419 + MONEY 0.0000 0.0000 0.0000 22 + NEIGHBORHOOD 0.0000 0.0000 0.0000 5 + NONGOV 0.0000 0.0000 0.0000 571 + NORP 0.0000 0.0000 0.0000 551 + OCC 0.0000 0.0000 0.0000 522 + ORDINAL 0.0000 0.0000 0.0000 544 + ORG 0.0000 0.0000 0.0000 1790 + ORG_FAC 0.0000 0.0000 0.0000 7 + PATH 0.0000 0.0000 0.0000 6 + PERCENT 0.0000 0.0000 0.0000 12 + PERS 0.0000 0.0000 0.0000 679 + PRODUCT 0.0000 0.0000 0.0000 8 + QUANTITY 0.0000 0.0000 0.0000 3 + REGION-GENERAL 0.0000 0.0000 0.0000 37 +REGION-INTERNATIONAL 0.0000 0.0000 0.0000 12 + REL 0.0000 0.0000 0.0000 10 + SCI 0.0000 0.0000 0.0000 13 + SPO 0.0000 0.0000 0.0000 2 + SPORT 0.0000 0.0000 0.0000 4 + STATE-OR-PROVINCE 0.0000 0.0000 0.0000 179 + SUBAREA-FACILITY 0.0000 0.0000 0.0000 16 + TIME 0.0000 0.0000 0.0000 33 + TOWN 0.0000 0.0000 0.0000 1217 + UNIT 0.0000 0.0000 0.0000 4 + WATER-BODY 0.0000 0.0000 0.0000 14 + WEBSITE 0.0000 0.0000 0.0000 80 + pad> 0.0000 0.0000 0.0000 0 + + micro avg 0.0000 0.0000 0.0000 13790 + macro avg 0.0000 0.0000 0.0000 13790 + weighted avg 0.0000 0.0000 0.0000 13790 + +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:59:57 Epoch 7 | Timestep 23128 | Train Loss 37.471028 | Val Loss 40.454304 | F1 0.000000 +INFO arabiner.trainers.BertNestedTrainer Tue, 26 Mar 2024 19:59:57 Early termination triggered