Upload trainer_log.jsonl
Browse files- trainer_log.jsonl +167 -0
trainer_log.jsonl
ADDED
|
@@ -0,0 +1,167 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{"current_steps": 5, "total_steps": 832, "loss": 1.9665, "lr": 2.9761904761904763e-06, "epoch": 0.01199760047990402, "percentage": 0.6, "elapsed_time": "0:03:51", "remaining_time": "10:39:01"}
|
| 2 |
+
{"current_steps": 10, "total_steps": 832, "loss": 1.6691, "lr": 5.9523809523809525e-06, "epoch": 0.02399520095980804, "percentage": 1.2, "elapsed_time": "0:08:17", "remaining_time": "11:22:01"}
|
| 3 |
+
{"current_steps": 15, "total_steps": 832, "loss": 1.441, "lr": 8.92857142857143e-06, "epoch": 0.035992801439712056, "percentage": 1.8, "elapsed_time": "0:11:58", "remaining_time": "10:52:30"}
|
| 4 |
+
{"current_steps": 20, "total_steps": 832, "loss": 1.3171, "lr": 1.1904761904761905e-05, "epoch": 0.04799040191961608, "percentage": 2.4, "elapsed_time": "0:16:39", "remaining_time": "11:16:08"}
|
| 5 |
+
{"current_steps": 25, "total_steps": 832, "loss": 1.2588, "lr": 1.4880952380952381e-05, "epoch": 0.059988002399520096, "percentage": 3.0, "elapsed_time": "0:21:13", "remaining_time": "11:24:57"}
|
| 6 |
+
{"current_steps": 30, "total_steps": 832, "loss": 1.2021, "lr": 1.785714285714286e-05, "epoch": 0.07198560287942411, "percentage": 3.61, "elapsed_time": "0:25:14", "remaining_time": "11:14:47"}
|
| 7 |
+
{"current_steps": 35, "total_steps": 832, "loss": 1.1645, "lr": 2.0833333333333336e-05, "epoch": 0.08398320335932813, "percentage": 4.21, "elapsed_time": "0:29:40", "remaining_time": "11:15:48"}
|
| 8 |
+
{"current_steps": 40, "total_steps": 832, "loss": 1.1652, "lr": 2.380952380952381e-05, "epoch": 0.09598080383923216, "percentage": 4.81, "elapsed_time": "0:33:53", "remaining_time": "11:11:11"}
|
| 9 |
+
{"current_steps": 45, "total_steps": 832, "loss": 1.1492, "lr": 2.6785714285714288e-05, "epoch": 0.10797840431913618, "percentage": 5.41, "elapsed_time": "0:37:49", "remaining_time": "11:01:39"}
|
| 10 |
+
{"current_steps": 50, "total_steps": 832, "loss": 1.146, "lr": 2.9761904761904762e-05, "epoch": 0.11997600479904019, "percentage": 6.01, "elapsed_time": "0:41:56", "remaining_time": "10:55:54"}
|
| 11 |
+
{"current_steps": 55, "total_steps": 832, "loss": 1.1312, "lr": 3.273809523809524e-05, "epoch": 0.13197360527894422, "percentage": 6.61, "elapsed_time": "0:46:30", "remaining_time": "10:57:07"}
|
| 12 |
+
{"current_steps": 60, "total_steps": 832, "loss": 1.1158, "lr": 3.571428571428572e-05, "epoch": 0.14397120575884823, "percentage": 7.21, "elapsed_time": "0:51:08", "remaining_time": "10:57:57"}
|
| 13 |
+
{"current_steps": 65, "total_steps": 832, "loss": 1.112, "lr": 3.8690476190476195e-05, "epoch": 0.15596880623875226, "percentage": 7.81, "elapsed_time": "0:55:21", "remaining_time": "10:53:11"}
|
| 14 |
+
{"current_steps": 70, "total_steps": 832, "loss": 1.1216, "lr": 4.166666666666667e-05, "epoch": 0.16796640671865626, "percentage": 8.41, "elapsed_time": "0:59:46", "remaining_time": "10:50:40"}
|
| 15 |
+
{"current_steps": 75, "total_steps": 832, "loss": 1.1154, "lr": 4.464285714285715e-05, "epoch": 0.1799640071985603, "percentage": 9.01, "elapsed_time": "1:03:44", "remaining_time": "10:43:22"}
|
| 16 |
+
{"current_steps": 80, "total_steps": 832, "loss": 1.115, "lr": 4.761904761904762e-05, "epoch": 0.19196160767846432, "percentage": 9.62, "elapsed_time": "1:08:35", "remaining_time": "10:44:47"}
|
| 17 |
+
{"current_steps": 85, "total_steps": 832, "loss": 1.1166, "lr": 4.9999779501355384e-05, "epoch": 0.20395920815836832, "percentage": 10.22, "elapsed_time": "1:12:47", "remaining_time": "10:39:38"}
|
| 18 |
+
{"current_steps": 90, "total_steps": 832, "loss": 1.126, "lr": 4.9992062457191e-05, "epoch": 0.21595680863827235, "percentage": 10.82, "elapsed_time": "1:16:47", "remaining_time": "10:33:10"}
|
| 19 |
+
{"current_steps": 95, "total_steps": 832, "loss": 1.1183, "lr": 4.997332437005931e-05, "epoch": 0.22795440911817635, "percentage": 11.42, "elapsed_time": "1:20:52", "remaining_time": "10:27:24"}
|
| 20 |
+
{"current_steps": 100, "total_steps": 832, "loss": 1.1341, "lr": 4.99435735031144e-05, "epoch": 0.23995200959808038, "percentage": 12.02, "elapsed_time": "1:24:42", "remaining_time": "10:20:06"}
|
| 21 |
+
{"current_steps": 105, "total_steps": 832, "loss": 1.1111, "lr": 4.990282297594509e-05, "epoch": 0.2519496100779844, "percentage": 12.62, "elapsed_time": "1:29:00", "remaining_time": "10:16:14"}
|
| 22 |
+
{"current_steps": 110, "total_steps": 832, "loss": 1.1085, "lr": 4.98510907587894e-05, "epoch": 0.26394721055788845, "percentage": 13.22, "elapsed_time": "1:33:37", "remaining_time": "10:14:31"}
|
| 23 |
+
{"current_steps": 115, "total_steps": 832, "loss": 1.1081, "lr": 4.9788399664609985e-05, "epoch": 0.27594481103779245, "percentage": 13.82, "elapsed_time": "1:37:48", "remaining_time": "10:09:46"}
|
| 24 |
+
{"current_steps": 120, "total_steps": 832, "loss": 1.1187, "lr": 4.97147773390341e-05, "epoch": 0.28794241151769645, "percentage": 14.42, "elapsed_time": "1:42:19", "remaining_time": "10:07:07"}
|
| 25 |
+
{"current_steps": 125, "total_steps": 832, "loss": 1.0934, "lr": 4.963025624816232e-05, "epoch": 0.29994001199760045, "percentage": 15.02, "elapsed_time": "1:46:51", "remaining_time": "10:04:24"}
|
| 26 |
+
{"current_steps": 130, "total_steps": 832, "loss": 1.0939, "lr": 4.953487366425163e-05, "epoch": 0.3119376124775045, "percentage": 15.62, "elapsed_time": "1:51:34", "remaining_time": "10:02:32"}
|
| 27 |
+
{"current_steps": 135, "total_steps": 832, "loss": 1.1016, "lr": 4.942867164927899e-05, "epoch": 0.3239352129574085, "percentage": 16.23, "elapsed_time": "1:56:04", "remaining_time": "9:59:18"}
|
| 28 |
+
{"current_steps": 140, "total_steps": 832, "loss": 1.0755, "lr": 4.931169703639282e-05, "epoch": 0.3359328134373125, "percentage": 16.83, "elapsed_time": "2:00:14", "remaining_time": "9:54:18"}
|
| 29 |
+
{"current_steps": 145, "total_steps": 832, "loss": 1.0772, "lr": 4.918400140926042e-05, "epoch": 0.3479304139172166, "percentage": 17.43, "elapsed_time": "2:04:21", "remaining_time": "9:49:10"}
|
| 30 |
+
{"current_steps": 150, "total_steps": 832, "loss": 1.0975, "lr": 4.9045641079320484e-05, "epoch": 0.3599280143971206, "percentage": 18.03, "elapsed_time": "2:08:27", "remaining_time": "9:44:03"}
|
| 31 |
+
{"current_steps": 155, "total_steps": 832, "loss": 1.0894, "lr": 4.889667706095084e-05, "epoch": 0.3719256148770246, "percentage": 18.63, "elapsed_time": "2:12:42", "remaining_time": "9:39:36"}
|
| 32 |
+
{"current_steps": 160, "total_steps": 832, "loss": 1.0899, "lr": 4.873717504456219e-05, "epoch": 0.38392321535692864, "percentage": 19.23, "elapsed_time": "2:17:07", "remaining_time": "9:35:55"}
|
| 33 |
+
{"current_steps": 165, "total_steps": 832, "loss": 1.0954, "lr": 4.8567205367629835e-05, "epoch": 0.39592081583683264, "percentage": 19.83, "elapsed_time": "2:21:47", "remaining_time": "9:33:09"}
|
| 34 |
+
{"current_steps": 170, "total_steps": 832, "loss": 1.1022, "lr": 4.8386842983676164e-05, "epoch": 0.40791841631673664, "percentage": 20.43, "elapsed_time": "2:25:38", "remaining_time": "9:27:10"}
|
| 35 |
+
{"current_steps": 175, "total_steps": 832, "loss": 1.0858, "lr": 4.8196167429217474e-05, "epoch": 0.41991601679664065, "percentage": 21.03, "elapsed_time": "2:30:28", "remaining_time": "9:24:54"}
|
| 36 |
+
{"current_steps": 180, "total_steps": 832, "loss": 1.0776, "lr": 4.799526278868987e-05, "epoch": 0.4319136172765447, "percentage": 21.63, "elapsed_time": "2:35:08", "remaining_time": "9:21:56"}
|
| 37 |
+
{"current_steps": 185, "total_steps": 832, "loss": 1.0656, "lr": 4.778421765736951e-05, "epoch": 0.4439112177564487, "percentage": 22.24, "elapsed_time": "2:39:42", "remaining_time": "9:18:34"}
|
| 38 |
+
{"current_steps": 190, "total_steps": 832, "loss": 1.0701, "lr": 4.7563125102303766e-05, "epoch": 0.4559088182363527, "percentage": 22.84, "elapsed_time": "2:44:26", "remaining_time": "9:15:38"}
|
| 39 |
+
{"current_steps": 195, "total_steps": 832, "loss": 1.078, "lr": 4.7332082621270326e-05, "epoch": 0.46790641871625677, "percentage": 23.44, "elapsed_time": "2:48:51", "remaining_time": "9:11:36"}
|
| 40 |
+
{"current_steps": 200, "total_steps": 832, "loss": 1.0748, "lr": 4.709119209978242e-05, "epoch": 0.47990401919616077, "percentage": 24.04, "elapsed_time": "2:52:57", "remaining_time": "9:06:33"}
|
| 41 |
+
{"current_steps": 205, "total_steps": 832, "loss": 1.0728, "lr": 4.684055976615924e-05, "epoch": 0.49190161967606477, "percentage": 24.64, "elapsed_time": "2:57:44", "remaining_time": "9:03:37"}
|
| 42 |
+
{"current_steps": 210, "total_steps": 832, "loss": 1.0741, "lr": 4.6580296144681157e-05, "epoch": 0.5038992201559688, "percentage": 25.24, "elapsed_time": "3:02:07", "remaining_time": "8:59:25"}
|
| 43 |
+
{"current_steps": 215, "total_steps": 832, "loss": 1.0545, "lr": 4.631051600685051e-05, "epoch": 0.5158968206358728, "percentage": 25.84, "elapsed_time": "3:06:10", "remaining_time": "8:54:17"}
|
| 44 |
+
{"current_steps": 220, "total_steps": 832, "loss": 1.0466, "lr": 4.6031338320779534e-05, "epoch": 0.5278944211157769, "percentage": 26.44, "elapsed_time": "3:09:51", "remaining_time": "8:48:09"}
|
| 45 |
+
{"current_steps": 225, "total_steps": 832, "loss": 1.0757, "lr": 4.57428861987275e-05, "epoch": 0.5398920215956808, "percentage": 27.04, "elapsed_time": "3:14:26", "remaining_time": "8:44:34"}
|
| 46 |
+
{"current_steps": 230, "total_steps": 832, "loss": 1.0659, "lr": 4.544528684281056e-05, "epoch": 0.5518896220755849, "percentage": 27.64, "elapsed_time": "3:19:21", "remaining_time": "8:41:47"}
|
| 47 |
+
{"current_steps": 235, "total_steps": 832, "loss": 1.0731, "lr": 4.513867148890788e-05, "epoch": 0.563887222555489, "percentage": 28.25, "elapsed_time": "3:24:02", "remaining_time": "8:38:20"}
|
| 48 |
+
{"current_steps": 240, "total_steps": 832, "loss": 1.0724, "lr": 4.482317534878901e-05, "epoch": 0.5758848230353929, "percentage": 28.85, "elapsed_time": "3:28:36", "remaining_time": "8:34:34"}
|
| 49 |
+
{"current_steps": 245, "total_steps": 832, "loss": 1.0538, "lr": 4.449893755048799e-05, "epoch": 0.587882423515297, "percentage": 29.45, "elapsed_time": "3:32:40", "remaining_time": "8:29:33"}
|
| 50 |
+
{"current_steps": 250, "total_steps": 832, "loss": 1.0653, "lr": 4.416610107695042e-05, "epoch": 0.5998800239952009, "percentage": 30.05, "elapsed_time": "3:37:08", "remaining_time": "8:25:30"}
|
| 51 |
+
{"current_steps": 255, "total_steps": 832, "loss": 1.0593, "lr": 4.3824812702980595e-05, "epoch": 0.611877624475105, "percentage": 30.65, "elapsed_time": "3:40:49", "remaining_time": "8:19:40"}
|
| 52 |
+
{"current_steps": 260, "total_steps": 832, "loss": 1.0728, "lr": 4.347522293051648e-05, "epoch": 0.623875224955009, "percentage": 31.25, "elapsed_time": "3:44:45", "remaining_time": "8:14:28"}
|
| 53 |
+
{"current_steps": 265, "total_steps": 832, "loss": 1.0683, "lr": 4.3117485922261136e-05, "epoch": 0.635872825434913, "percentage": 31.85, "elapsed_time": "3:49:53", "remaining_time": "8:11:52"}
|
| 54 |
+
{"current_steps": 270, "total_steps": 832, "loss": 1.0493, "lr": 4.275175943369975e-05, "epoch": 0.647870425914817, "percentage": 32.45, "elapsed_time": "3:54:38", "remaining_time": "8:08:25"}
|
| 55 |
+
{"current_steps": 275, "total_steps": 832, "loss": 1.0779, "lr": 4.2378204743532377e-05, "epoch": 0.6598680263947211, "percentage": 33.05, "elapsed_time": "3:59:39", "remaining_time": "8:05:25"}
|
| 56 |
+
{"current_steps": 280, "total_steps": 832, "loss": 1.0507, "lr": 4.199698658255298e-05, "epoch": 0.671865626874625, "percentage": 33.65, "elapsed_time": "4:03:57", "remaining_time": "8:00:57"}
|
| 57 |
+
{"current_steps": 285, "total_steps": 832, "loss": 1.0541, "lr": 4.160827306100611e-05, "epoch": 0.6838632273545291, "percentage": 34.25, "elapsed_time": "4:07:30", "remaining_time": "7:55:03"}
|
| 58 |
+
{"current_steps": 290, "total_steps": 832, "loss": 1.0507, "lr": 4.121223559445343e-05, "epoch": 0.6958608278344331, "percentage": 34.86, "elapsed_time": "4:12:01", "remaining_time": "7:51:01"}
|
| 59 |
+
{"current_steps": 295, "total_steps": 832, "loss": 1.0529, "lr": 4.0809048828182534e-05, "epoch": 0.7078584283143371, "percentage": 35.46, "elapsed_time": "4:16:10", "remaining_time": "7:46:20"}
|
| 60 |
+
{"current_steps": 300, "total_steps": 832, "loss": 1.0611, "lr": 4.039889056019159e-05, "epoch": 0.7198560287942412, "percentage": 36.06, "elapsed_time": "4:20:41", "remaining_time": "7:42:17"}
|
| 61 |
+
{"current_steps": 305, "total_steps": 832, "loss": 1.0477, "lr": 3.9981941662783674e-05, "epoch": 0.7318536292741452, "percentage": 36.66, "elapsed_time": "4:25:44", "remaining_time": "7:39:10"}
|
| 62 |
+
{"current_steps": 310, "total_steps": 832, "loss": 1.0425, "lr": 3.955838600280535e-05, "epoch": 0.7438512297540492, "percentage": 37.26, "elapsed_time": "4:30:13", "remaining_time": "7:35:00"}
|
| 63 |
+
{"current_steps": 315, "total_steps": 832, "loss": 1.053, "lr": 3.91284103605648e-05, "epoch": 0.7558488302339532, "percentage": 37.86, "elapsed_time": "4:34:21", "remaining_time": "7:30:17"}
|
| 64 |
+
{"current_steps": 320, "total_steps": 832, "loss": 1.0469, "lr": 3.869220434746509e-05, "epoch": 0.7678464307138573, "percentage": 38.46, "elapsed_time": "4:38:39", "remaining_time": "7:25:51"}
|
| 65 |
+
{"current_steps": 325, "total_steps": 832, "loss": 1.0507, "lr": 3.8249960322389e-05, "epoch": 0.7798440311937612, "percentage": 39.06, "elapsed_time": "4:42:42", "remaining_time": "7:21:00"}
|
| 66 |
+
{"current_steps": 330, "total_steps": 832, "loss": 1.0286, "lr": 3.780187330687231e-05, "epoch": 0.7918416316736653, "percentage": 39.66, "elapsed_time": "4:47:15", "remaining_time": "7:16:58"}
|
| 67 |
+
{"current_steps": 335, "total_steps": 832, "loss": 1.0275, "lr": 3.734814089910283e-05, "epoch": 0.8038392321535693, "percentage": 40.26, "elapsed_time": "4:51:48", "remaining_time": "7:12:55"}
|
| 68 |
+
{"current_steps": 340, "total_steps": 832, "loss": 1.0152, "lr": 3.6888963186783224e-05, "epoch": 0.8158368326334733, "percentage": 40.87, "elapsed_time": "4:55:46", "remaining_time": "7:08:00"}
|
| 69 |
+
{"current_steps": 345, "total_steps": 832, "loss": 1.0329, "lr": 3.6424542658895944e-05, "epoch": 0.8278344331133773, "percentage": 41.47, "elapsed_time": "5:00:56", "remaining_time": "7:04:48"}
|
| 70 |
+
{"current_steps": 350, "total_steps": 832, "loss": 1.0358, "lr": 3.5955084116409385e-05, "epoch": 0.8398320335932813, "percentage": 42.07, "elapsed_time": "5:05:03", "remaining_time": "7:00:06"}
|
| 71 |
+
{"current_steps": 355, "total_steps": 832, "loss": 1.0257, "lr": 3.5480794581964304e-05, "epoch": 0.8518296340731853, "percentage": 42.67, "elapsed_time": "5:08:51", "remaining_time": "6:55:00"}
|
| 72 |
+
{"current_steps": 360, "total_steps": 832, "loss": 1.0462, "lr": 3.5001883208580665e-05, "epoch": 0.8638272345530894, "percentage": 43.27, "elapsed_time": "5:12:44", "remaining_time": "6:50:01"}
|
| 73 |
+
{"current_steps": 365, "total_steps": 832, "loss": 1.0457, "lr": 3.451856118742498e-05, "epoch": 0.8758248350329934, "percentage": 43.87, "elapsed_time": "5:16:59", "remaining_time": "6:45:34"}
|
| 74 |
+
{"current_steps": 370, "total_steps": 832, "loss": 1.0273, "lr": 3.403104165467883e-05, "epoch": 0.8878224355128974, "percentage": 44.47, "elapsed_time": "5:21:29", "remaining_time": "6:41:25"}
|
| 75 |
+
{"current_steps": 375, "total_steps": 832, "loss": 1.0063, "lr": 3.353953959754973e-05, "epoch": 0.8998200359928015, "percentage": 45.07, "elapsed_time": "5:26:11", "remaining_time": "6:37:30"}
|
| 76 |
+
{"current_steps": 380, "total_steps": 832, "loss": 1.0155, "lr": 3.30442717594657e-05, "epoch": 0.9118176364727054, "percentage": 45.67, "elapsed_time": "5:30:28", "remaining_time": "6:33:05"}
|
| 77 |
+
{"current_steps": 385, "total_steps": 832, "loss": 1.025, "lr": 3.2545456544495365e-05, "epoch": 0.9238152369526095, "percentage": 46.27, "elapsed_time": "5:34:38", "remaining_time": "6:28:31"}
|
| 78 |
+
{"current_steps": 390, "total_steps": 832, "loss": 1.0328, "lr": 3.2043313921035743e-05, "epoch": 0.9358128374325135, "percentage": 46.88, "elapsed_time": "5:38:41", "remaining_time": "6:23:51"}
|
| 79 |
+
{"current_steps": 395, "total_steps": 832, "loss": 1.0248, "lr": 3.1538065324810206e-05, "epoch": 0.9478104379124175, "percentage": 47.48, "elapsed_time": "5:43:35", "remaining_time": "6:20:07"}
|
| 80 |
+
{"current_steps": 400, "total_steps": 832, "loss": 1.0027, "lr": 3.1029933561219375e-05, "epoch": 0.9598080383923215, "percentage": 48.08, "elapsed_time": "5:48:31", "remaining_time": "6:16:24"}
|
| 81 |
+
{"current_steps": 405, "total_steps": 832, "loss": 1.0116, "lr": 3.0519142707088026e-05, "epoch": 0.9718056388722256, "percentage": 48.68, "elapsed_time": "5:53:06", "remaining_time": "6:12:17"}
|
| 82 |
+
{"current_steps": 410, "total_steps": 832, "loss": 1.0147, "lr": 3.000591801185124e-05, "epoch": 0.9838032393521295, "percentage": 49.28, "elapsed_time": "5:58:13", "remaining_time": "6:08:42"}
|
| 83 |
+
{"current_steps": 415, "total_steps": 832, "loss": 1.0312, "lr": 2.9490485798223623e-05, "epoch": 0.9958008398320336, "percentage": 49.88, "elapsed_time": "6:03:29", "remaining_time": "6:05:14"}
|
| 84 |
+
{"current_steps": 420, "total_steps": 832, "loss": 1.0189, "lr": 2.8973073362394998e-05, "epoch": 1.0095980803839233, "percentage": 50.48, "elapsed_time": "6:08:01", "remaining_time": "6:01:00"}
|
| 85 |
+
{"current_steps": 425, "total_steps": 832, "loss": 0.8115, "lr": 2.8453908873797058e-05, "epoch": 1.0215956808638271, "percentage": 51.08, "elapsed_time": "6:12:12", "remaining_time": "5:56:26"}
|
| 86 |
+
{"current_steps": 430, "total_steps": 832, "loss": 0.8041, "lr": 2.7933221274484723e-05, "epoch": 1.0335932813437312, "percentage": 51.68, "elapsed_time": "6:16:51", "remaining_time": "5:52:19"}
|
| 87 |
+
{"current_steps": 435, "total_steps": 832, "loss": 0.8078, "lr": 2.7411240178176927e-05, "epoch": 1.0455908818236352, "percentage": 52.28, "elapsed_time": "6:21:31", "remaining_time": "5:48:11"}
|
| 88 |
+
{"current_steps": 440, "total_steps": 832, "loss": 0.8179, "lr": 2.6888195769001146e-05, "epoch": 1.0575884823035393, "percentage": 52.88, "elapsed_time": "6:25:56", "remaining_time": "5:43:50"}
|
| 89 |
+
{"current_steps": 445, "total_steps": 832, "loss": 0.8072, "lr": 2.63643186999864e-05, "epoch": 1.0695860827834434, "percentage": 53.49, "elapsed_time": "6:30:35", "remaining_time": "5:39:40"}
|
| 90 |
+
{"current_steps": 450, "total_steps": 832, "loss": 0.8099, "lr": 2.5839839991349506e-05, "epoch": 1.0815836832633474, "percentage": 54.09, "elapsed_time": "6:34:59", "remaining_time": "5:35:18"}
|
| 91 |
+
{"current_steps": 455, "total_steps": 832, "loss": 0.7985, "lr": 2.5314990928619337e-05, "epoch": 1.0935812837432513, "percentage": 54.69, "elapsed_time": "6:39:39", "remaining_time": "5:31:08"}
|
| 92 |
+
{"current_steps": 460, "total_steps": 832, "loss": 0.8224, "lr": 2.479000296064417e-05, "epoch": 1.1055788842231553, "percentage": 55.29, "elapsed_time": "6:44:28", "remaining_time": "5:27:05"}
|
| 93 |
+
{"current_steps": 465, "total_steps": 832, "loss": 0.8156, "lr": 2.4265107597526946e-05, "epoch": 1.1175764847030594, "percentage": 55.89, "elapsed_time": "6:48:41", "remaining_time": "5:22:33"}
|
| 94 |
+
{"current_steps": 470, "total_steps": 832, "loss": 0.8113, "lr": 2.374053630853358e-05, "epoch": 1.1295740851829634, "percentage": 56.49, "elapsed_time": "6:53:22", "remaining_time": "5:18:23"}
|
| 95 |
+
{"current_steps": 475, "total_steps": 832, "loss": 0.8078, "lr": 2.3216520420019195e-05, "epoch": 1.1415716856628675, "percentage": 57.09, "elapsed_time": "6:57:03", "remaining_time": "5:13:27"}
|
| 96 |
+
{"current_steps": 480, "total_steps": 832, "loss": 0.7979, "lr": 2.2693291013417453e-05, "epoch": 1.1535692861427713, "percentage": 57.69, "elapsed_time": "7:01:37", "remaining_time": "5:09:11"}
|
| 97 |
+
{"current_steps": 485, "total_steps": 832, "loss": 0.8114, "lr": 2.2171078823337863e-05, "epoch": 1.1655668866226754, "percentage": 58.29, "elapsed_time": "7:05:32", "remaining_time": "5:04:27"}
|
| 98 |
+
{"current_steps": 490, "total_steps": 832, "loss": 0.8068, "lr": 2.165011413581605e-05, "epoch": 1.1775644871025794, "percentage": 58.89, "elapsed_time": "7:10:58", "remaining_time": "5:00:47"}
|
| 99 |
+
{"current_steps": 495, "total_steps": 832, "loss": 0.7931, "lr": 2.1130626686761762e-05, "epoch": 1.1895620875824835, "percentage": 59.5, "elapsed_time": "7:15:00", "remaining_time": "4:56:09"}
|
| 100 |
+
{"current_steps": 500, "total_steps": 832, "loss": 0.7961, "lr": 2.0612845560649603e-05, "epoch": 1.2015596880623876, "percentage": 60.1, "elapsed_time": "7:18:44", "remaining_time": "4:51:19"}
|
| 101 |
+
{"current_steps": 505, "total_steps": 832, "loss": 0.7949, "lr": 2.0096999089496913e-05, "epoch": 1.2135572885422916, "percentage": 60.7, "elapsed_time": "7:23:08", "remaining_time": "4:46:56"}
|
| 102 |
+
{"current_steps": 510, "total_steps": 832, "loss": 0.8081, "lr": 1.958331475217357e-05, "epoch": 1.2255548890221957, "percentage": 61.3, "elapsed_time": "7:27:25", "remaining_time": "4:42:29"}
|
| 103 |
+
{"current_steps": 515, "total_steps": 832, "loss": 0.7944, "lr": 1.9072019074087876e-05, "epoch": 1.2375524895020995, "percentage": 61.9, "elapsed_time": "7:31:45", "remaining_time": "4:38:04"}
|
| 104 |
+
{"current_steps": 520, "total_steps": 832, "loss": 0.7982, "lr": 1.856333752729311e-05, "epoch": 1.2495500899820036, "percentage": 62.5, "elapsed_time": "7:36:19", "remaining_time": "4:33:47"}
|
| 105 |
+
{"current_steps": 525, "total_steps": 832, "loss": 0.8013, "lr": 1.8057494431058365e-05, "epoch": 1.2615476904619076, "percentage": 63.1, "elapsed_time": "7:40:34", "remaining_time": "4:29:19"}
|
| 106 |
+
{"current_steps": 530, "total_steps": 832, "loss": 0.8031, "lr": 1.7554712852947913e-05, "epoch": 1.2735452909418117, "percentage": 63.7, "elapsed_time": "7:45:07", "remaining_time": "4:25:01"}
|
| 107 |
+
{"current_steps": 535, "total_steps": 832, "loss": 0.7924, "lr": 1.705521451045246e-05, "epoch": 1.2855428914217157, "percentage": 64.3, "elapsed_time": "7:49:25", "remaining_time": "4:20:35"}
|
| 108 |
+
{"current_steps": 540, "total_steps": 832, "loss": 0.784, "lr": 1.6559219673215784e-05, "epoch": 1.2975404919016196, "percentage": 64.9, "elapsed_time": "7:54:13", "remaining_time": "4:16:26"}
|
| 109 |
+
{"current_steps": 545, "total_steps": 832, "loss": 0.795, "lr": 1.6066947065899847e-05, "epoch": 1.3095380923815236, "percentage": 65.5, "elapsed_time": "7:58:57", "remaining_time": "4:12:13"}
|
| 110 |
+
{"current_steps": 550, "total_steps": 832, "loss": 0.7903, "lr": 1.5578613771731213e-05, "epoch": 1.3215356928614277, "percentage": 66.11, "elapsed_time": "8:02:38", "remaining_time": "4:07:27"}
|
| 111 |
+
{"current_steps": 555, "total_steps": 832, "loss": 0.7841, "lr": 1.509443513677134e-05, "epoch": 1.3335332933413317, "percentage": 66.71, "elapsed_time": "8:06:36", "remaining_time": "4:02:51"}
|
| 112 |
+
{"current_steps": 560, "total_steps": 832, "loss": 0.7932, "lr": 1.4614624674952842e-05, "epoch": 1.3455308938212358, "percentage": 67.31, "elapsed_time": "8:10:59", "remaining_time": "3:58:28"}
|
| 113 |
+
{"current_steps": 565, "total_steps": 832, "loss": 0.7815, "lr": 1.4139393973923798e-05, "epoch": 1.3575284943011399, "percentage": 67.91, "elapsed_time": "8:15:17", "remaining_time": "3:54:03"}
|
| 114 |
+
{"current_steps": 570, "total_steps": 832, "loss": 0.7899, "lr": 1.3668952601741441e-05, "epoch": 1.369526094781044, "percentage": 68.51, "elapsed_time": "8:20:04", "remaining_time": "3:49:51"}
|
| 115 |
+
{"current_steps": 575, "total_steps": 832, "loss": 0.7745, "lr": 1.320350801445649e-05, "epoch": 1.3815236952609478, "percentage": 69.11, "elapsed_time": "8:24:33", "remaining_time": "3:45:30"}
|
| 116 |
+
{"current_steps": 580, "total_steps": 832, "loss": 0.7761, "lr": 1.2743265464628786e-05, "epoch": 1.3935212957408518, "percentage": 69.71, "elapsed_time": "8:29:00", "remaining_time": "3:41:09"}
|
| 117 |
+
{"current_steps": 585, "total_steps": 832, "loss": 0.7549, "lr": 1.2288427910814699e-05, "epoch": 1.4055188962207559, "percentage": 70.31, "elapsed_time": "8:33:35", "remaining_time": "3:36:51"}
|
| 118 |
+
{"current_steps": 590, "total_steps": 832, "loss": 0.7887, "lr": 1.1839195928066102e-05, "epoch": 1.41751649670066, "percentage": 70.91, "elapsed_time": "8:37:48", "remaining_time": "3:32:23"}
|
| 119 |
+
{"current_steps": 595, "total_steps": 832, "loss": 0.7891, "lr": 1.1395767619480451e-05, "epoch": 1.4295140971805638, "percentage": 71.51, "elapsed_time": "8:42:14", "remaining_time": "3:28:01"}
|
| 120 |
+
{"current_steps": 600, "total_steps": 832, "loss": 0.7828, "lr": 1.0958338528840893e-05, "epoch": 1.4415116976604678, "percentage": 72.12, "elapsed_time": "8:46:47", "remaining_time": "3:23:41"}
|
| 121 |
+
{"current_steps": 605, "total_steps": 832, "loss": 0.7985, "lr": 1.052710155438506e-05, "epoch": 1.4535092981403719, "percentage": 72.72, "elapsed_time": "8:51:44", "remaining_time": "3:19:30"}
|
| 122 |
+
{"current_steps": 610, "total_steps": 832, "loss": 0.7712, "lr": 1.0102246863740496e-05, "epoch": 1.465506898620276, "percentage": 73.32, "elapsed_time": "8:56:08", "remaining_time": "3:15:07"}
|
| 123 |
+
{"current_steps": 615, "total_steps": 832, "loss": 0.7813, "lr": 9.683961810064176e-06, "epoch": 1.47750449910018, "percentage": 73.92, "elapsed_time": "9:00:41", "remaining_time": "3:10:46"}
|
| 124 |
+
{"current_steps": 620, "total_steps": 832, "loss": 0.774, "lr": 9.272430849423174e-06, "epoch": 1.489502099580084, "percentage": 74.52, "elapsed_time": "9:05:04", "remaining_time": "3:06:22"}
|
| 125 |
+
{"current_steps": 625, "total_steps": 832, "loss": 0.7756, "lr": 8.867835459452925e-06, "epoch": 1.5014997000599881, "percentage": 75.12, "elapsed_time": "9:09:38", "remaining_time": "3:02:02"}
|
| 126 |
+
{"current_steps": 630, "total_steps": 832, "loss": 0.7683, "lr": 8.470354059328919e-06, "epoch": 1.5134973005398922, "percentage": 75.72, "elapsed_time": "9:13:40", "remaining_time": "2:57:31"}
|
| 127 |
+
{"current_steps": 635, "total_steps": 832, "loss": 0.7827, "lr": 8.080161931087094e-06, "epoch": 1.525494901019796, "percentage": 76.32, "elapsed_time": "9:18:27", "remaining_time": "2:53:15"}
|
| 128 |
+
{"current_steps": 640, "total_steps": 832, "loss": 0.7787, "lr": 7.697431142327632e-06, "epoch": 1.5374925014997, "percentage": 76.92, "elapsed_time": "9:22:54", "remaining_time": "2:48:52"}
|
| 129 |
+
{"current_steps": 645, "total_steps": 832, "loss": 0.7858, "lr": 7.3223304703363135e-06, "epoch": 1.5494901019796041, "percentage": 77.52, "elapsed_time": "9:27:05", "remaining_time": "2:44:24"}
|
| 130 |
+
{"current_steps": 650, "total_steps": 832, "loss": 0.766, "lr": 6.955025327656839e-06, "epoch": 1.561487702459508, "percentage": 78.12, "elapsed_time": "9:31:49", "remaining_time": "2:40:06"}
|
| 131 |
+
{"current_steps": 655, "total_steps": 832, "loss": 0.7694, "lr": 6.5956776891468925e-06, "epoch": 1.573485302939412, "percentage": 78.73, "elapsed_time": "9:36:00", "remaining_time": "2:35:39"}
|
| 132 |
+
{"current_steps": 660, "total_steps": 832, "loss": 0.7627, "lr": 6.244446020550182e-06, "epoch": 1.585482903419316, "percentage": 79.33, "elapsed_time": "9:40:49", "remaining_time": "2:31:21"}
|
| 133 |
+
{"current_steps": 665, "total_steps": 832, "loss": 0.7672, "lr": 5.901485208615948e-06, "epoch": 1.5974805038992201, "percentage": 79.93, "elapsed_time": "9:44:55", "remaining_time": "2:26:53"}
|
| 134 |
+
{"current_steps": 670, "total_steps": 832, "loss": 0.7783, "lr": 5.5669464927967655e-06, "epoch": 1.6094781043791242, "percentage": 80.53, "elapsed_time": "9:49:06", "remaining_time": "2:22:26"}
|
| 135 |
+
{"current_steps": 675, "total_steps": 832, "loss": 0.7578, "lr": 5.240977398554673e-06, "epoch": 1.6214757048590283, "percentage": 81.13, "elapsed_time": "9:53:29", "remaining_time": "2:18:02"}
|
| 136 |
+
{"current_steps": 680, "total_steps": 832, "loss": 0.7681, "lr": 4.9237216723051485e-06, "epoch": 1.6334733053389323, "percentage": 81.73, "elapsed_time": "9:58:06", "remaining_time": "2:13:41"}
|
| 137 |
+
{"current_steps": 685, "total_steps": 832, "loss": 0.773, "lr": 4.615319218027561e-06, "epoch": 1.6454709058188364, "percentage": 82.33, "elapsed_time": "10:02:32", "remaining_time": "2:09:18"}
|
| 138 |
+
{"current_steps": 690, "total_steps": 832, "loss": 0.7541, "lr": 4.315906035570094e-06, "epoch": 1.6574685062987402, "percentage": 82.93, "elapsed_time": "10:06:23", "remaining_time": "2:04:47"}
|
| 139 |
+
{"current_steps": 695, "total_steps": 832, "loss": 0.7744, "lr": 4.0256141606762836e-06, "epoch": 1.6694661067786443, "percentage": 83.53, "elapsed_time": "10:11:07", "remaining_time": "2:00:27"}
|
| 140 |
+
{"current_steps": 700, "total_steps": 832, "loss": 0.7472, "lr": 3.7445716067596503e-06, "epoch": 1.6814637072585483, "percentage": 84.13, "elapsed_time": "10:15:36", "remaining_time": "1:56:05"}
|
| 141 |
+
{"current_steps": 705, "total_steps": 832, "loss": 0.7499, "lr": 3.4729023084521417e-06, "epoch": 1.6934613077384522, "percentage": 84.74, "elapsed_time": "10:19:57", "remaining_time": "1:51:40"}
|
| 142 |
+
{"current_steps": 710, "total_steps": 832, "loss": 0.7539, "lr": 3.2107260669512336e-06, "epoch": 1.7054589082183562, "percentage": 85.34, "elapsed_time": "10:24:05", "remaining_time": "1:47:14"}
|
| 143 |
+
{"current_steps": 715, "total_steps": 832, "loss": 0.7731, "lr": 2.9581584971897697e-06, "epoch": 1.7174565086982603, "percentage": 85.94, "elapsed_time": "10:28:36", "remaining_time": "1:42:51"}
|
| 144 |
+
{"current_steps": 720, "total_steps": 832, "loss": 0.7495, "lr": 2.7153109768518925e-06, "epoch": 1.7294541091781643, "percentage": 86.54, "elapsed_time": "10:33:37", "remaining_time": "1:38:33"}
|
| 145 |
+
{"current_steps": 725, "total_steps": 832, "loss": 0.7649, "lr": 2.4822905972575167e-06, "epoch": 1.7414517096580684, "percentage": 87.14, "elapsed_time": "10:37:40", "remaining_time": "1:34:06"}
|
| 146 |
+
{"current_steps": 730, "total_steps": 832, "loss": 0.7662, "lr": 2.2592001161370392e-06, "epoch": 1.7534493101379725, "percentage": 87.74, "elapsed_time": "10:41:31", "remaining_time": "1:29:38"}
|
| 147 |
+
{"current_steps": 735, "total_steps": 832, "loss": 0.7681, "lr": 2.0461379123170284e-06, "epoch": 1.7654469106178765, "percentage": 88.34, "elapsed_time": "10:46:17", "remaining_time": "1:25:17"}
|
| 148 |
+
{"current_steps": 740, "total_steps": 832, "loss": 0.7606, "lr": 1.8431979423369604e-06, "epoch": 1.7774445110977806, "percentage": 88.94, "elapsed_time": "10:50:49", "remaining_time": "1:20:54"}
|
| 149 |
+
{"current_steps": 745, "total_steps": 832, "loss": 0.7704, "lr": 1.650469699016116e-06, "epoch": 1.7894421115776846, "percentage": 89.54, "elapsed_time": "10:55:16", "remaining_time": "1:16:31"}
|
| 150 |
+
{"current_steps": 750, "total_steps": 832, "loss": 0.7502, "lr": 1.4680381719888807e-06, "epoch": 1.8014397120575885, "percentage": 90.14, "elapsed_time": "10:59:22", "remaining_time": "1:12:05"}
|
| 151 |
+
{"current_steps": 755, "total_steps": 832, "loss": 0.7713, "lr": 1.2959838102258536e-06, "epoch": 1.8134373125374925, "percentage": 90.75, "elapsed_time": "11:04:32", "remaining_time": "1:07:46"}
|
| 152 |
+
{"current_steps": 760, "total_steps": 832, "loss": 0.758, "lr": 1.134382486557342e-06, "epoch": 1.8254349130173964, "percentage": 91.35, "elapsed_time": "11:08:32", "remaining_time": "1:03:20"}
|
| 153 |
+
{"current_steps": 765, "total_steps": 832, "loss": 0.7521, "lr": 9.833054642148066e-07, "epoch": 1.8374325134973004, "percentage": 91.95, "elapsed_time": "11:12:44", "remaining_time": "0:58:55"}
|
| 154 |
+
{"current_steps": 770, "total_steps": 832, "loss": 0.7509, "lr": 8.428193654051036e-07, "epoch": 1.8494301139772045, "percentage": 92.55, "elapsed_time": "11:17:28", "remaining_time": "0:54:32"}
|
| 155 |
+
{"current_steps": 775, "total_steps": 832, "loss": 0.7655, "lr": 7.129861419312822e-07, "epoch": 1.8614277144571085, "percentage": 93.15, "elapsed_time": "11:21:20", "remaining_time": "0:50:06"}
|
| 156 |
+
{"current_steps": 780, "total_steps": 832, "loss": 0.7498, "lr": 5.938630478729917e-07, "epoch": 1.8734253149370126, "percentage": 93.75, "elapsed_time": "11:26:03", "remaining_time": "0:45:44"}
|
| 157 |
+
{"current_steps": 785, "total_steps": 832, "loss": 0.7536, "lr": 4.855026143384733e-07, "epoch": 1.8854229154169166, "percentage": 94.35, "elapsed_time": "11:30:30", "remaining_time": "0:41:20"}
|
| 158 |
+
{"current_steps": 790, "total_steps": 832, "loss": 0.7668, "lr": 3.8795262629928996e-07, "epoch": 1.8974205158968207, "percentage": 94.95, "elapsed_time": "11:35:24", "remaining_time": "0:36:58"}
|
| 159 |
+
{"current_steps": 795, "total_steps": 832, "loss": 0.7638, "lr": 3.0125610151804374e-07, "epoch": 1.9094181163767248, "percentage": 95.55, "elapsed_time": "11:39:06", "remaining_time": "0:32:32"}
|
| 160 |
+
{"current_steps": 800, "total_steps": 832, "loss": 0.755, "lr": 2.2545127157831413e-07, "epoch": 1.9214157168566288, "percentage": 96.15, "elapsed_time": "11:43:42", "remaining_time": "0:28:08"}
|
| 161 |
+
{"current_steps": 805, "total_steps": 832, "loss": 0.7509, "lr": 1.605715650252415e-07, "epoch": 1.9334133173365327, "percentage": 96.75, "elapsed_time": "11:47:47", "remaining_time": "0:23:44"}
|
| 162 |
+
{"current_steps": 810, "total_steps": 832, "loss": 0.7576, "lr": 1.0664559262413831e-07, "epoch": 1.9454109178164367, "percentage": 97.36, "elapsed_time": "11:51:39", "remaining_time": "0:19:19"}
|
| 163 |
+
{"current_steps": 815, "total_steps": 832, "loss": 0.7668, "lr": 6.369713474366212e-08, "epoch": 1.9574085182963408, "percentage": 97.96, "elapsed_time": "11:56:43", "remaining_time": "0:14:57"}
|
| 164 |
+
{"current_steps": 820, "total_steps": 832, "loss": 0.7593, "lr": 3.1745130869123566e-08, "epoch": 1.9694061187762446, "percentage": 98.56, "elapsed_time": "12:01:01", "remaining_time": "0:10:33"}
|
| 165 |
+
{"current_steps": 825, "total_steps": 832, "loss": 0.7563, "lr": 1.08036712505033e-08, "epoch": 1.9814037192561487, "percentage": 99.16, "elapsed_time": "12:05:16", "remaining_time": "0:06:09"}
|
| 166 |
+
{"current_steps": 830, "total_steps": 832, "loss": 0.7589, "lr": 8.819906889168117e-10, "epoch": 1.9934013197360527, "percentage": 99.76, "elapsed_time": "12:09:38", "remaining_time": "0:01:45"}
|
| 167 |
+
{"current_steps": 832, "total_steps": 832, "epoch": 1.9982003599280143, "percentage": 100.0, "elapsed_time": "12:12:24", "remaining_time": "0:00:00"}
|