| {"current_steps": 500, "total_steps": 18540, "loss": 0.6808, "learning_rate": 4.9910325182530915e-05, "epoch": 0.026967988997060488, "percentage": 2.7, "elapsed_time": "0:09:28", "remaining_time": "5:42:03", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 1000, "total_steps": 18540, "loss": 0.458, "learning_rate": 4.9641944055954695e-05, "epoch": 0.053935977994120976, "percentage": 5.39, "elapsed_time": "0:09:39", "remaining_time": "2:49:17", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 1500, "total_steps": 18540, "loss": 0.4483, "learning_rate": 4.9196781982554374e-05, "epoch": 0.08090396699118146, "percentage": 8.09, "elapsed_time": "0:19:30", "remaining_time": "3:41:32", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 2000, "total_steps": 18540, "loss": 0.45, "learning_rate": 4.857803254854406e-05, "epoch": 0.10787195598824195, "percentage": 10.79, "elapsed_time": "0:09:27", "remaining_time": "1:18:16", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 2500, "total_steps": 18540, "loss": 0.4444, "learning_rate": 4.7790134653328074e-05, "epoch": 0.13483994498530244, "percentage": 13.48, "elapsed_time": "0:19:13", "remaining_time": "2:03:17", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 3000, "total_steps": 18540, "loss": 0.438, "learning_rate": 4.6838740664901435e-05, "epoch": 0.16180793398236293, "percentage": 16.18, "elapsed_time": "0:29:06", "remaining_time": "2:30:46", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 3500, "total_steps": 18540, "loss": 0.4406, "learning_rate": 4.573067586984441e-05, "epoch": 0.18877592297942342, "percentage": 18.88, "elapsed_time": "0:38:59", "remaining_time": "2:47:33", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 4000, "total_steps": 18540, "loss": 0.4293, "learning_rate": 4.447388950881625e-05, "epoch": 0.2157439119764839, "percentage": 21.57, "elapsed_time": "0:48:45", "remaining_time": "2:57:15", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 4500, "total_steps": 18540, "loss": 0.4347, "learning_rate": 4.307739774881878e-05, "epoch": 0.2427119009735444, "percentage": 24.27, "elapsed_time": "0:58:38", "remaining_time": "3:02:58", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 5000, "total_steps": 18540, "loss": 0.4303, "learning_rate": 4.1551219001346e-05, "epoch": 0.2696798899706049, "percentage": 26.97, "elapsed_time": "1:08:38", "remaining_time": "3:05:54", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 5500, "total_steps": 18540, "loss": 0.4335, "learning_rate": 3.990630205044629e-05, "epoch": 0.29664787896766537, "percentage": 29.67, "elapsed_time": "1:18:27", "remaining_time": "3:06:01", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 6000, "total_steps": 18540, "loss": 0.4307, "learning_rate": 3.815804970461473e-05, "epoch": 0.32361586796472586, "percentage": 32.36, "elapsed_time": "1:28:17", "remaining_time": "3:04:32", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 6500, "total_steps": 18540, "loss": 0.433, "learning_rate": 3.6312001077632294e-05, "epoch": 0.35058385696178634, "percentage": 35.06, "elapsed_time": "1:38:02", "remaining_time": "3:01:36", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 7000, "total_steps": 18540, "loss": 0.4305, "learning_rate": 3.438480032010211e-05, "epoch": 0.37755184595884683, "percentage": 37.76, "elapsed_time": "1:47:59", "remaining_time": "2:58:02", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 7500, "total_steps": 18540, "loss": 0.4292, "learning_rate": 3.2390273142116814e-05, "epoch": 0.4045198349559073, "percentage": 40.45, "elapsed_time": "1:57:58", "remaining_time": "2:53:39", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 8000, "total_steps": 18540, "loss": 0.4271, "learning_rate": 3.034272825252622e-05, "epoch": 0.4314878239529678, "percentage": 43.15, "elapsed_time": "2:07:52", "remaining_time": "2:48:28", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 8500, "total_steps": 18540, "loss": 0.4265, "learning_rate": 2.8256854708469055e-05, "epoch": 0.4584558129500283, "percentage": 45.85, "elapsed_time": "2:17:45", "remaining_time": "2:42:42", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 9000, "total_steps": 18540, "loss": 0.425, "learning_rate": 2.6147616536291464e-05, "epoch": 0.4854238019470888, "percentage": 48.54, "elapsed_time": "2:27:29", "remaining_time": "2:36:20", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 9500, "total_steps": 18540, "loss": 0.4263, "learning_rate": 2.4030145379840563e-05, "epoch": 0.5123917909441493, "percentage": 51.24, "elapsed_time": "2:37:21", "remaining_time": "2:29:44", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 10000, "total_steps": 18540, "loss": 0.4225, "learning_rate": 2.1919631946272402e-05, "epoch": 0.5393597799412098, "percentage": 53.94, "elapsed_time": "2:47:09", "remaining_time": "2:22:45", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 10500, "total_steps": 18540, "loss": 0.4264, "learning_rate": 1.9831217028140688e-05, "epoch": 0.5663277689382703, "percentage": 56.63, "elapsed_time": "2:57:05", "remaining_time": "2:15:35", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 11000, "total_steps": 18540, "loss": 0.4242, "learning_rate": 1.777988288357209e-05, "epoch": 0.5932957579353307, "percentage": 59.33, "elapsed_time": "3:06:56", "remaining_time": "2:08:08", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 11500, "total_steps": 18540, "loss": 0.4223, "learning_rate": 1.578034575376518e-05, "epoch": 0.6202637469323913, "percentage": 62.03, "elapsed_time": "3:16:41", "remaining_time": "2:00:24", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 12000, "total_steps": 18540, "loss": 0.4209, "learning_rate": 1.3850741762328944e-05, "epoch": 0.6472317359294517, "percentage": 64.72, "elapsed_time": "3:26:36", "remaining_time": "1:52:35", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 12500, "total_steps": 18540, "loss": 0.4232, "learning_rate": 1.1997184612520374e-05, "epoch": 0.6741997249265123, "percentage": 67.42, "elapsed_time": "3:36:28", "remaining_time": "1:44:35", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 13000, "total_steps": 18540, "loss": 0.4229, "learning_rate": 1.0236909470428333e-05, "epoch": 0.7011677139235727, "percentage": 70.12, "elapsed_time": "3:46:13", "remaining_time": "1:36:24", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 13500, "total_steps": 18540, "loss": 0.4187, "learning_rate": 8.585739531996178e-06, "epoch": 0.7281357029206332, "percentage": 72.82, "elapsed_time": "3:56:01", "remaining_time": "1:28:07", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 14000, "total_steps": 18540, "loss": 0.4244, "learning_rate": 7.048906317823642e-06, "epoch": 0.7551036919176937, "percentage": 75.51, "elapsed_time": "4:05:52", "remaining_time": "1:19:44", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 14500, "total_steps": 18540, "loss": 0.4178, "learning_rate": 5.640853987596667e-06, "epoch": 0.7820716809147542, "percentage": 78.21, "elapsed_time": "4:15:43", "remaining_time": "1:11:15", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 15000, "total_steps": 18540, "loss": 0.4195, "learning_rate": 4.371683888171277e-06, "epoch": 0.8090396699118146, "percentage": 80.91, "elapsed_time": "4:25:27", "remaining_time": "1:02:38", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 15500, "total_steps": 18540, "loss": 0.4203, "learning_rate": 3.250501027307715e-06, "epoch": 0.8360076589088752, "percentage": 83.6, "elapsed_time": "4:35:07", "remaining_time": "0:53:57", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 16000, "total_steps": 18540, "loss": 0.4187, "learning_rate": 2.287118546736572e-06, "epoch": 0.8629756479059356, "percentage": 86.3, "elapsed_time": "4:44:44", "remaining_time": "0:45:12", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 16500, "total_steps": 18540, "loss": 0.4202, "learning_rate": 1.4845888005343062e-06, "epoch": 0.8899436369029962, "percentage": 89.0, "elapsed_time": "4:54:30", "remaining_time": "0:36:24", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 17000, "total_steps": 18540, "loss": 0.4221, "learning_rate": 8.507582708938533e-07, "epoch": 0.9169116259000566, "percentage": 91.69, "elapsed_time": "5:04:13", "remaining_time": "0:27:33", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 17500, "total_steps": 18540, "loss": 0.4217, "learning_rate": 3.901740487793598e-07, "epoch": 0.9438796148971171, "percentage": 94.39, "elapsed_time": "5:14:03", "remaining_time": "0:18:39", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 18000, "total_steps": 18540, "loss": 0.4209, "learning_rate": 1.0614035867460847e-07, "epoch": 0.9708476038941776, "percentage": 97.09, "elapsed_time": "5:23:49", "remaining_time": "0:09:42", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 18500, "total_steps": 18540, "loss": 0.4205, "learning_rate": 6.94854124816402e-10, "epoch": 0.9978155928912381, "percentage": 99.78, "elapsed_time": "5:33:37", "remaining_time": "0:00:43", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 18540, "total_steps": 18540, "epoch": 0.999973032011003, "percentage": 100.0, "elapsed_time": "5:34:31", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0} | |